{ "6": { "dfa": { "log": { "train_loss": [ 2.0821874879455566, 2.0482772801208498, 2.047201838607788, 2.0446329682159425, 2.0396667890930176, 2.036854875450134, 2.035803484649658, 2.0357003843688966, 2.030295910644531, 2.027509428253174, 2.027801731262207, 2.026494747467041, 2.023713701324463, 2.0224919934082033, 2.0218288256835937, 2.0183722845840455, 2.0188908798217775, 2.0174379263305666, 2.0145048645782473, 2.0172035501098633, 2.01550293838501, 2.013378846511841, 2.015203825531006, 2.016428701705933, 2.011487791137695, 2.010817546157837, 2.01103433883667, 2.011530419845581, 2.0120579361724853, 2.0116470166778564, 2.008692329330444, 2.009709241294861, 2.008519637374878, 2.0078509032440186, 2.0077528884124756, 2.006431950531006, 2.0055743618011475, 2.005430025024414, 2.0056805452728272, 2.007569041595459, 2.004868392677307, 2.0057909046936033, 2.0064586280822754, 2.005987978057861, 2.00688329624176, 2.00672064743042, 2.0048528481292727, 2.005383738861084, 2.0018666375732423, 2.0059955949401855, 2.003435557899475, 2.001197138328552, 2.0012222803497313, 2.003032783164978, 2.003918945236206, 2.0043967723083496, 2.0035451693725586, 2.003359081878662, 2.001155726585388, 2.001671184616089, 2.0038728633880614, 2.00498755947113, 2.002938235092163, 2.000668586883545, 2.0018935997772216, 2.0039958557128905, 2.001610350112915, 2.000534170913696, 2.001975674972534, 2.002237940979004, 2.0009369605255127, 2.003139477081299, 2.00191648399353, 2.003141210899353, 1.9998547933578492, 2.000947899513245, 2.0015833082580565, 2.0008020196151732, 2.0014297840118407, 2.00010564907074, 2.0010018926239015, 2.0015807587051393, 2.0006349613952636, 2.0010920279693605, 2.000114615020752, 2.001875145263672, 2.001294381980896, 2.001243436965942, 1.9999162873077392, 1.998048712120056, 2.000587540740967, 2.0002040885162353, 2.00153217338562, 2.0005496265411375, 2.000687266998291, 2.000036004295349, 1.9989564297866822, 1.9997446877288818, 1.9997422592163085, 2.000641355895996 ], "train_acc": [ 0.23088, 0.24298, 0.242, 0.24386, 0.24422, 0.24566, 0.24754, 0.24998, 0.25214, 0.25368, 0.25348, 0.2556, 0.2568, 0.25746, 0.2569, 0.25902, 0.26116, 0.2581, 0.26084, 0.26254, 0.26022, 0.26164, 0.26092, 0.26324, 0.26598, 0.26604, 0.26308, 0.26346, 0.26408, 0.26498, 0.2656, 0.26436, 0.26714, 0.26778, 0.26842, 0.26646, 0.26986, 0.26788, 0.26944, 0.2679, 0.26858, 0.269, 0.26802, 0.26894, 0.26892, 0.26996, 0.26784, 0.27018, 0.26922, 0.2704, 0.26998, 0.27222, 0.2733, 0.27004, 0.2688, 0.26874, 0.26814, 0.27284, 0.26872, 0.272, 0.26908, 0.27148, 0.27176, 0.27322, 0.2711, 0.26946, 0.27102, 0.27338, 0.27226, 0.2703, 0.27122, 0.27198, 0.27138, 0.27356, 0.27036, 0.27104, 0.27176, 0.27334, 0.27254, 0.27312, 0.27288, 0.27076, 0.2713, 0.27096, 0.27414, 0.27154, 0.27082, 0.27156, 0.27418, 0.27186, 0.27248, 0.27316, 0.27146, 0.27196, 0.27248, 0.27434, 0.27286, 0.27322, 0.26998, 0.272 ], "test_acc": [ 0.2459, 0.2608, 0.2635, 0.2517, 0.253, 0.2671, 0.2464, 0.2581, 0.2752, 0.2714, 0.2801, 0.2721, 0.2781, 0.2735, 0.2757, 0.2879, 0.2731, 0.2825, 0.271, 0.2808, 0.2798, 0.2898, 0.2713, 0.2935, 0.2878, 0.2873, 0.268, 0.2934, 0.2831, 0.2992, 0.2915, 0.2887, 0.2797, 0.2998, 0.2957, 0.2824, 0.2818, 0.289, 0.2951, 0.2906, 0.2842, 0.2772, 0.2962, 0.2715, 0.3031, 0.2834, 0.299, 0.2881, 0.2849, 0.2939, 0.2801, 0.279, 0.2819, 0.2841, 0.3013, 0.2908, 0.2906, 0.2845, 0.2931, 0.2816, 0.2975, 0.2963, 0.2953, 0.288, 0.2836, 0.2878, 0.2906, 0.2879, 0.2969, 0.2892, 0.286, 0.282, 0.2914, 0.2885, 0.2892, 0.2904, 0.295, 0.2865, 0.2949, 0.2902, 0.2894, 0.2898, 0.2913, 0.2929, 0.2868, 0.2869, 0.2905, 0.2895, 0.29, 0.2896, 0.2882, 0.2908, 0.2912, 0.2901, 0.2893, 0.2888, 0.2895, 0.2894, 0.2896, 0.2896 ] }, "diagnostics": { "bp_cosine": [ 0.36949819326400757, 0.0005479701794683933, -0.0006032834062352777, 0.00028805271722376347, -0.0005946755409240723, -0.0002685927611310035, -0.00046556672896258533, -0.00010807066428242251, -0.0003351868945173919, 0.00010062567162094638, -0.000464106589788571, -4.078936035512015e-05 ], "perturbation_rho": [ -0.011094596236944199, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -2.4400651454925537e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -9.699724614620209e-07, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.01": [ -3.3657997846603394e-06, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ] }, "hidden_norms_per_layer": [ 55177.16015625, 1459404800.0, 2815841792.0, 3553956096.0, 3947802112.0, 6848872448.0, 7047305728.0, 7256152064.0, 9300344832.0, 10056428544.0, 10370693120.0, 10568456192.0, 11512604672.0 ], "bp_grad_norms_per_layer": [ 2.3892781086942705e-07, 2.0915398579735012e-10, 2.0916321452624231e-10, 2.0916490761635487e-10, 2.0915806586696561e-10, 2.0912831188990566e-10, 2.0913649978471227e-10, 2.0914339704525275e-10, 2.089406564431684e-10, 2.0894751207034545e-10, 2.0897203412140186e-10, 2.0899702801724374e-10, 2.090319445313682e-10 ] }, "drift": { "embed.weight": 337.6841411506247, "embed.bias": 244.65544843260258, "blocks.0.ln.weight": 9.921388539749072, "blocks.0.w1.weight": 303.34325560691656, "blocks.0.w1.bias": 271.5154938432058, "blocks.0.w2.weight": 490.11291855747174, "blocks.1.ln.weight": 8.358331837822632, "blocks.1.w1.weight": 306.46180391751284, "blocks.1.w1.bias": 289.91192320867975, "blocks.1.w2.weight": 307.16882665457837, "blocks.2.ln.weight": 8.171380552921143, "blocks.2.w1.weight": 309.0280257845424, "blocks.2.w1.bias": 278.09046067069085, "blocks.2.w2.weight": 303.83002249941313, "blocks.3.ln.weight": 7.530980420849777, "blocks.3.w1.weight": 291.36754150240233, "blocks.3.w1.bias": 267.02199332509406, "blocks.3.w2.weight": 279.4411092845991, "blocks.4.ln.weight": 10.6408318843949, "blocks.4.w1.weight": 441.74974808763915, "blocks.4.w1.bias": 407.5025978091534, "blocks.4.w2.weight": 396.8841237755263, "blocks.5.ln.weight": 7.3188489223429976, "blocks.5.w1.weight": 282.40725775096377, "blocks.5.w1.bias": 268.64915470838923, "blocks.5.w2.weight": 255.5102203441866, "blocks.6.ln.weight": 7.484712621287041, "blocks.6.w1.weight": 289.3900145716271, "blocks.6.w1.bias": 273.2836157437038, "blocks.6.w2.weight": 269.0639311186208, "blocks.7.ln.weight": 10.645635950857786, "blocks.7.w1.weight": 435.3403361556039, "blocks.7.w1.bias": 407.2628750706809, "blocks.7.w2.weight": 422.88459144783326, "blocks.8.ln.weight": 9.19535275353374, "blocks.8.w1.weight": 359.87499481651184, "blocks.8.w1.bias": 333.4216491141516, "blocks.8.w2.weight": 337.7077986951993, "blocks.9.ln.weight": 7.799912385129816, "blocks.9.w1.weight": 297.0043322415887, "blocks.9.w1.bias": 289.12017704180437, "blocks.9.w2.weight": 272.7064790358395, "blocks.10.ln.weight": 8.43728199015399, "blocks.10.w1.weight": 330.9678935021042, "blocks.10.w1.bias": 306.6806776473047, "blocks.10.w2.weight": 309.957908747728, "blocks.11.ln.weight": 10.237677378176008, "blocks.11.w1.weight": 400.7826698559754, "blocks.11.w1.bias": 368.5214108931406, "blocks.11.w2.weight": 374.837703368063, "out_ln.weight": 0.67814086539114, "out_head.weight": 9.623079895238506, "out_head.bias": 0.4268739303655545 } }, "fa": { "log": { "train_loss": [ 2.05228896446228, 1.9686302278900147, 1.937331941871643, 1.9156952641296388, 1.8984398557281494, 1.8918078393936157, 1.8841382266616822, 1.8769169528198242, 1.8724429541397094, 1.868889035949707, 1.8656937331390382, 1.8661101271820069, 1.8578856301116944, 1.8565830435180664, 1.856787547569275, 1.8557513214492798, 1.8538894052124024, 1.8534770782089234, 1.848385778579712, 1.846604812889099, 1.8453827571868897, 1.8429374709320068, 1.8401580144500733, 1.8401220611190796, 1.8288005982208253, 1.8259171481323242, 1.8221615615463256, 1.8216705709075929, 1.821623645401001, 1.818600112838745, 1.812706976966858, 1.8111941592788696, 1.8062977261734008, 1.805511683959961, 1.8029492014312745, 1.800798831100464, 1.7953546783065797, 1.7982503284454345, 1.7914396514511108, 1.7916672002792358, 1.7845456259155272, 1.78576413356781, 1.783857018814087, 1.7810697037506102, 1.7796821146011352, 1.7769692651367188, 1.778120286178589, 1.7701848324966432, 1.7680266930770874, 1.7723119870376587, 1.7669956749725342, 1.764911948814392, 1.7598207390975953, 1.7630078075408935, 1.7617963638687133, 1.7589407592391968, 1.7578953286361694, 1.755873950805664, 1.7555263995742798, 1.7516939831924438, 1.7528417974090575, 1.7498321814346314, 1.7489991750335694, 1.744125429725647, 1.7467560472869874, 1.7484809857940673, 1.7442166653823852, 1.7426679946136474, 1.7441077096939086, 1.7404415154647828, 1.734541618347168, 1.7417204373931885, 1.7390217791748046, 1.7405015720367432, 1.739689345970154, 1.7386328066253662, 1.7377501021575927, 1.7382229836654663, 1.7361252673721312, 1.7335023355865478, 1.7335243579483033, 1.7341424390029907, 1.7341539621734618, 1.7341088440322876, 1.7317719327545167, 1.7339295767593383, 1.7329442672729491, 1.7313460754776, 1.7338177963256836, 1.7318969781112672, 1.7321792919921875, 1.7318955504989624, 1.7337695608520507, 1.7288571945953368, 1.7327508489990235, 1.7287590840911866, 1.730326948890686, 1.7341352017593383, 1.7290034577178954, 1.72969926902771 ], "train_acc": [ 0.2384, 0.27844, 0.2943, 0.30138, 0.30742, 0.30942, 0.3195, 0.31888, 0.32204, 0.32418, 0.3248, 0.32782, 0.33146, 0.33268, 0.32912, 0.33066, 0.33278, 0.33552, 0.3367, 0.34006, 0.3393, 0.33932, 0.3395, 0.33874, 0.34818, 0.34772, 0.34958, 0.3503, 0.35032, 0.35086, 0.35212, 0.35332, 0.35488, 0.3559, 0.35578, 0.35756, 0.35926, 0.35818, 0.36006, 0.3605, 0.36376, 0.3638, 0.36622, 0.36562, 0.36488, 0.36572, 0.36658, 0.3694, 0.37002, 0.36866, 0.37106, 0.37212, 0.37664, 0.37196, 0.37114, 0.37274, 0.37342, 0.37482, 0.37588, 0.37478, 0.37494, 0.3766, 0.37674, 0.3785, 0.37762, 0.37722, 0.37866, 0.38074, 0.37858, 0.3806, 0.38312, 0.37868, 0.3786, 0.38086, 0.37808, 0.37986, 0.38126, 0.38078, 0.38162, 0.3829, 0.38342, 0.3823, 0.3824, 0.38028, 0.38296, 0.383, 0.38242, 0.38388, 0.3826, 0.38382, 0.38268, 0.38512, 0.38288, 0.38526, 0.38352, 0.38476, 0.3849, 0.38008, 0.3831, 0.3847 ], "test_acc": [ 0.2743, 0.3072, 0.3046, 0.3269, 0.3349, 0.3431, 0.3427, 0.3386, 0.3512, 0.3518, 0.3496, 0.3458, 0.3629, 0.3681, 0.364, 0.3676, 0.3514, 0.3685, 0.353, 0.3779, 0.3693, 0.3647, 0.3759, 0.3607, 0.374, 0.3735, 0.3711, 0.3721, 0.3821, 0.3752, 0.3707, 0.3851, 0.3838, 0.3893, 0.374, 0.392, 0.3839, 0.3977, 0.3956, 0.3924, 0.3957, 0.3936, 0.394, 0.3912, 0.3993, 0.3945, 0.3978, 0.3946, 0.398, 0.3963, 0.3976, 0.3972, 0.3971, 0.3984, 0.3988, 0.3958, 0.4012, 0.4042, 0.4017, 0.3974, 0.3975, 0.4052, 0.4061, 0.4066, 0.4056, 0.4057, 0.406, 0.4017, 0.4026, 0.4095, 0.4043, 0.4072, 0.4077, 0.4031, 0.4083, 0.407, 0.4077, 0.4099, 0.4067, 0.4065, 0.4057, 0.4092, 0.4093, 0.4055, 0.4097, 0.4081, 0.4083, 0.407, 0.407, 0.4086, 0.4084, 0.4074, 0.4073, 0.4072, 0.4063, 0.4075, 0.407, 0.4074, 0.4075, 0.4076 ] }, "diagnostics": { "bp_cosine": [ 0.0210530087351799, 0.03225391358137131, 0.030373934656381607, -0.01976676471531391, -0.039145730435848236, -0.07764401286840439, -0.04457290470600128, -0.0037843044847249985, -0.0476202666759491, -0.000595096789766103, 0.02137608267366886, 0.995658278465271 ], "perturbation_rho": [ -0.0567036010324955, -0.0030030906200408936, -0.022865712642669678, -0.009168766438961029, -0.0182923823595047, 0.03648798167705536, 0.04260994493961334, 0.0037925627548247576, -0.03891247510910034, -0.052096571773290634, -0.05355001986026764, 0.005782400257885456 ], "nudging": { "0.001": [ -7.315538823604584e-07, -1.1478550732135773e-07, -6.658956408500671e-08, 7.450580596923828e-09, 3.702007234096527e-08, 5.634501576423645e-08, 5.51808625459671e-08, 9.080395102500916e-09, 2.7241185307502747e-08, -1.3969838619232178e-09, -3.3527612686157227e-08, -7.827766239643097e-07 ], "0.003": [ -2.304092049598694e-06, -3.343448042869568e-07, -1.4924444258213043e-07, 1.979060471057892e-08, 1.2828968465328217e-07, 2.391170710325241e-07, 1.1990778148174286e-07, -4.959292709827423e-08, 1.4039687812328339e-07, -6.752088665962219e-09, -3.050081431865692e-08, -2.78581865131855e-06 ], "0.01": [ -7.684342563152313e-06, -1.07521191239357e-06, -4.4563785195350647e-07, 1.5692785382270813e-07, 3.7904828786849976e-07, 7.476191967725754e-07, 4.507601261138916e-07, -3.306195139884949e-08, 5.138572305440903e-07, 2.9569491744041443e-08, -2.5634653866291046e-07, -9.92906279861927e-06 ] }, "hidden_norms_per_layer": [ 7711.2001953125, 86607.8359375, 328385.03125, 717089.75, 1100718.375, 1366338.125, 1659771.0, 1846383.5, 2026219.75, 2144626.25, 2170055.0, 2174719.5, 1710646.75 ], "bp_grad_norms_per_layer": [ 2.5522365831420757e-05, 1.6940738305493142e-06, 5.418342539087462e-07, 4.801818249688949e-07, 4.7660145696681866e-07, 4.771524686475459e-07, 4.772307420353172e-07, 4.777210733664106e-07, 4.776471200784727e-07, 4.787051466337289e-07, 4.790993557435286e-07, 4.780670792570163e-07, 4.5420676997309783e-07 ] }, "drift": { "embed.weight": 51.639575695075386, "embed.bias": 13.420626933240067, "blocks.0.ln.weight": 1.165106572944437, "blocks.0.w1.weight": 17.074257617816983, "blocks.0.w1.bias": 12.55405788253026, "blocks.0.w2.weight": 56.84408822778898, "blocks.1.ln.weight": 1.0814484489664455, "blocks.1.w1.weight": 20.255692646568928, "blocks.1.w1.bias": 12.590175436666444, "blocks.1.w2.weight": 48.43073026110698, "blocks.2.ln.weight": 0.9210710896806559, "blocks.2.w1.weight": 20.147092711724806, "blocks.2.w1.bias": 16.898392906551216, "blocks.2.w2.weight": 46.45488641124572, "blocks.3.ln.weight": 0.6699388356494572, "blocks.3.w1.weight": 19.04886241071522, "blocks.3.w1.bias": 18.822886783231823, "blocks.3.w2.weight": 35.62237142992444, "blocks.4.ln.weight": 0.5724221532943284, "blocks.4.w1.weight": 18.93452177775512, "blocks.4.w1.bias": 18.487677483264793, "blocks.4.w2.weight": 30.11841300499853, "blocks.5.ln.weight": 0.5318503739647785, "blocks.5.w1.weight": 19.752732313152933, "blocks.5.w1.bias": 21.012803450001744, "blocks.5.w2.weight": 26.781939546320714, "blocks.6.ln.weight": 0.4938677177304124, "blocks.6.w1.weight": 18.79282421249984, "blocks.6.w1.bias": 20.24614504362752, "blocks.6.w2.weight": 23.954722502437257, "blocks.7.ln.weight": 0.520902940610959, "blocks.7.w1.weight": 19.15384116500715, "blocks.7.w1.bias": 20.22154003333216, "blocks.7.w2.weight": 28.09055042594723, "blocks.8.ln.weight": 0.5342907608290218, "blocks.8.w1.weight": 18.38918909035725, "blocks.8.w1.bias": 18.8314837769314, "blocks.8.w2.weight": 31.203969055913323, "blocks.9.ln.weight": 0.5198835347685796, "blocks.9.w1.weight": 17.551735719168683, "blocks.9.w1.bias": 17.643006584631404, "blocks.9.w2.weight": 50.56607469544128, "blocks.10.ln.weight": 0.4499630077104289, "blocks.10.w1.weight": 15.14684109843433, "blocks.10.w1.bias": 12.774970121083086, "blocks.10.w2.weight": 53.261273057743395, "blocks.11.ln.weight": 0.4529064172202585, "blocks.11.w1.weight": 17.52348612725844, "blocks.11.w1.bias": 15.699238779618904, "blocks.11.w2.weight": 54.34198491601119, "out_ln.weight": 0.38172881823690796, "out_head.weight": 6.667353449848178, "out_head.bias": 0.7683726336162054 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 12, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 6 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L12_seed6", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }