{ "1": { "dfa": { "log": { "train_loss": [ 2.0748964222717285, 2.0451132692718508, 2.032143096008301, 2.029643494186401, 2.030650337371826, 2.0243890724945066, 2.020762248840332, 2.0232248431396482, 2.0159964645004274, 2.0192399645996093, 2.01540469039917, 2.0154635834503174, 2.017197366409302, 2.0137894206237794, 2.0133308319091796, 2.0108140522003173, 2.011235432815552, 2.009914517288208, 2.0094243881988527, 2.0100407147979737, 2.010185157546997, 2.0089511253356935, 2.0095393753051756, 2.0059863204574584, 2.0064435525512696, 2.005170561828613, 2.0074975017547607, 2.004913715057373, 2.0057138012313844, 2.004565502243042, 2.006841945838928, 2.0055636949157716, 2.0060591010284425, 2.006927216835022, 2.0074666262817384, 2.004335132293701, 2.005483384475708, 2.006595082168579, 2.003282996673584, 2.0056812954330443, 2.003032290878296, 2.0057049587249756, 2.004697043457031, 2.006551830406189, 2.0058861305236815, 2.0044844329071045, 2.0043990351867675, 2.0037572646331787, 2.0045921185302733, 2.0048506913757325, 2.003375824584961, 2.004632271575928, 2.0042632717895508, 2.0026413610076905, 2.001700767211914, 2.003248519668579, 2.003593999633789, 2.003497390823364, 2.003082277145386, 2.001226206436157, 2.0015557537841797, 2.0028394889831542, 2.0041756005859375, 2.0014186894226076, 2.0017097331237794, 2.0027389540863036, 2.00000232421875, 2.001385536727905, 2.0014734981536866, 2.000507820701599, 2.0018744316101076, 2.00272723903656, 2.0029756539535524, 2.0013647467422486, 2.0018114362335204, 2.0025039096832273, 2.0007914069366457, 2.0015052102279665, 2.0013790615844727, 2.000559573059082, 2.000183110809326, 2.002135623321533, 1.9992622534561157, 2.0023144091033935, 1.9984413458633423, 2.0006315287780763, 2.0000011035919187, 1.9984883616638183, 1.9980969067382812, 1.999547445678711, 1.999142066078186, 2.0002035105895994, 1.9980618365859986, 1.9986838175201416, 1.9983668603515625, 1.9985755539321899, 2.000544935379028, 1.9968827368545532, 1.9982192471313476, 2.0020621044921874 ], "train_acc": [ 0.23312, 0.24122, 0.2498, 0.25198, 0.25274, 0.25466, 0.25756, 0.25584, 0.26256, 0.25706, 0.26104, 0.26366, 0.26034, 0.2643, 0.2637, 0.26512, 0.26362, 0.26534, 0.2631, 0.26636, 0.26484, 0.26708, 0.2655, 0.26972, 0.26856, 0.27134, 0.2676, 0.26984, 0.26974, 0.27138, 0.2693, 0.27122, 0.27032, 0.27198, 0.27264, 0.27422, 0.26884, 0.27136, 0.27186, 0.27214, 0.27222, 0.27306, 0.27124, 0.26954, 0.27338, 0.27444, 0.27396, 0.27308, 0.27134, 0.27374, 0.27228, 0.27202, 0.2734, 0.27426, 0.27536, 0.2763, 0.27336, 0.2738, 0.2753, 0.27466, 0.2761, 0.27344, 0.27534, 0.2757, 0.27462, 0.27636, 0.27752, 0.27438, 0.27618, 0.27512, 0.27614, 0.27672, 0.2751, 0.2764, 0.27506, 0.27662, 0.2763, 0.27732, 0.27492, 0.27632, 0.27788, 0.27568, 0.27686, 0.27594, 0.27624, 0.27706, 0.27618, 0.27852, 0.27466, 0.27688, 0.27624, 0.2765, 0.27688, 0.27766, 0.27692, 0.27586, 0.27718, 0.27828, 0.27846, 0.27564 ], "test_acc": [ 0.2476, 0.2684, 0.2584, 0.2859, 0.2672, 0.2792, 0.2735, 0.2954, 0.2679, 0.29, 0.2763, 0.2726, 0.2807, 0.2893, 0.296, 0.2701, 0.2694, 0.2782, 0.2885, 0.2811, 0.2919, 0.2734, 0.2917, 0.2961, 0.2922, 0.3011, 0.2957, 0.2783, 0.3042, 0.2892, 0.2859, 0.2808, 0.2889, 0.2977, 0.2867, 0.2998, 0.2953, 0.2908, 0.2808, 0.287, 0.2953, 0.303, 0.287, 0.3021, 0.2834, 0.3003, 0.2861, 0.2915, 0.2953, 0.3065, 0.2839, 0.2883, 0.298, 0.2928, 0.2955, 0.2906, 0.3041, 0.2956, 0.2883, 0.2887, 0.2903, 0.2939, 0.294, 0.2878, 0.2835, 0.2948, 0.2838, 0.2948, 0.296, 0.2941, 0.294, 0.3002, 0.2949, 0.2918, 0.2977, 0.2982, 0.2944, 0.2961, 0.2936, 0.2989, 0.2956, 0.2995, 0.2953, 0.2967, 0.3003, 0.2945, 0.2989, 0.2961, 0.2974, 0.3003, 0.2941, 0.2969, 0.2982, 0.2977, 0.2981, 0.2977, 0.2979, 0.2972, 0.297, 0.2969 ] }, "diagnostics": { "bp_cosine": [ 0.4029613733291626, 7.883789658080786e-05, -0.0002453301858622581, -0.0004192243213765323, 0.000372876413166523, -0.000354595307726413 ], "perturbation_rho": [ 0.011547078378498554, 0.0, 0.0, 0.0, 0.0, 0.0 ], "nudging": { "0.001": [ -3.4691765904426575e-07, 0.0, 0.0, 0.0, 0.0, 0.0 ], "0.003": [ -1.1422671377658844e-06, 0.0, -2.7939677238464355e-09, 0.0, 0.0, 0.0 ], "0.01": [ -3.50363552570343e-06, 1.862645149230957e-09, -3.725290298461914e-09, 0.0, 0.0, 0.0 ] }, "hidden_norms_per_layer": [ 56897.21875, 1696502784.0, 3738960896.0, 4607917568.0, 5758332928.0, 6969167872.0, 7904643072.0 ], "bp_grad_norms_per_layer": [ 2.473913411904505e-07, 2.2789505005338384e-10, 2.2798352095065866e-10, 2.2797391752149565e-10, 2.2786038333943992e-10, 2.2787945141988786e-10, 2.2788908260462648e-10 ] }, "drift": { "embed.weight": 341.6512135112792, "embed.bias": 266.6380085288841, "blocks.0.ln.weight": 9.881568196594484, "blocks.0.w1.weight": 316.78039360087587, "blocks.0.w1.bias": 286.8114997527113, "blocks.0.w2.weight": 487.5637400185808, "blocks.1.ln.weight": 9.2020409527447, "blocks.1.w1.weight": 361.84956095939293, "blocks.1.w1.bias": 334.52465546675654, "blocks.1.w2.weight": 335.23042288085577, "blocks.2.ln.weight": 8.38680422611515, "blocks.2.w1.weight": 335.6889109899642, "blocks.2.w1.bias": 310.7077386931781, "blocks.2.w2.weight": 315.3949169119556, "blocks.3.ln.weight": 8.903503018515195, "blocks.3.w1.weight": 371.4244307750354, "blocks.3.w1.bias": 345.3889053690205, "blocks.3.w2.weight": 352.95729115252703, "blocks.4.ln.weight": 9.577081150302154, "blocks.4.w1.weight": 387.7879530619586, "blocks.4.w1.bias": 358.359826994576, "blocks.4.w2.weight": 353.9896695590463, "blocks.5.ln.weight": 9.043917438368451, "blocks.5.w1.weight": 368.8104037409108, "blocks.5.w1.bias": 337.4941181161536, "blocks.5.w2.weight": 342.83001538637893, "out_ln.weight": 0.6049025805082792, "out_head.weight": 8.662451359844601, "out_head.bias": 1.2452406037396404 } }, "fa": { "log": { "train_loss": [ 2.0533182458114623, 1.9470771118927002, 1.9098005801391602, 1.8933470011138915, 1.8866070096206664, 1.8806784909820558, 1.8700345465469361, 1.8668433471298218, 1.8549686681747437, 1.8534734383773803, 1.844026010055542, 1.8412904165649413, 1.8354822329711915, 1.8315302365493775, 1.8307162652206421, 1.8245070376968384, 1.820267495956421, 1.8159903725814819, 1.8120850400543214, 1.8062479650115968, 1.8023771206665038, 1.7989153610992432, 1.7973320705795288, 1.789391294517517, 1.7857570403289795, 1.7807958832550048, 1.7800961505126953, 1.7727591732025147, 1.7719479108047484, 1.7722896636199952, 1.765616308631897, 1.765071000442505, 1.7588437004852295, 1.7560785748672485, 1.7530314648056031, 1.7516267270278931, 1.7478641785049438, 1.747710930519104, 1.7394591223526001, 1.7430037671279908, 1.7430737688827516, 1.743327683944702, 1.735208967590332, 1.7367942264175416, 1.735928176651001, 1.7336044045639039, 1.7319979761123658, 1.7286449816131593, 1.7276164590072631, 1.7342356995010375, 1.7273106130599976, 1.728026152114868, 1.7241678939437866, 1.7218856454467772, 1.720424718055725, 1.7259459881973267, 1.723678625831604, 1.7201445708465577, 1.7179317428588867, 1.714501748046875, 1.7184516412353517, 1.7182959340667725, 1.7173260328674316, 1.7162155276870728, 1.7148893152618407, 1.7136942127990722, 1.7128957564926148, 1.7095485464859008, 1.711679192199707, 1.7081169268417358, 1.7124231735992432, 1.7100938080215453, 1.7099676737213134, 1.7056838412094115, 1.7102637582397462, 1.7076803800201417, 1.703552028427124, 1.7047434192657471, 1.7060186026382447, 1.7038543602752685, 1.7023552209091186, 1.7033933319854737, 1.7048375073623656, 1.7029183816146851, 1.7019960340118407, 1.7012598460006714, 1.700243671836853, 1.6951217443847657, 1.7031349285125732, 1.6982279485702514, 1.7003905519866944, 1.7008577185821534, 1.69846902469635, 1.7006194688796996, 1.6990861594009399, 1.7007253762817383, 1.702599566040039, 1.7018861039352418, 1.699664118347168, 1.7012134171295166 ], "train_acc": [ 0.24282, 0.28774, 0.30648, 0.31656, 0.32152, 0.3235, 0.33028, 0.32876, 0.33768, 0.33628, 0.33892, 0.341, 0.3464, 0.34646, 0.3456, 0.35168, 0.34876, 0.35232, 0.35214, 0.3571, 0.3564, 0.35782, 0.35768, 0.36332, 0.3616, 0.36234, 0.3655, 0.36546, 0.36836, 0.36622, 0.36982, 0.36954, 0.3712, 0.37104, 0.37318, 0.37486, 0.37374, 0.37526, 0.37592, 0.37592, 0.37662, 0.37494, 0.37758, 0.37708, 0.37796, 0.38076, 0.37962, 0.38058, 0.3806, 0.37936, 0.38016, 0.38172, 0.38376, 0.384, 0.38752, 0.3876, 0.38602, 0.38746, 0.38644, 0.386, 0.38718, 0.38552, 0.38468, 0.3868, 0.38882, 0.38934, 0.3874, 0.38992, 0.3904, 0.3908, 0.38916, 0.38954, 0.39022, 0.39024, 0.39018, 0.39104, 0.39206, 0.39178, 0.39074, 0.3921, 0.39292, 0.39326, 0.39202, 0.3935, 0.39312, 0.3942, 0.39594, 0.39766, 0.39178, 0.39502, 0.39626, 0.39468, 0.39338, 0.39468, 0.39366, 0.39276, 0.39356, 0.39354, 0.39138, 0.39408 ], "test_acc": [ 0.2926, 0.3237, 0.3296, 0.3577, 0.3485, 0.3454, 0.3678, 0.3648, 0.3607, 0.3756, 0.3775, 0.3817, 0.3786, 0.3781, 0.3803, 0.3682, 0.369, 0.371, 0.3834, 0.3875, 0.3822, 0.3805, 0.392, 0.401, 0.3844, 0.4015, 0.3866, 0.3901, 0.3987, 0.3939, 0.3837, 0.3972, 0.3877, 0.3994, 0.4002, 0.4033, 0.4085, 0.4058, 0.391, 0.399, 0.3986, 0.4086, 0.404, 0.4086, 0.4062, 0.4047, 0.3991, 0.4037, 0.3968, 0.4118, 0.4017, 0.4095, 0.4117, 0.4037, 0.4073, 0.4087, 0.4137, 0.4088, 0.3997, 0.4059, 0.409, 0.4099, 0.4096, 0.412, 0.4102, 0.4137, 0.4102, 0.4121, 0.4119, 0.4132, 0.4149, 0.412, 0.415, 0.4148, 0.4154, 0.416, 0.4112, 0.4109, 0.4153, 0.4148, 0.4183, 0.4172, 0.4152, 0.4157, 0.418, 0.4115, 0.4187, 0.4127, 0.4108, 0.4153, 0.4141, 0.4132, 0.415, 0.4124, 0.4151, 0.4147, 0.4136, 0.4142, 0.4147, 0.4144 ] }, "diagnostics": { "bp_cosine": [ 0.030343683436512947, 0.09938552975654602, -0.07437123358249664, -0.07549507170915604, -0.09523595124483109, 0.9972963929176331 ], "perturbation_rho": [ 0.04541456699371338, 0.008701281622052193, -0.00402827700600028, 0.03399529308080673, -0.00989921111613512, 0.004614755045622587 ], "nudging": { "0.001": [ -2.914457581937313e-06, -5.584442988038063e-07, 1.0908115655183792e-07, 4.6566128730773926e-08, 4.377216100692749e-08, -1.0116491466760635e-06 ], "0.003": [ -8.360599167644978e-06, -2.0274892449378967e-06, 2.825399860739708e-07, 3.023305907845497e-07, 2.789311110973358e-07, -4.071509465575218e-06 ], "0.01": [ -2.804200630635023e-05, -6.612506695091724e-06, 9.683426469564438e-07, 1.1706724762916565e-06, 1.3328390195965767e-06, -1.4974735677242279e-05 ] }, "hidden_norms_per_layer": [ 5724.40771484375, 72733.609375, 478685.65625, 1483182.625, 1809620.875, 2091372.375, 857882.6875 ], "bp_grad_norms_per_layer": [ 3.0453806175501086e-05, 2.1086596007080516e-06, 6.627448101426126e-07, 6.460473969127634e-07, 6.491723638646363e-07, 6.540217896144895e-07, 6.466638637903088e-07 ] }, "drift": { "embed.weight": 42.22188941497859, "embed.bias": 17.68183956971274, "blocks.0.ln.weight": 1.180802481067003, "blocks.0.w1.weight": 15.4315958124657, "blocks.0.w1.bias": 12.305080689576908, "blocks.0.w2.weight": 57.44824499129088, "blocks.1.ln.weight": 0.9692930700548912, "blocks.1.w1.weight": 19.880441088833255, "blocks.1.w1.bias": 16.257331118504066, "blocks.1.w2.weight": 48.06735579536956, "blocks.2.ln.weight": 0.7719428930423391, "blocks.2.w1.weight": 23.427567219106724, "blocks.2.w1.bias": 24.716070592776813, "blocks.2.w2.weight": 33.2055102304801, "blocks.3.ln.weight": 0.6610316048264212, "blocks.3.w1.weight": 21.14916966984416, "blocks.3.w1.bias": 22.188834381211755, "blocks.3.w2.weight": 37.41900122482242, "blocks.4.ln.weight": 0.6045383052903652, "blocks.4.w1.weight": 21.6093498763088, "blocks.4.w1.bias": 23.188519739977856, "blocks.4.w2.weight": 29.43277495491079, "blocks.5.ln.weight": 0.7110348796366065, "blocks.5.w1.weight": 22.91348409054967, "blocks.5.w1.bias": 24.128500394824375, "blocks.5.w2.weight": 42.82735324390181, "out_ln.weight": 0.2879508142897712, "out_head.weight": 5.9584913076844686, "out_head.bias": 1.1797514883024003 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 6, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 1 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L6_seed1", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }