{ "1": { "dfa": { "log": { "train_loss": [ 2.059094401855469, 2.044447731781006, 2.0331237268066404, 2.029790968055725, 2.0203696198272705, 2.019836251373291, 2.0172710887908933, 2.0157542709350587, 2.01279447265625, 2.0095205695343017, 2.0108920065689087, 2.0079552867889405, 2.0044708168792726, 2.0045814642333983, 2.008353828582764, 2.0057097484970092, 2.0044997080993654, 2.008672186203003, 2.007922875289917, 2.005835166091919, 2.0033903245544433, 2.0044442585754396, 2.002520341949463, 2.00441702545166, 2.0058324599456787, 2.004086421432495, 2.0051950196838377, 2.0038982134246828, 2.004509604110718, 2.0052878368377685, 2.002380726890564, 2.004787947921753, 2.0059314285278322, 2.00248601272583, 2.0011240525817873, 2.0024265776062014, 2.000450315246582, 2.003341311035156, 2.0023523516082764, 2.0043818824768067, 2.0009307250213624, 1.9997900833129882, 1.99952888671875, 1.9998678870010376, 2.000314803161621, 2.0005521519470215, 1.9993469972991944, 2.0002477783966066, 1.9992239441680908, 2.000459006500244, 1.999985199661255, 1.9989831493377686, 1.9985046770477295, 1.999920511932373, 2.001435203552246, 1.999222763671875, 1.9992314191436769, 1.9978362256240845, 1.9966827032470704, 1.9963577353286743, 1.9981027877807618, 1.998446220703125, 1.999375821762085, 1.9966239959716796, 1.9978697190856933, 1.9981718766021728, 1.9964544176864625, 1.996339178161621, 1.995297778892517, 1.9981674702453613, 1.9945542547988893, 1.9964004328918457, 1.9957070028686523, 1.9959317153930665, 1.996950538787842, 1.9957062911987304, 1.9937946883392335, 1.9961785815429687, 1.996840117225647, 1.9966120117950439, 1.9950081676483153, 1.9959315377807618, 1.9947433185195922, 1.9953646588897704, 1.9961627129745483, 1.9956305498504638, 1.9933074866104126, 1.9939569332122802, 1.9948224069213867, 1.9938344969940185, 1.9951542666625977, 1.994460453224182, 1.9951913018798828, 1.992417700653076, 1.9943852715682984, 1.9950172023010253, 1.9913645124816894, 1.9934076538467407, 1.993856616821289, 1.9950498567962647 ], "train_acc": [ 0.24538, 0.2525, 0.24984, 0.25596, 0.25824, 0.26188, 0.26018, 0.26256, 0.26788, 0.26836, 0.26572, 0.26712, 0.26946, 0.2707, 0.26872, 0.26986, 0.26942, 0.26706, 0.2688, 0.26814, 0.2714, 0.26896, 0.26966, 0.27136, 0.26994, 0.27172, 0.27024, 0.2708, 0.27018, 0.27212, 0.27326, 0.2728, 0.2694, 0.27118, 0.27332, 0.2738, 0.27492, 0.27382, 0.27348, 0.27124, 0.27338, 0.27632, 0.27474, 0.27438, 0.27608, 0.27216, 0.27472, 0.27174, 0.2764, 0.27286, 0.27426, 0.27344, 0.27646, 0.27692, 0.27348, 0.27398, 0.2745, 0.27462, 0.27702, 0.2742, 0.27524, 0.27522, 0.2742, 0.27684, 0.27522, 0.2755, 0.2759, 0.27692, 0.27698, 0.27796, 0.27768, 0.27376, 0.27822, 0.2749, 0.27752, 0.2773, 0.27838, 0.27666, 0.27632, 0.27526, 0.27792, 0.27644, 0.2755, 0.27696, 0.27616, 0.27868, 0.27898, 0.27856, 0.27766, 0.27746, 0.27564, 0.27836, 0.27742, 0.27794, 0.27654, 0.277, 0.28076, 0.27934, 0.27814, 0.27694 ], "test_acc": [ 0.2655, 0.2561, 0.2732, 0.2647, 0.2937, 0.2959, 0.2856, 0.2952, 0.2909, 0.2903, 0.2948, 0.2937, 0.2853, 0.2983, 0.2836, 0.2904, 0.2751, 0.294, 0.2826, 0.2783, 0.3006, 0.2986, 0.2981, 0.2913, 0.27, 0.2959, 0.2941, 0.2893, 0.2816, 0.2762, 0.2842, 0.2888, 0.294, 0.3006, 0.2761, 0.2995, 0.2824, 0.2895, 0.2918, 0.2959, 0.2896, 0.2977, 0.2867, 0.2906, 0.2955, 0.2965, 0.2819, 0.2848, 0.293, 0.2901, 0.2903, 0.2893, 0.2946, 0.286, 0.2811, 0.2948, 0.2884, 0.2963, 0.2914, 0.2919, 0.2882, 0.2923, 0.2964, 0.3036, 0.3028, 0.2942, 0.2974, 0.286, 0.2997, 0.2913, 0.2942, 0.2914, 0.295, 0.2929, 0.2945, 0.2905, 0.2979, 0.3003, 0.2997, 0.295, 0.2937, 0.2884, 0.2946, 0.2959, 0.2977, 0.2996, 0.2999, 0.2952, 0.297, 0.2936, 0.2981, 0.2977, 0.2982, 0.2978, 0.2979, 0.2976, 0.2983, 0.2977, 0.2978, 0.2978 ] }, "diagnostics": { "bp_cosine": [ 0.41370105743408203, -0.001240116311237216 ], "perturbation_rho": [ 0.015020761638879776, 0.0 ], "nudging": { "0.001": [ -4.163011908531189e-07, 0.0 ], "0.003": [ -1.1897645890712738e-06, 0.0 ], "0.01": [ -3.778841346502304e-06, 9.313225746154785e-10 ] }, "hidden_norms_per_layer": [ 56646.390625, 1782275456.0, 3970110464.0 ], "bp_grad_norms_per_layer": [ 2.493850104201556e-07, 3.667711412358443e-10, 3.6680619652784685e-10 ] }, "drift": { "embed.weight": 340.80661711332743, "embed.bias": 276.58178672612297, "blocks.0.ln.weight": 9.889068312709053, "blocks.0.w1.weight": 318.9410688527977, "blocks.0.w1.bias": 284.37318853440576, "blocks.0.w2.weight": 489.2728313372279, "blocks.1.ln.weight": 9.298819559476074, "blocks.1.w1.weight": 366.2278399546544, "blocks.1.w1.bias": 340.3854434800174, "blocks.1.w2.weight": 341.5363762004093, "out_ln.weight": 0.5301057051408113, "out_head.weight": 8.039116173269838, "out_head.bias": 2.5371126762269562 } }, "fa": { "log": { "train_loss": [ 2.05515945022583, 1.9500655529785156, 1.9110925933456422, 1.8819315839004516, 1.8608471837615967, 1.8478346523666382, 1.8411366244125367, 1.8377560669326782, 1.8311604034805298, 1.8246206870269774, 1.8166842291641236, 1.8113972366714477, 1.8071093799209594, 1.7970440604400635, 1.7988952663803102, 1.7952887838363647, 1.7926777132415772, 1.790428493423462, 1.7899820502090453, 1.7887613116836547, 1.7811174698257446, 1.781726747894287, 1.782828377418518, 1.7825099970245362, 1.7798745111846923, 1.7748807119369507, 1.769409514427185, 1.7675959386444091, 1.7701947622680665, 1.7674276565551759, 1.7609349981307982, 1.7605391665267944, 1.762060026626587, 1.7580202764129638, 1.7636039975357056, 1.7673666812133788, 1.7655566649627685, 1.7669985010147096, 1.7656920331192016, 1.7639919567108153, 1.7634542723846436, 1.7601457201766968, 1.761037275123596, 1.7602271603775024, 1.7624055517578125, 1.7582754214477538, 1.7596718951416015, 1.7575918433380127, 1.757328048439026, 1.7560129935455322, 1.7593553677749634, 1.75662100856781, 1.7546059392547608, 1.7581290004730226, 1.7570533187103272, 1.7555389776992798, 1.755943459587097, 1.752056611404419, 1.752125501060486, 1.7542531232452392, 1.7525837285614014, 1.7537434762954711, 1.7566586553573609, 1.754645963783264, 1.7561360279083251, 1.7577947814178467, 1.7517323531723021, 1.7506846601104735, 1.7523996893310547, 1.7564484720611573, 1.7542920526885986, 1.7536059958648682, 1.753201146583557, 1.7531446646118165, 1.7524780932617188, 1.7523272793197633, 1.752608459777832, 1.7483984720611572, 1.7505473443984985, 1.750156759109497, 1.7495093181991577, 1.7508859223175048, 1.7515791293716432, 1.7466206330108642, 1.751723793373108, 1.750410927658081, 1.7431821329116821, 1.7460082646942139, 1.7443738849639892, 1.7485774746704101, 1.747268639907837, 1.7440908068847656, 1.7475049467468262, 1.7451262094497682, 1.747353721961975, 1.7474739736557008, 1.7444730795669556, 1.748691442642212, 1.743288662033081, 1.7470912045669555 ], "train_acc": [ 0.25462, 0.29498, 0.31256, 0.32432, 0.33206, 0.33724, 0.33776, 0.34132, 0.34392, 0.34576, 0.35074, 0.34868, 0.35426, 0.35624, 0.35478, 0.35702, 0.35892, 0.3572, 0.35788, 0.35796, 0.3596, 0.36274, 0.3592, 0.36092, 0.36282, 0.36558, 0.36466, 0.36602, 0.36356, 0.36714, 0.36908, 0.36888, 0.36582, 0.368, 0.365, 0.3677, 0.3674, 0.3658, 0.36706, 0.368, 0.3688, 0.3678, 0.36976, 0.36634, 0.36654, 0.3687, 0.36986, 0.36986, 0.3703, 0.37068, 0.36806, 0.37002, 0.37306, 0.3722, 0.36826, 0.37146, 0.3704, 0.37428, 0.37186, 0.37382, 0.37398, 0.3711, 0.3723, 0.37532, 0.37158, 0.37096, 0.37172, 0.37316, 0.37314, 0.37438, 0.37196, 0.3737, 0.37458, 0.37306, 0.37588, 0.37444, 0.37408, 0.37832, 0.37416, 0.37576, 0.3746, 0.375, 0.37462, 0.37456, 0.37364, 0.37744, 0.37852, 0.37832, 0.3778, 0.37706, 0.37604, 0.37654, 0.37828, 0.37762, 0.37686, 0.377, 0.37886, 0.37662, 0.37522, 0.37652 ], "test_acc": [ 0.2978, 0.3334, 0.3399, 0.3342, 0.3634, 0.3618, 0.3505, 0.3521, 0.3696, 0.3722, 0.3679, 0.3787, 0.3663, 0.3811, 0.3611, 0.365, 0.3543, 0.3666, 0.3501, 0.36, 0.3572, 0.3504, 0.3467, 0.3598, 0.3353, 0.3474, 0.3382, 0.3432, 0.3617, 0.3397, 0.353, 0.3288, 0.3385, 0.3414, 0.3467, 0.3389, 0.3341, 0.3434, 0.3537, 0.3496, 0.3526, 0.346, 0.3603, 0.3526, 0.3342, 0.346, 0.3392, 0.3277, 0.3535, 0.3419, 0.3396, 0.3404, 0.3433, 0.3468, 0.339, 0.3361, 0.3421, 0.3363, 0.3544, 0.3465, 0.3454, 0.3472, 0.3401, 0.3454, 0.3511, 0.343, 0.3445, 0.3368, 0.3424, 0.3425, 0.3381, 0.3435, 0.3496, 0.346, 0.3411, 0.3408, 0.3512, 0.3469, 0.3473, 0.3419, 0.3554, 0.3449, 0.345, 0.3431, 0.3442, 0.3501, 0.3534, 0.3469, 0.3496, 0.3436, 0.3478, 0.3501, 0.3492, 0.3481, 0.3474, 0.3466, 0.3476, 0.3468, 0.3473, 0.3471 ] }, "diagnostics": { "bp_cosine": [ 0.007958251982927322, 0.9600946307182312 ], "perturbation_rho": [ 0.029625363647937775, 0.18801619112491608 ], "nudging": { "0.001": [ 4.2957253754138947e-07, -8.616363629698753e-06 ], "0.003": [ 1.2052478268742561e-06, -2.6152702048420906e-05 ], "0.01": [ 4.0422892197966576e-06, -8.745735976845026e-05 ] }, "hidden_norms_per_layer": [ 6253.97314453125, 339687.71875, 217173.15625 ], "bp_grad_norms_per_layer": [ 1.8587075828691013e-05, 8.973949547907978e-07, 7.725411705905572e-07 ] }, "drift": { "embed.weight": 35.41278218973057, "embed.bias": 29.83841191850244, "blocks.0.ln.weight": 1.4875314025636917, "blocks.0.w1.weight": 25.996758962578763, "blocks.0.w1.bias": 15.439034204651744, "blocks.0.w2.weight": 58.48910743468254, "blocks.1.ln.weight": 1.2261067193625912, "blocks.1.w1.weight": 24.34549540914942, "blocks.1.w1.bias": 12.006957572444392, "blocks.1.w2.weight": 29.62795958064609, "out_ln.weight": 0.4822583681094011, "out_head.weight": 3.604309031698496, "out_head.bias": 10.930487632919764 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 2, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 1 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L2_seed1", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }