{ "4": { "dfa": { "log": { "train_loss": [ 2.0538645137786866, 2.0414622520446777, 2.0403961332702636, 2.0313826718139647, 2.028870590591431, 2.0276684378814696, 2.025082506790161, 2.027707338409424, 2.024693886566162, 2.0219140999603273, 2.024347680053711, 2.0226476731109617, 2.0212312582397463, 2.019639465713501, 2.0200840225982666, 2.022379661102295, 2.0195740895843506, 2.018866870689392, 2.0154102825164797, 2.019121079330444, 2.0158904475402832, 2.0182619565582276, 2.0165906146240236, 2.0169575183868407, 2.0150413411712647, 2.0142192585754395, 2.0149837336730956, 2.014163435897827, 2.0160239248275755, 2.012873958053589, 2.014381752700806, 2.0157296450805666, 2.0139720638656615, 2.0141250953674317, 2.0129578493881226, 2.0142643730926513, 2.011523956451416, 2.0130753877258303, 2.0103190279388428, 2.0131986405181883, 2.011784356765747, 2.0098198655700683, 2.0134172485351565, 2.011796088027954, 2.009907284927368, 2.0113371464538576, 2.011871915245056, 2.012780702667236, 2.0106706674194337, 2.0101452950286864, 2.0108949478149416, 2.0081811878967284, 2.0113219532775877, 2.0078719809722902, 2.008186681213379, 2.0087371883392335, 2.010032041015625, 2.0062248846054076, 2.008138601531982, 2.008908841209412, 2.006502756500244, 2.0063726428604127, 2.006322613143921, 2.0073862936401365, 2.0092133827209473, 2.0075592138671876, 2.0070631226348876, 2.0061116324615478, 2.0080163690567017, 2.0098242531585693, 2.004972350997925, 2.0045611180877687, 2.0060609978485107, 2.0061137674713136, 2.0058565605163574, 2.0072338876342775, 2.0047287912750242, 2.0041282120132444, 2.007643541030884, 2.0067062200546264, 2.005947174911499, 2.0044366609191893, 2.0044241131591796, 2.0034669429016114, 2.0061908039855956, 2.004900071258545, 2.002522025909424, 2.0041396823120117, 2.0040297746276856, 2.0036116275787355, 2.003599824256897, 2.003862293243408, 2.002604514427185, 2.003420566329956, 2.0044958754730224, 2.0024802682876586, 2.001940184288025, 2.004589928436279, 2.00544753616333, 2.004831633987427 ], "train_acc": [ 0.24328, 0.2486, 0.2526, 0.25192, 0.25386, 0.25942, 0.2579, 0.25428, 0.2558, 0.2587, 0.25714, 0.25432, 0.2597, 0.26176, 0.25932, 0.25756, 0.26362, 0.26154, 0.26296, 0.26458, 0.2631, 0.26162, 0.2629, 0.26272, 0.26022, 0.26332, 0.26328, 0.26642, 0.26188, 0.26562, 0.26456, 0.26682, 0.2653, 0.2635, 0.26696, 0.26618, 0.26604, 0.26422, 0.26612, 0.26754, 0.26958, 0.2674, 0.26656, 0.2681, 0.2651, 0.2682, 0.266, 0.26656, 0.26712, 0.26854, 0.26726, 0.26844, 0.26866, 0.26848, 0.2684, 0.26968, 0.2694, 0.27024, 0.26914, 0.2689, 0.27068, 0.26872, 0.2698, 0.2698, 0.27038, 0.27008, 0.26956, 0.26956, 0.26738, 0.2676, 0.27036, 0.27014, 0.26994, 0.27158, 0.27192, 0.27026, 0.27058, 0.27212, 0.26966, 0.26896, 0.27094, 0.27132, 0.27096, 0.27272, 0.2715, 0.2717, 0.27104, 0.27176, 0.26956, 0.26908, 0.27146, 0.2707, 0.27088, 0.26976, 0.2708, 0.27234, 0.27182, 0.27142, 0.27088, 0.27292 ], "test_acc": [ 0.2691, 0.2657, 0.2489, 0.2683, 0.2735, 0.2856, 0.2869, 0.2671, 0.2775, 0.2707, 0.2668, 0.2677, 0.2711, 0.284, 0.28, 0.2978, 0.2649, 0.2558, 0.2813, 0.2732, 0.2875, 0.2844, 0.2664, 0.2731, 0.2948, 0.2757, 0.2818, 0.2811, 0.2842, 0.2762, 0.2852, 0.2639, 0.2834, 0.2859, 0.2804, 0.2727, 0.2794, 0.2916, 0.2746, 0.2768, 0.2903, 0.2722, 0.2896, 0.2856, 0.2906, 0.2848, 0.2776, 0.29, 0.2918, 0.2703, 0.2847, 0.2838, 0.2816, 0.2894, 0.2815, 0.2783, 0.2917, 0.2712, 0.285, 0.2861, 0.2844, 0.2898, 0.2839, 0.2886, 0.2809, 0.2826, 0.2792, 0.2864, 0.2978, 0.2876, 0.2855, 0.2997, 0.2912, 0.2887, 0.2867, 0.2842, 0.284, 0.2781, 0.2817, 0.2911, 0.2842, 0.2834, 0.2867, 0.2861, 0.2867, 0.284, 0.2887, 0.2864, 0.2875, 0.2899, 0.2864, 0.287, 0.2901, 0.2856, 0.2866, 0.2863, 0.2859, 0.2861, 0.2861, 0.2861 ] }, "diagnostics": { "bp_cosine": [ 0.3827235698699951, -0.000831119017675519 ], "perturbation_rho": [ -0.01562047004699707, 0.0 ], "nudging": { "0.001": [ -2.812594175338745e-07, 0.0 ], "0.003": [ -9.383074939250946e-07, 0.0 ], "0.01": [ -3.2153911888599396e-06, 0.0 ] }, "hidden_norms_per_layer": [ 55950.5390625, 1669607168.0, 3780465152.0 ], "bp_grad_norms_per_layer": [ 2.2658105081063695e-07, 2.3708951468748296e-10, 2.3738841448128767e-10 ] }, "drift": { "embed.weight": 337.5136698692365, "embed.bias": 273.5401823379648, "blocks.0.ln.weight": 9.322317945209601, "blocks.0.w1.weight": 322.0064838288751, "blocks.0.w1.bias": 292.5825702677452, "blocks.0.w2.weight": 505.89197780725414, "blocks.1.ln.weight": 9.09606961243359, "blocks.1.w1.weight": 353.39130820313096, "blocks.1.w1.bias": 346.5478039461049, "blocks.1.w2.weight": 349.3876744406949, "out_ln.weight": 0.435883262668521, "out_head.weight": 7.086345015239166, "out_head.bias": 3.9170311167015974 } }, "fa": { "log": { "train_loss": [ 2.083539034461975, 1.9695448753356934, 1.9397349642562867, 1.9066173551177978, 1.886961284866333, 1.8710758205795288, 1.8628956564331054, 1.8567623680877685, 1.8501425790405273, 1.850063798828125, 1.8536383200073243, 1.851845763206482, 1.8578751723480225, 1.8505859604263306, 1.8504567489242554, 1.8505229975128175, 1.8486209188079834, 1.8476799687957763, 1.8461452635192872, 1.8506561833953858, 1.8442412594985962, 1.8458462058258056, 1.842808702659607, 1.8387870932769776, 1.8379171523666382, 1.828637089920044, 1.824536803894043, 1.822955154800415, 1.8200513568878174, 1.814583374671936, 1.8130536968231201, 1.8116273685073851, 1.810110004234314, 1.808945005569458, 1.8023032517242432, 1.8105073015975952, 1.81240649143219, 1.8092195032501222, 1.8054952936172486, 1.8071781116485595, 1.8033202910614015, 1.8002542707061768, 1.7996792233276366, 1.794723889541626, 1.788533415184021, 1.7873220053100587, 1.7867383001327515, 1.7845936785888672, 1.7811818826675414, 1.7822032886505126, 1.7786470770263672, 1.7798991229629517, 1.7747682898712158, 1.771372130050659, 1.7732186395645142, 1.767907095336914, 1.7648547525405884, 1.7638111727523804, 1.7647753219223024, 1.7633140285491944, 1.758088468322754, 1.7619236371612548, 1.7579612891006469, 1.7559792065811157, 1.7589319384002686, 1.7530268384170533, 1.7540921353530883, 1.7525135382080077, 1.7494160869979858, 1.7476271326446533, 1.7485824377059938, 1.7481532715225219, 1.7493890603256226, 1.753240061607361, 1.7450246924209594, 1.7479931283950805, 1.7435640298461914, 1.7442714694595336, 1.7464028844833375, 1.7440459408950806, 1.7451819785308837, 1.7424172634124755, 1.7414722381591796, 1.7440056212997437, 1.7441547555160521, 1.741508984413147, 1.7379715420913697, 1.743159959335327, 1.737216314048767, 1.73957718044281, 1.7399621460342407, 1.7403172652435304, 1.7397853451919556, 1.7367944290161133, 1.7394116397476196, 1.7405242685317994, 1.7411947003173829, 1.7401781003189087, 1.7426191668319702, 1.7414960692977905 ], "train_acc": [ 0.24206, 0.28608, 0.30284, 0.31378, 0.32214, 0.33222, 0.33458, 0.33384, 0.339, 0.3365, 0.33642, 0.33268, 0.3321, 0.3336, 0.33528, 0.33412, 0.3342, 0.33516, 0.3349, 0.3369, 0.33338, 0.33768, 0.3359, 0.3389, 0.33848, 0.33996, 0.34268, 0.34516, 0.34514, 0.34766, 0.3483, 0.35214, 0.34858, 0.34992, 0.35344, 0.35134, 0.34842, 0.35144, 0.35262, 0.35272, 0.35618, 0.35276, 0.35816, 0.3578, 0.35874, 0.3609, 0.36208, 0.3595, 0.3629, 0.36296, 0.36438, 0.36234, 0.3654, 0.36716, 0.36458, 0.36772, 0.36752, 0.36904, 0.3677, 0.3659, 0.3724, 0.36748, 0.37008, 0.37166, 0.37228, 0.37126, 0.37246, 0.3711, 0.37376, 0.3725, 0.37384, 0.37248, 0.37364, 0.37298, 0.37408, 0.37304, 0.37604, 0.37672, 0.3764, 0.37472, 0.37532, 0.3761, 0.37432, 0.37696, 0.3772, 0.37738, 0.37684, 0.37452, 0.37578, 0.37302, 0.37482, 0.3745, 0.37608, 0.37402, 0.37522, 0.37624, 0.377, 0.37676, 0.37804, 0.3765 ], "test_acc": [ 0.2873, 0.2968, 0.3102, 0.3278, 0.3267, 0.3394, 0.3594, 0.3508, 0.348, 0.3577, 0.3237, 0.3288, 0.3256, 0.3468, 0.3314, 0.3353, 0.3342, 0.3343, 0.3363, 0.3386, 0.3359, 0.3401, 0.3353, 0.3296, 0.3361, 0.3547, 0.3367, 0.342, 0.3335, 0.3402, 0.3509, 0.3259, 0.3411, 0.342, 0.3459, 0.3338, 0.3447, 0.3462, 0.3413, 0.3409, 0.3561, 0.3417, 0.3429, 0.3539, 0.3554, 0.3409, 0.3557, 0.3535, 0.3559, 0.3474, 0.3477, 0.3647, 0.3483, 0.337, 0.3458, 0.3461, 0.3488, 0.3399, 0.351, 0.3393, 0.3521, 0.3505, 0.354, 0.3489, 0.3421, 0.3435, 0.3427, 0.345, 0.3509, 0.3393, 0.3513, 0.3592, 0.3435, 0.3491, 0.3462, 0.3486, 0.3435, 0.3421, 0.3463, 0.3537, 0.3507, 0.3476, 0.3523, 0.346, 0.3548, 0.3469, 0.3489, 0.3457, 0.3483, 0.3495, 0.3507, 0.3498, 0.3509, 0.3498, 0.3485, 0.3503, 0.3507, 0.3502, 0.3501, 0.3501 ] }, "diagnostics": { "bp_cosine": [ 0.03285929560661316, 0.9476211071014404 ], "perturbation_rho": [ 0.010396776720881462, 0.21192286908626556 ], "nudging": { "0.001": [ -4.190136678516865e-06, -7.935799658298492e-06 ], "0.003": [ -1.2663658708333969e-05, -2.3964676074683666e-05 ], "0.01": [ -4.219170659780502e-05, -8.006719872355461e-05 ] }, "hidden_norms_per_layer": [ 3884.70703125, 284714.21875, 219214.828125 ], "bp_grad_norms_per_layer": [ 1.9074828742304817e-05, 6.634672331529146e-07, 6.522877811221406e-07 ] }, "drift": { "embed.weight": 27.016438956012585, "embed.bias": 16.969540152339597, "blocks.0.ln.weight": 1.5836171150936886, "blocks.0.w1.weight": 25.706341628627694, "blocks.0.w1.bias": 21.000244171066868, "blocks.0.w2.weight": 64.31974159860198, "blocks.1.ln.weight": 0.9270002241369442, "blocks.1.w1.weight": 14.313388328940205, "blocks.1.w1.bias": 6.9567229997624445, "blocks.1.w2.weight": 31.78188983358227, "out_ln.weight": 0.46949971605667673, "out_head.weight": 3.9796491257565023, "out_head.bias": 12.763196315235756 } } }, "config": { "dataset": "cifar10", "d_hidden": 512, "num_blocks": 2, "batch_size": 128, "epochs": 100, "lr": 0.001, "lr_fb": 0.001, "wd": 0.01, "lam": 0.1, "K": 4, "sigma_bridge": 0.05, "ema_momentum": 0.995, "term_grad_weight": 1.0, "seeds": [ 4 ], "gpu": 0, "output_dir": "results/fa_dfa_d512_L2_seed4", "methods": [ "fa", "dfa" ], "random_targets": false, "penalty_lam": 0.0, "num_classes": 10 } }