diff options
Diffstat (limited to 'results/fa_dfa_d512_L2_seed4/results_cifar10.json')
| -rw-r--r-- | results/fa_dfa_d512_L2_seed4/results_cifar10.json | 749 |
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed4/results_cifar10.json b/results/fa_dfa_d512_L2_seed4/results_cifar10.json new file mode 100644 index 0000000..9e35093 --- /dev/null +++ b/results/fa_dfa_d512_L2_seed4/results_cifar10.json @@ -0,0 +1,749 @@ +{ + "4": { + "dfa": { + "log": { + "train_loss": [ + 2.0538645137786866, + 2.0414622520446777, + 2.0403961332702636, + 2.0313826718139647, + 2.028870590591431, + 2.0276684378814696, + 2.025082506790161, + 2.027707338409424, + 2.024693886566162, + 2.0219140999603273, + 2.024347680053711, + 2.0226476731109617, + 2.0212312582397463, + 2.019639465713501, + 2.0200840225982666, + 2.022379661102295, + 2.0195740895843506, + 2.018866870689392, + 2.0154102825164797, + 2.019121079330444, + 2.0158904475402832, + 2.0182619565582276, + 2.0165906146240236, + 2.0169575183868407, + 2.0150413411712647, + 2.0142192585754395, + 2.0149837336730956, + 2.014163435897827, + 2.0160239248275755, + 2.012873958053589, + 2.014381752700806, + 2.0157296450805666, + 2.0139720638656615, + 2.0141250953674317, + 2.0129578493881226, + 2.0142643730926513, + 2.011523956451416, + 2.0130753877258303, + 2.0103190279388428, + 2.0131986405181883, + 2.011784356765747, + 2.0098198655700683, + 2.0134172485351565, + 2.011796088027954, + 2.009907284927368, + 2.0113371464538576, + 2.011871915245056, + 2.012780702667236, + 2.0106706674194337, + 2.0101452950286864, + 2.0108949478149416, + 2.0081811878967284, + 2.0113219532775877, + 2.0078719809722902, + 2.008186681213379, + 2.0087371883392335, + 2.010032041015625, + 2.0062248846054076, + 2.008138601531982, + 2.008908841209412, + 2.006502756500244, + 2.0063726428604127, + 2.006322613143921, + 2.0073862936401365, + 2.0092133827209473, + 2.0075592138671876, + 2.0070631226348876, + 2.0061116324615478, + 2.0080163690567017, + 2.0098242531585693, + 2.004972350997925, + 2.0045611180877687, + 2.0060609978485107, + 2.0061137674713136, + 2.0058565605163574, + 2.0072338876342775, + 2.0047287912750242, + 2.0041282120132444, + 2.007643541030884, + 2.0067062200546264, + 2.005947174911499, + 2.0044366609191893, + 2.0044241131591796, + 2.0034669429016114, + 2.0061908039855956, + 2.004900071258545, + 2.002522025909424, + 2.0041396823120117, + 2.0040297746276856, + 2.0036116275787355, + 2.003599824256897, + 2.003862293243408, + 2.002604514427185, + 2.003420566329956, + 2.0044958754730224, + 2.0024802682876586, + 2.001940184288025, + 2.004589928436279, + 2.00544753616333, + 2.004831633987427 + ], + "train_acc": [ + 0.24328, + 0.2486, + 0.2526, + 0.25192, + 0.25386, + 0.25942, + 0.2579, + 0.25428, + 0.2558, + 0.2587, + 0.25714, + 0.25432, + 0.2597, + 0.26176, + 0.25932, + 0.25756, + 0.26362, + 0.26154, + 0.26296, + 0.26458, + 0.2631, + 0.26162, + 0.2629, + 0.26272, + 0.26022, + 0.26332, + 0.26328, + 0.26642, + 0.26188, + 0.26562, + 0.26456, + 0.26682, + 0.2653, + 0.2635, + 0.26696, + 0.26618, + 0.26604, + 0.26422, + 0.26612, + 0.26754, + 0.26958, + 0.2674, + 0.26656, + 0.2681, + 0.2651, + 0.2682, + 0.266, + 0.26656, + 0.26712, + 0.26854, + 0.26726, + 0.26844, + 0.26866, + 0.26848, + 0.2684, + 0.26968, + 0.2694, + 0.27024, + 0.26914, + 0.2689, + 0.27068, + 0.26872, + 0.2698, + 0.2698, + 0.27038, + 0.27008, + 0.26956, + 0.26956, + 0.26738, + 0.2676, + 0.27036, + 0.27014, + 0.26994, + 0.27158, + 0.27192, + 0.27026, + 0.27058, + 0.27212, + 0.26966, + 0.26896, + 0.27094, + 0.27132, + 0.27096, + 0.27272, + 0.2715, + 0.2717, + 0.27104, + 0.27176, + 0.26956, + 0.26908, + 0.27146, + 0.2707, + 0.27088, + 0.26976, + 0.2708, + 0.27234, + 0.27182, + 0.27142, + 0.27088, + 0.27292 + ], + "test_acc": [ + 0.2691, + 0.2657, + 0.2489, + 0.2683, + 0.2735, + 0.2856, + 0.2869, + 0.2671, + 0.2775, + 0.2707, + 0.2668, + 0.2677, + 0.2711, + 0.284, + 0.28, + 0.2978, + 0.2649, + 0.2558, + 0.2813, + 0.2732, + 0.2875, + 0.2844, + 0.2664, + 0.2731, + 0.2948, + 0.2757, + 0.2818, + 0.2811, + 0.2842, + 0.2762, + 0.2852, + 0.2639, + 0.2834, + 0.2859, + 0.2804, + 0.2727, + 0.2794, + 0.2916, + 0.2746, + 0.2768, + 0.2903, + 0.2722, + 0.2896, + 0.2856, + 0.2906, + 0.2848, + 0.2776, + 0.29, + 0.2918, + 0.2703, + 0.2847, + 0.2838, + 0.2816, + 0.2894, + 0.2815, + 0.2783, + 0.2917, + 0.2712, + 0.285, + 0.2861, + 0.2844, + 0.2898, + 0.2839, + 0.2886, + 0.2809, + 0.2826, + 0.2792, + 0.2864, + 0.2978, + 0.2876, + 0.2855, + 0.2997, + 0.2912, + 0.2887, + 0.2867, + 0.2842, + 0.284, + 0.2781, + 0.2817, + 0.2911, + 0.2842, + 0.2834, + 0.2867, + 0.2861, + 0.2867, + 0.284, + 0.2887, + 0.2864, + 0.2875, + 0.2899, + 0.2864, + 0.287, + 0.2901, + 0.2856, + 0.2866, + 0.2863, + 0.2859, + 0.2861, + 0.2861, + 0.2861 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3827235698699951, + -0.000831119017675519 + ], + "perturbation_rho": [ + -0.01562047004699707, + 0.0 + ], + "nudging": { + "0.001": [ + -2.812594175338745e-07, + 0.0 + ], + "0.003": [ + -9.383074939250946e-07, + 0.0 + ], + "0.01": [ + -3.2153911888599396e-06, + 0.0 + ] + }, + "hidden_norms_per_layer": [ + 55950.5390625, + 1669607168.0, + 3780465152.0 + ], + "bp_grad_norms_per_layer": [ + 2.2658105081063695e-07, + 2.3708951468748296e-10, + 2.3738841448128767e-10 + ] + }, + "drift": { + "embed.weight": 337.5136698692365, + "embed.bias": 273.5401823379648, + "blocks.0.ln.weight": 9.322317945209601, + "blocks.0.w1.weight": 322.0064838288751, + "blocks.0.w1.bias": 292.5825702677452, + "blocks.0.w2.weight": 505.89197780725414, + "blocks.1.ln.weight": 9.09606961243359, + "blocks.1.w1.weight": 353.39130820313096, + "blocks.1.w1.bias": 346.5478039461049, + "blocks.1.w2.weight": 349.3876744406949, + "out_ln.weight": 0.435883262668521, + "out_head.weight": 7.086345015239166, + "out_head.bias": 3.9170311167015974 + } + }, + "fa": { + "log": { + "train_loss": [ + 2.083539034461975, + 1.9695448753356934, + 1.9397349642562867, + 1.9066173551177978, + 1.886961284866333, + 1.8710758205795288, + 1.8628956564331054, + 1.8567623680877685, + 1.8501425790405273, + 1.850063798828125, + 1.8536383200073243, + 1.851845763206482, + 1.8578751723480225, + 1.8505859604263306, + 1.8504567489242554, + 1.8505229975128175, + 1.8486209188079834, + 1.8476799687957763, + 1.8461452635192872, + 1.8506561833953858, + 1.8442412594985962, + 1.8458462058258056, + 1.842808702659607, + 1.8387870932769776, + 1.8379171523666382, + 1.828637089920044, + 1.824536803894043, + 1.822955154800415, + 1.8200513568878174, + 1.814583374671936, + 1.8130536968231201, + 1.8116273685073851, + 1.810110004234314, + 1.808945005569458, + 1.8023032517242432, + 1.8105073015975952, + 1.81240649143219, + 1.8092195032501222, + 1.8054952936172486, + 1.8071781116485595, + 1.8033202910614015, + 1.8002542707061768, + 1.7996792233276366, + 1.794723889541626, + 1.788533415184021, + 1.7873220053100587, + 1.7867383001327515, + 1.7845936785888672, + 1.7811818826675414, + 1.7822032886505126, + 1.7786470770263672, + 1.7798991229629517, + 1.7747682898712158, + 1.771372130050659, + 1.7732186395645142, + 1.767907095336914, + 1.7648547525405884, + 1.7638111727523804, + 1.7647753219223024, + 1.7633140285491944, + 1.758088468322754, + 1.7619236371612548, + 1.7579612891006469, + 1.7559792065811157, + 1.7589319384002686, + 1.7530268384170533, + 1.7540921353530883, + 1.7525135382080077, + 1.7494160869979858, + 1.7476271326446533, + 1.7485824377059938, + 1.7481532715225219, + 1.7493890603256226, + 1.753240061607361, + 1.7450246924209594, + 1.7479931283950805, + 1.7435640298461914, + 1.7442714694595336, + 1.7464028844833375, + 1.7440459408950806, + 1.7451819785308837, + 1.7424172634124755, + 1.7414722381591796, + 1.7440056212997437, + 1.7441547555160521, + 1.741508984413147, + 1.7379715420913697, + 1.743159959335327, + 1.737216314048767, + 1.73957718044281, + 1.7399621460342407, + 1.7403172652435304, + 1.7397853451919556, + 1.7367944290161133, + 1.7394116397476196, + 1.7405242685317994, + 1.7411947003173829, + 1.7401781003189087, + 1.7426191668319702, + 1.7414960692977905 + ], + "train_acc": [ + 0.24206, + 0.28608, + 0.30284, + 0.31378, + 0.32214, + 0.33222, + 0.33458, + 0.33384, + 0.339, + 0.3365, + 0.33642, + 0.33268, + 0.3321, + 0.3336, + 0.33528, + 0.33412, + 0.3342, + 0.33516, + 0.3349, + 0.3369, + 0.33338, + 0.33768, + 0.3359, + 0.3389, + 0.33848, + 0.33996, + 0.34268, + 0.34516, + 0.34514, + 0.34766, + 0.3483, + 0.35214, + 0.34858, + 0.34992, + 0.35344, + 0.35134, + 0.34842, + 0.35144, + 0.35262, + 0.35272, + 0.35618, + 0.35276, + 0.35816, + 0.3578, + 0.35874, + 0.3609, + 0.36208, + 0.3595, + 0.3629, + 0.36296, + 0.36438, + 0.36234, + 0.3654, + 0.36716, + 0.36458, + 0.36772, + 0.36752, + 0.36904, + 0.3677, + 0.3659, + 0.3724, + 0.36748, + 0.37008, + 0.37166, + 0.37228, + 0.37126, + 0.37246, + 0.3711, + 0.37376, + 0.3725, + 0.37384, + 0.37248, + 0.37364, + 0.37298, + 0.37408, + 0.37304, + 0.37604, + 0.37672, + 0.3764, + 0.37472, + 0.37532, + 0.3761, + 0.37432, + 0.37696, + 0.3772, + 0.37738, + 0.37684, + 0.37452, + 0.37578, + 0.37302, + 0.37482, + 0.3745, + 0.37608, + 0.37402, + 0.37522, + 0.37624, + 0.377, + 0.37676, + 0.37804, + 0.3765 + ], + "test_acc": [ + 0.2873, + 0.2968, + 0.3102, + 0.3278, + 0.3267, + 0.3394, + 0.3594, + 0.3508, + 0.348, + 0.3577, + 0.3237, + 0.3288, + 0.3256, + 0.3468, + 0.3314, + 0.3353, + 0.3342, + 0.3343, + 0.3363, + 0.3386, + 0.3359, + 0.3401, + 0.3353, + 0.3296, + 0.3361, + 0.3547, + 0.3367, + 0.342, + 0.3335, + 0.3402, + 0.3509, + 0.3259, + 0.3411, + 0.342, + 0.3459, + 0.3338, + 0.3447, + 0.3462, + 0.3413, + 0.3409, + 0.3561, + 0.3417, + 0.3429, + 0.3539, + 0.3554, + 0.3409, + 0.3557, + 0.3535, + 0.3559, + 0.3474, + 0.3477, + 0.3647, + 0.3483, + 0.337, + 0.3458, + 0.3461, + 0.3488, + 0.3399, + 0.351, + 0.3393, + 0.3521, + 0.3505, + 0.354, + 0.3489, + 0.3421, + 0.3435, + 0.3427, + 0.345, + 0.3509, + 0.3393, + 0.3513, + 0.3592, + 0.3435, + 0.3491, + 0.3462, + 0.3486, + 0.3435, + 0.3421, + 0.3463, + 0.3537, + 0.3507, + 0.3476, + 0.3523, + 0.346, + 0.3548, + 0.3469, + 0.3489, + 0.3457, + 0.3483, + 0.3495, + 0.3507, + 0.3498, + 0.3509, + 0.3498, + 0.3485, + 0.3503, + 0.3507, + 0.3502, + 0.3501, + 0.3501 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.03285929560661316, + 0.9476211071014404 + ], + "perturbation_rho": [ + 0.010396776720881462, + 0.21192286908626556 + ], + "nudging": { + "0.001": [ + -4.190136678516865e-06, + -7.935799658298492e-06 + ], + "0.003": [ + -1.2663658708333969e-05, + -2.3964676074683666e-05 + ], + "0.01": [ + -4.219170659780502e-05, + -8.006719872355461e-05 + ] + }, + "hidden_norms_per_layer": [ + 3884.70703125, + 284714.21875, + 219214.828125 + ], + "bp_grad_norms_per_layer": [ + 1.9074828742304817e-05, + 6.634672331529146e-07, + 6.522877811221406e-07 + ] + }, + "drift": { + "embed.weight": 27.016438956012585, + "embed.bias": 16.969540152339597, + "blocks.0.ln.weight": 1.5836171150936886, + "blocks.0.w1.weight": 25.706341628627694, + "blocks.0.w1.bias": 21.000244171066868, + "blocks.0.w2.weight": 64.31974159860198, + "blocks.1.ln.weight": 0.9270002241369442, + "blocks.1.w1.weight": 14.313388328940205, + "blocks.1.w1.bias": 6.9567229997624445, + "blocks.1.w2.weight": 31.78188983358227, + "out_ln.weight": 0.46949971605667673, + "out_head.weight": 3.9796491257565023, + "out_head.bias": 12.763196315235756 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 2, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 4 + ], + "gpu": 0, + "output_dir": "results/fa_dfa_d512_L2_seed4", + "methods": [ + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
