diff options
Diffstat (limited to 'results/fa_dfa_d512_L2_seed3/results_cifar10.json')
| -rw-r--r-- | results/fa_dfa_d512_L2_seed3/results_cifar10.json | 749 |
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed3/results_cifar10.json b/results/fa_dfa_d512_L2_seed3/results_cifar10.json new file mode 100644 index 0000000..8cf5599 --- /dev/null +++ b/results/fa_dfa_d512_L2_seed3/results_cifar10.json @@ -0,0 +1,749 @@ +{ + "3": { + "dfa": { + "log": { + "train_loss": [ + 2.049092872314453, + 2.044887622756958, + 2.062239527206421, + 2.0690095069122316, + 2.0704432483673094, + 2.076322864227295, + 2.0749057723999025, + 2.0722323740005493, + 2.0724080812835695, + 2.072884361419678, + 2.0764317562866212, + 2.070321410064697, + 2.0702889765930177, + 2.067789299621582, + 2.0646444761657716, + 2.0636547829818728, + 2.062572795333862, + 2.0582885260772703, + 2.059502869415283, + 2.0571998697280884, + 2.0527090773010253, + 2.056031491851807, + 2.0513366117095946, + 2.0520858401870727, + 2.0493150717926025, + 2.0478450300598143, + 2.0498407819366453, + 2.043566691818237, + 2.042290360069275, + 2.039692493896484, + 2.041093152770996, + 2.0399529009246824, + 2.039473579330444, + 2.0396062004089357, + 2.0359111277770996, + 2.0347996918487548, + 2.034452969818115, + 2.033417662200928, + 2.0335788008880615, + 2.0308428141784667, + 2.027684537124634, + 2.0306087942504885, + 2.0288818074798582, + 2.028032119369507, + 2.0284718214416504, + 2.025789548034668, + 2.0262292552948, + 2.023198474197388, + 2.024526604385376, + 2.025226473312378, + 2.0236859022521974, + 2.021138525657654, + 2.022560397567749, + 2.0220771756744385, + 2.0260347727203367, + 2.022141723327637, + 2.021563760910034, + 2.018922806472778, + 2.021806682510376, + 2.0212029346466065, + 2.01982150100708, + 2.019622989349365, + 2.0191136405944823, + 2.0185832523345946, + 2.0185110153961183, + 2.0175517141342163, + 2.0180020709991453, + 2.0152184085845946, + 2.0153978774261474, + 2.017112913208008, + 2.0173879592895507, + 2.0179903555297853, + 2.013354239501953, + 2.016451063537598, + 2.013973571510315, + 2.018112847671509, + 2.015232135925293, + 2.014464662742615, + 2.0156791037368773, + 2.0115500025177, + 2.014401368560791, + 2.0142960264587404, + 2.012123734397888, + 2.0130788822937014, + 2.0141370764923097, + 2.014659231796265, + 2.0124325815582274, + 2.014389346160889, + 2.0128879175567627, + 2.0132610288238526, + 2.014250590438843, + 2.012836150970459, + 2.0106287144470216, + 2.014688469619751, + 2.0122887326812746, + 2.01329588142395, + 2.0123015225601195, + 2.010611874694824, + 2.015006597442627, + 2.0157135874176024 + ], + "train_acc": [ + 0.25188, + 0.25386, + 0.24578, + 0.2458, + 0.24326, + 0.2434, + 0.23896, + 0.24338, + 0.24348, + 0.24286, + 0.24246, + 0.24364, + 0.24108, + 0.24176, + 0.24598, + 0.24638, + 0.24538, + 0.24996, + 0.24744, + 0.24802, + 0.25254, + 0.2511, + 0.2547, + 0.2523, + 0.25268, + 0.25586, + 0.2522, + 0.25328, + 0.25624, + 0.25838, + 0.25822, + 0.25672, + 0.25938, + 0.25924, + 0.25908, + 0.259, + 0.2602, + 0.26116, + 0.26152, + 0.2633, + 0.26614, + 0.2616, + 0.26606, + 0.26386, + 0.26708, + 0.26482, + 0.2682, + 0.26386, + 0.26484, + 0.26862, + 0.26774, + 0.26798, + 0.2692, + 0.2687, + 0.26776, + 0.27036, + 0.26802, + 0.2715, + 0.26714, + 0.27108, + 0.27032, + 0.27288, + 0.271, + 0.27048, + 0.26948, + 0.27382, + 0.27056, + 0.27404, + 0.27162, + 0.27054, + 0.27232, + 0.27328, + 0.27242, + 0.26978, + 0.2725, + 0.27236, + 0.27228, + 0.27282, + 0.27318, + 0.2746, + 0.27434, + 0.27072, + 0.27108, + 0.2737, + 0.273, + 0.2735, + 0.27328, + 0.2745, + 0.27388, + 0.27212, + 0.2744, + 0.27352, + 0.2723, + 0.27264, + 0.27482, + 0.2727, + 0.2734, + 0.27328, + 0.27136, + 0.27322 + ], + "test_acc": [ + 0.2855, + 0.2551, + 0.2775, + 0.2743, + 0.2562, + 0.2696, + 0.2672, + 0.2538, + 0.2753, + 0.2372, + 0.2459, + 0.2719, + 0.2666, + 0.2665, + 0.2673, + 0.2632, + 0.2686, + 0.2624, + 0.2753, + 0.2718, + 0.2735, + 0.2621, + 0.2539, + 0.247, + 0.2764, + 0.2782, + 0.2758, + 0.2809, + 0.2735, + 0.2648, + 0.2652, + 0.2743, + 0.2866, + 0.2829, + 0.2732, + 0.2647, + 0.282, + 0.2671, + 0.2715, + 0.2861, + 0.2807, + 0.2831, + 0.2899, + 0.2743, + 0.2842, + 0.2796, + 0.2721, + 0.2816, + 0.2874, + 0.2873, + 0.2878, + 0.2746, + 0.2911, + 0.2938, + 0.2945, + 0.2906, + 0.2921, + 0.2921, + 0.2867, + 0.2754, + 0.2951, + 0.2874, + 0.2816, + 0.2894, + 0.2686, + 0.277, + 0.2915, + 0.295, + 0.2958, + 0.2885, + 0.2861, + 0.2907, + 0.2913, + 0.2959, + 0.2897, + 0.2872, + 0.2932, + 0.2882, + 0.2933, + 0.2942, + 0.2939, + 0.2946, + 0.2902, + 0.2888, + 0.2957, + 0.2944, + 0.2917, + 0.294, + 0.2895, + 0.2908, + 0.2929, + 0.2916, + 0.2912, + 0.2927, + 0.2923, + 0.2931, + 0.2924, + 0.2923, + 0.2925, + 0.2922 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3577328324317932, + -0.002256808802485466 + ], + "perturbation_rho": [ + 0.006564013194292784, + 0.0245413389056921 + ], + "nudging": { + "0.001": [ + -3.3527612686157227e-07, + 0.0 + ], + "0.003": [ + -9.671784937381744e-07, + 9.313225746154785e-10 + ], + "0.01": [ + -3.1115487217903137e-06, + 3.725290298461914e-09 + ] + }, + "hidden_norms_per_layer": [ + 61062.07421875, + 1830187136.0, + 2154652416.0 + ], + "bp_grad_norms_per_layer": [ + 2.2415125044972228e-07, + 2.5406721171350455e-10, + 2.541881982676131e-10 + ] + }, + "drift": { + "embed.weight": 362.6998630270425, + "embed.bias": 226.82991769893152, + "blocks.0.ln.weight": 11.27242096475318, + "blocks.0.w1.weight": 342.7047730991574, + "blocks.0.w1.bias": 255.335818330469, + "blocks.0.w2.weight": 571.0736810874553, + "blocks.1.ln.weight": 6.709290843015378, + "blocks.1.w1.weight": 234.88441196904554, + "blocks.1.w1.bias": 208.6820413337303, + "blocks.1.w2.weight": 259.6972453610996, + "out_ln.weight": 0.47275142976863993, + "out_head.weight": 5.14258998677984, + "out_head.bias": 3.632529706269454 + } + }, + "fa": { + "log": { + "train_loss": [ + 2.062916795501709, + 1.9544608277130127, + 1.9338681225204468, + 1.9168871939468384, + 1.8961386334609986, + 1.8842207279205323, + 1.8664908053970337, + 1.8596847631454467, + 1.8500450038909912, + 1.8418613220596314, + 1.8393701876449584, + 1.828501918258667, + 1.8237099225234985, + 1.8169598587799072, + 1.8136948993682862, + 1.8099042462539672, + 1.8040387533569335, + 1.7993673914337158, + 1.801761696434021, + 1.7964957051849366, + 1.7922449420166016, + 1.7918584114837646, + 1.7928801208496095, + 1.7959136298370362, + 1.7932421494293214, + 1.7945690915298462, + 1.798325119857788, + 1.7924271218490602, + 1.795842142982483, + 1.786767998275757, + 1.7907304748153687, + 1.7930365305328368, + 1.7880332135009767, + 1.7910264099884032, + 1.786202894821167, + 1.7834789249038696, + 1.7853226938247682, + 1.7844206839752197, + 1.779783320388794, + 1.777475042037964, + 1.7763150534820558, + 1.7789424829101563, + 1.7754264488983154, + 1.7715616805648804, + 1.7733828824615478, + 1.7673900942993164, + 1.7679843439102172, + 1.7700712796020508, + 1.7681101821517944, + 1.763485518951416, + 1.7642558453369142, + 1.7612942028427123, + 1.7610017293548583, + 1.7577664344024657, + 1.7626592459869386, + 1.7603577539443969, + 1.754944856262207, + 1.7521989233398438, + 1.7558432748031616, + 1.757179810218811, + 1.7534725143051146, + 1.7556944265365602, + 1.7504646623992919, + 1.7463257875823974, + 1.7487027013397216, + 1.7462505680084228, + 1.7486760431289672, + 1.7459170078277588, + 1.740626848487854, + 1.7471276846694945, + 1.7445780047225952, + 1.743365991783142, + 1.7377847635650634, + 1.7428057806396484, + 1.7423382642364502, + 1.739464909362793, + 1.7394498482513427, + 1.7388129167556763, + 1.743233028869629, + 1.7352628125, + 1.740815905380249, + 1.7376227493667602, + 1.7356027941894532, + 1.7353747326278686, + 1.7357349237060546, + 1.7323332436370849, + 1.7330560940170288, + 1.736462532081604, + 1.7307056594085692, + 1.7358304736709596, + 1.7327582055282593, + 1.7328367833709717, + 1.730865809020996, + 1.7343174131011962, + 1.7336546128082275, + 1.729335763282776, + 1.731069825515747, + 1.7309973764801025, + 1.7332309117889404, + 1.7309427404022217 + ], + "train_acc": [ + 0.25124, + 0.29078, + 0.30174, + 0.30854, + 0.31558, + 0.32094, + 0.32596, + 0.32986, + 0.3375, + 0.33924, + 0.34048, + 0.34462, + 0.34806, + 0.34818, + 0.34936, + 0.35036, + 0.35452, + 0.35762, + 0.35606, + 0.35678, + 0.35724, + 0.3556, + 0.35836, + 0.35558, + 0.35872, + 0.35734, + 0.35428, + 0.35594, + 0.35682, + 0.35978, + 0.36006, + 0.35966, + 0.36212, + 0.361, + 0.3593, + 0.36056, + 0.36182, + 0.36036, + 0.3643, + 0.36462, + 0.36522, + 0.3643, + 0.3701, + 0.37198, + 0.36678, + 0.36798, + 0.37018, + 0.3697, + 0.3685, + 0.37262, + 0.36694, + 0.3722, + 0.37228, + 0.37302, + 0.37096, + 0.37208, + 0.3721, + 0.37598, + 0.37528, + 0.37364, + 0.37788, + 0.37682, + 0.37554, + 0.37848, + 0.37854, + 0.3787, + 0.37996, + 0.37764, + 0.3765, + 0.37938, + 0.37982, + 0.38054, + 0.383, + 0.38022, + 0.382, + 0.3806, + 0.38078, + 0.38504, + 0.38192, + 0.38324, + 0.38318, + 0.38192, + 0.38326, + 0.38492, + 0.38542, + 0.38452, + 0.3843, + 0.38424, + 0.38694, + 0.38464, + 0.38664, + 0.3882, + 0.38476, + 0.3842, + 0.38732, + 0.38674, + 0.38546, + 0.38734, + 0.38404, + 0.38848 + ], + "test_acc": [ + 0.2764, + 0.3182, + 0.3354, + 0.3476, + 0.3539, + 0.339, + 0.3478, + 0.3737, + 0.3595, + 0.3642, + 0.3624, + 0.3739, + 0.3717, + 0.3809, + 0.3776, + 0.3763, + 0.3824, + 0.3807, + 0.3754, + 0.3832, + 0.3864, + 0.391, + 0.3762, + 0.3797, + 0.3875, + 0.3857, + 0.3897, + 0.3769, + 0.3752, + 0.3835, + 0.3795, + 0.3635, + 0.3828, + 0.3894, + 0.3827, + 0.3777, + 0.3865, + 0.3855, + 0.3863, + 0.3865, + 0.3888, + 0.3807, + 0.3986, + 0.3886, + 0.389, + 0.3891, + 0.3782, + 0.384, + 0.3912, + 0.3924, + 0.3923, + 0.3923, + 0.3917, + 0.3969, + 0.3968, + 0.3932, + 0.3964, + 0.3876, + 0.3991, + 0.3852, + 0.4036, + 0.3989, + 0.3858, + 0.3974, + 0.3968, + 0.4013, + 0.403, + 0.4009, + 0.3967, + 0.3979, + 0.397, + 0.3962, + 0.3943, + 0.4013, + 0.4027, + 0.3986, + 0.4013, + 0.3944, + 0.4021, + 0.3941, + 0.3972, + 0.3984, + 0.4003, + 0.3986, + 0.3997, + 0.3989, + 0.3996, + 0.4009, + 0.4004, + 0.3993, + 0.4001, + 0.3999, + 0.4013, + 0.4007, + 0.4007, + 0.4011, + 0.401, + 0.4007, + 0.4011, + 0.4012 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.018671220168471336, + 0.9215916395187378 + ], + "perturbation_rho": [ + 0.05869613587856293, + -0.006530101411044598 + ], + "nudging": { + "0.001": [ + -1.8319697119295597e-06, + -3.306486178189516e-06 + ], + "0.003": [ + -5.463924026116729e-06, + -1.0309304343536496e-05 + ], + "0.01": [ + -1.8201360944658518e-05, + -3.473513061180711e-05 + ] + }, + "hidden_norms_per_layer": [ + 6274.154296875, + 343870.53125, + 375719.59375 + ], + "bp_grad_norms_per_layer": [ + 2.1775536879431456e-05, + 1.1024598052244983e-06, + 8.687474064572598e-07 + ] + }, + "drift": { + "embed.weight": 47.037152107454325, + "embed.bias": 16.388390598893867, + "blocks.0.ln.weight": 1.5269469673782543, + "blocks.0.w1.weight": 25.58456877637686, + "blocks.0.w1.bias": 18.02406186908715, + "blocks.0.w2.weight": 64.17096592056014, + "blocks.1.ln.weight": 1.3407223784512263, + "blocks.1.w1.weight": 21.242765670034206, + "blocks.1.w1.bias": 17.953849785001406, + "blocks.1.w2.weight": 23.00878057790312, + "out_ln.weight": 0.3700761416548859, + "out_head.weight": 5.133209234946238, + "out_head.bias": 3.885876738755204 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 2, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 3 + ], + "gpu": 0, + "output_dir": "results/fa_dfa_d512_L2_seed3", + "methods": [ + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
