diff options
Diffstat (limited to 'results/fa_dfa_d512_L2_seed5/results_cifar10.json')
| -rw-r--r-- | results/fa_dfa_d512_L2_seed5/results_cifar10.json | 749 |
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed5/results_cifar10.json b/results/fa_dfa_d512_L2_seed5/results_cifar10.json new file mode 100644 index 0000000..d5c8ea9 --- /dev/null +++ b/results/fa_dfa_d512_L2_seed5/results_cifar10.json @@ -0,0 +1,749 @@ +{ + "5": { + "dfa": { + "log": { + "train_loss": [ + 2.0501297537231444, + 2.0391713497924804, + 2.0405313035583497, + 2.0335817265319824, + 2.0266058160018923, + 2.0228387924957274, + 2.0232558026504517, + 2.0218732793426515, + 2.0191759132385254, + 2.0202307054901123, + 2.018844593505859, + 2.017033308792114, + 2.018027767868042, + 2.018668871307373, + 2.015074652633667, + 2.015589296875, + 2.016558995742798, + 2.019203759498596, + 2.0183322762298586, + 2.0155471825408937, + 2.018300429916382, + 2.0150776953125, + 2.0150013764953614, + 2.012721175842285, + 2.016366043663025, + 2.012075606918335, + 2.016505323944092, + 2.01135826461792, + 2.0136885620117186, + 2.013543639678955, + 2.013746788291931, + 2.0128848664093018, + 2.012771292114258, + 2.01191774017334, + 2.010462758102417, + 2.010521863632202, + 2.009425925369263, + 2.0124644644546508, + 2.0108147170639037, + 2.010228076095581, + 2.0088936639022825, + 2.0095657570648195, + 2.007657756729126, + 2.009475396652222, + 2.010636301422119, + 2.0098936741638185, + 2.0092102942276, + 2.009080667991638, + 2.007752434120178, + 2.0074822512054444, + 2.011261424026489, + 2.006237863006592, + 2.008023773574829, + 2.0073289957427978, + 2.006207457962036, + 2.0055681369781495, + 2.006566423034668, + 2.0086398764038087, + 2.005377918167114, + 2.008910454864502, + 2.0054182757568357, + 2.0053556463241575, + 2.005029055404663, + 2.0059510985565185, + 2.005951479187012, + 2.0057564875793457, + 2.0048374938964844, + 2.0036859961700437, + 2.005258397903442, + 2.005781553649902, + 2.004468630065918, + 2.0044502724456787, + 2.0023633781433103, + 2.002619049530029, + 2.003770675506592, + 2.0034406785583494, + 2.0038263823699953, + 2.004770489578247, + 2.0045603427505494, + 2.003471921005249, + 2.0053932760620117, + 2.002159836387634, + 2.0036436273574827, + 2.002813849029541, + 2.00232444770813, + 2.0031388371276857, + 2.003156742095947, + 2.0042506001281737, + 2.001820291137695, + 2.0023800246810914, + 2.0012053105926513, + 2.0006055866241454, + 2.0019854052352906, + 2.001209078979492, + 2.0008096754455567, + 2.0021328547668458, + 2.0031403130340575, + 1.9998649573516847, + 2.002096244430542, + 2.0019282162475585 + ], + "train_acc": [ + 0.25066, + 0.25648, + 0.25718, + 0.25752, + 0.26214, + 0.26184, + 0.26432, + 0.2653, + 0.26402, + 0.26416, + 0.26932, + 0.26444, + 0.26816, + 0.26564, + 0.2684, + 0.27134, + 0.26932, + 0.267, + 0.26686, + 0.26922, + 0.26814, + 0.26974, + 0.2686, + 0.26834, + 0.2661, + 0.26928, + 0.26724, + 0.26998, + 0.26744, + 0.26994, + 0.26896, + 0.2696, + 0.26804, + 0.2696, + 0.27204, + 0.26932, + 0.27152, + 0.26992, + 0.27178, + 0.27218, + 0.27082, + 0.27092, + 0.2737, + 0.27122, + 0.27138, + 0.27174, + 0.272, + 0.2722, + 0.2723, + 0.27346, + 0.26892, + 0.27434, + 0.27432, + 0.27238, + 0.27332, + 0.27454, + 0.27508, + 0.27256, + 0.27376, + 0.27296, + 0.27436, + 0.27456, + 0.27532, + 0.27364, + 0.2735, + 0.27452, + 0.27372, + 0.27588, + 0.27558, + 0.27532, + 0.27558, + 0.2755, + 0.27522, + 0.27524, + 0.2758, + 0.27718, + 0.27532, + 0.27618, + 0.27686, + 0.27688, + 0.27632, + 0.27328, + 0.27464, + 0.27712, + 0.27804, + 0.27666, + 0.2755, + 0.27784, + 0.27688, + 0.27586, + 0.27696, + 0.27672, + 0.27692, + 0.2786, + 0.27814, + 0.27484, + 0.27636, + 0.27772, + 0.27436, + 0.27908 + ], + "test_acc": [ + 0.2723, + 0.2812, + 0.2672, + 0.2819, + 0.2601, + 0.279, + 0.2898, + 0.289, + 0.2685, + 0.2896, + 0.2766, + 0.2838, + 0.2792, + 0.2863, + 0.3016, + 0.292, + 0.2951, + 0.2919, + 0.2929, + 0.2842, + 0.2837, + 0.2864, + 0.3007, + 0.2981, + 0.2983, + 0.2929, + 0.2962, + 0.3, + 0.2923, + 0.2989, + 0.2802, + 0.2939, + 0.269, + 0.2905, + 0.278, + 0.2981, + 0.3057, + 0.2984, + 0.3025, + 0.2843, + 0.3007, + 0.2824, + 0.2941, + 0.3064, + 0.284, + 0.2892, + 0.2981, + 0.2894, + 0.2983, + 0.2972, + 0.2969, + 0.2958, + 0.2892, + 0.299, + 0.2959, + 0.2899, + 0.2863, + 0.3044, + 0.2926, + 0.2916, + 0.2983, + 0.2914, + 0.3015, + 0.2956, + 0.2904, + 0.2972, + 0.2893, + 0.289, + 0.2961, + 0.2993, + 0.2911, + 0.289, + 0.2944, + 0.2942, + 0.2955, + 0.2939, + 0.2961, + 0.295, + 0.2949, + 0.2966, + 0.2977, + 0.2997, + 0.2982, + 0.2984, + 0.2965, + 0.2941, + 0.2911, + 0.2957, + 0.2962, + 0.2998, + 0.2916, + 0.2965, + 0.2952, + 0.2956, + 0.2959, + 0.2965, + 0.2957, + 0.296, + 0.2963, + 0.2963 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.38937193155288696, + -0.00133989576715976 + ], + "perturbation_rho": [ + -0.03419807553291321, + 0.0 + ], + "nudging": { + "0.001": [ + -3.7206336855888367e-07, + 0.0 + ], + "0.003": [ + -1.1147931218147278e-06, + 0.0 + ], + "0.01": [ + -3.5390257835388184e-06, + 3.725290298461914e-09 + ] + }, + "hidden_norms_per_layer": [ + 55290.671875, + 1164404992.0, + 1809793664.0 + ], + "bp_grad_norms_per_layer": [ + 2.527334572732798e-07, + 4.3922129822071554e-10, + 4.3930301063532795e-10 + ] + }, + "drift": { + "embed.weight": 334.45692579883826, + "embed.bias": 254.1500844207983, + "blocks.0.ln.weight": 10.378101238923492, + "blocks.0.w1.weight": 277.98485791253944, + "blocks.0.w1.bias": 241.48477586542305, + "blocks.0.w2.weight": 467.05002700094724, + "blocks.1.ln.weight": 6.909499166461763, + "blocks.1.w1.weight": 263.9133275584596, + "blocks.1.w1.bias": 244.87238078164592, + "blocks.1.w2.weight": 283.49051001246613, + "out_ln.weight": 0.43727802835016244, + "out_head.weight": 6.508111271175387, + "out_head.bias": 3.1430989188106846 + } + }, + "fa": { + "log": { + "train_loss": [ + 2.057919206390381, + 1.9476089878845215, + 1.9109919176864625, + 1.8918181984710694, + 1.8734441751861572, + 1.859958696899414, + 1.8465128494644165, + 1.8378619164657592, + 1.8330042699813842, + 1.824237583885193, + 1.82030082321167, + 1.8168681536102296, + 1.8147564684677124, + 1.8174263799285888, + 1.8145158917236328, + 1.8134905625152589, + 1.816219719581604, + 1.8107114935684203, + 1.809884515991211, + 1.8064439716339111, + 1.8076383264160156, + 1.8070710248184203, + 1.799020498085022, + 1.799975090560913, + 1.7974333989715576, + 1.7963496450042724, + 1.8014785760498047, + 1.7986563251113892, + 1.7955734420776368, + 1.7972684210968017, + 1.7941396160125733, + 1.7950014336395264, + 1.7955820244979859, + 1.7959071813201903, + 1.79216160282135, + 1.7948664249038697, + 1.7919580102920531, + 1.7955779486465455, + 1.7922123107147216, + 1.7889366255950927, + 1.7819780150604247, + 1.7830965274429322, + 1.782749061050415, + 1.7800398288726806, + 1.780551498336792, + 1.7743108095932008, + 1.783085387916565, + 1.774484405479431, + 1.7695070098114014, + 1.7732080498504639, + 1.7756617493057252, + 1.7731031243133546, + 1.7697893057632446, + 1.7669785211181641, + 1.7650962362289428, + 1.763043028793335, + 1.7600419904708862, + 1.7632893228912354, + 1.7593432830429077, + 1.7613518405532838, + 1.754806079711914, + 1.7532699264144898, + 1.7546887551498414, + 1.7581820251083373, + 1.751631008605957, + 1.754752312927246, + 1.7504624893951417, + 1.7475749392318725, + 1.751591441116333, + 1.7496289820098876, + 1.748469584388733, + 1.747327193069458, + 1.7421584380722046, + 1.7428951406097413, + 1.7426397796249389, + 1.7432606916046143, + 1.7435048538589477, + 1.7410756462860106, + 1.743000368347168, + 1.7420079108047486, + 1.7423530182266236, + 1.7415100763320923, + 1.7408926866912842, + 1.7403043130874634, + 1.7404012395477295, + 1.7404220779418946, + 1.7388356212615967, + 1.7423903681182862, + 1.7363825454711914, + 1.7398050061035155, + 1.7384051816558839, + 1.7355061944198609, + 1.7398744315338135, + 1.7368783473968505, + 1.7394122046661378, + 1.7361857733154298, + 1.742128964920044, + 1.7403847741699219, + 1.737286774673462, + 1.7390742868041993 + ], + "train_acc": [ + 0.25062, + 0.29808, + 0.31302, + 0.32052, + 0.3262, + 0.33122, + 0.33844, + 0.3404, + 0.34186, + 0.34348, + 0.34654, + 0.34656, + 0.34834, + 0.34672, + 0.3507, + 0.34978, + 0.34784, + 0.35204, + 0.34968, + 0.35226, + 0.35198, + 0.35068, + 0.35748, + 0.35378, + 0.35458, + 0.35536, + 0.35374, + 0.3558, + 0.35606, + 0.35744, + 0.35864, + 0.3575, + 0.35448, + 0.35674, + 0.35792, + 0.3562, + 0.3585, + 0.35812, + 0.35828, + 0.3577, + 0.36192, + 0.36198, + 0.3611, + 0.36338, + 0.36406, + 0.3631, + 0.36, + 0.36512, + 0.36844, + 0.36508, + 0.3646, + 0.36468, + 0.36598, + 0.36518, + 0.3704, + 0.37062, + 0.3711, + 0.37078, + 0.36744, + 0.37034, + 0.37248, + 0.37374, + 0.3702, + 0.37384, + 0.37386, + 0.37256, + 0.3758, + 0.37518, + 0.3727, + 0.37388, + 0.37536, + 0.37548, + 0.37722, + 0.37788, + 0.37788, + 0.37554, + 0.37874, + 0.37764, + 0.37696, + 0.37702, + 0.37834, + 0.37902, + 0.37876, + 0.37774, + 0.37714, + 0.37816, + 0.38042, + 0.37544, + 0.38068, + 0.37858, + 0.38066, + 0.37826, + 0.38016, + 0.3802, + 0.37906, + 0.37884, + 0.37926, + 0.37942, + 0.37788, + 0.37972 + ], + "test_acc": [ + 0.2861, + 0.3325, + 0.3291, + 0.348, + 0.3452, + 0.3574, + 0.3412, + 0.3599, + 0.3485, + 0.3683, + 0.3663, + 0.3682, + 0.3616, + 0.367, + 0.3701, + 0.3702, + 0.3592, + 0.3731, + 0.3691, + 0.3588, + 0.3585, + 0.3754, + 0.3752, + 0.3647, + 0.3568, + 0.3678, + 0.3622, + 0.3687, + 0.3662, + 0.3697, + 0.3614, + 0.3669, + 0.3387, + 0.3594, + 0.3452, + 0.3532, + 0.3488, + 0.3581, + 0.3475, + 0.3599, + 0.3428, + 0.347, + 0.3621, + 0.3565, + 0.3451, + 0.3385, + 0.3365, + 0.3324, + 0.3551, + 0.3452, + 0.353, + 0.3504, + 0.3508, + 0.3448, + 0.3299, + 0.3413, + 0.3342, + 0.3506, + 0.3532, + 0.3428, + 0.3468, + 0.3395, + 0.3551, + 0.3435, + 0.334, + 0.3427, + 0.3352, + 0.3403, + 0.3419, + 0.3374, + 0.3358, + 0.3438, + 0.3401, + 0.3381, + 0.3437, + 0.3412, + 0.3362, + 0.3404, + 0.339, + 0.3406, + 0.3378, + 0.3481, + 0.3449, + 0.3412, + 0.334, + 0.3405, + 0.3431, + 0.3434, + 0.3401, + 0.3446, + 0.3386, + 0.3425, + 0.3413, + 0.3399, + 0.3425, + 0.3407, + 0.3402, + 0.3413, + 0.341, + 0.341 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.01863543502986431, + 0.966240406036377 + ], + "perturbation_rho": [ + 0.049932606518268585, + 0.11253532767295837 + ], + "nudging": { + "0.001": [ + -3.632623702287674e-06, + -7.5231073424220085e-06 + ], + "0.003": [ + -1.0822783224284649e-05, + -2.275872975587845e-05 + ], + "0.01": [ + -3.596034366637468e-05, + -7.59701943024993e-05 + ] + }, + "hidden_norms_per_layer": [ + 3561.231201171875, + 299735.8125, + 271834.53125 + ], + "bp_grad_norms_per_layer": [ + 2.061038867395837e-05, + 5.578897344094003e-07, + 5.395349376158265e-07 + ] + }, + "drift": { + "embed.weight": 25.27185200703667, + "embed.bias": 13.597802808023353, + "blocks.0.ln.weight": 1.7243371838975772, + "blocks.0.w1.weight": 26.803582221943408, + "blocks.0.w1.bias": 17.489010687530495, + "blocks.0.w2.weight": 62.11992968105335, + "blocks.1.ln.weight": 1.1537855920658724, + "blocks.1.w1.weight": 16.75993270124035, + "blocks.1.w1.bias": 9.810533469107403, + "blocks.1.w2.weight": 38.80660527636343, + "out_ln.weight": 0.460453695659119, + "out_head.weight": 4.155803649723169, + "out_head.bias": 13.238295370364474 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 2, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 5 + ], + "gpu": 0, + "output_dir": "results/fa_dfa_d512_L2_seed5", + "methods": [ + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
