diff options
Diffstat (limited to 'results/fa_dfa_d512_L2_seed6/results_cifar10.json')
| -rw-r--r-- | results/fa_dfa_d512_L2_seed6/results_cifar10.json | 749 |
1 files changed, 749 insertions, 0 deletions
diff --git a/results/fa_dfa_d512_L2_seed6/results_cifar10.json b/results/fa_dfa_d512_L2_seed6/results_cifar10.json new file mode 100644 index 0000000..a0da849 --- /dev/null +++ b/results/fa_dfa_d512_L2_seed6/results_cifar10.json @@ -0,0 +1,749 @@ +{ + "6": { + "dfa": { + "log": { + "train_loss": [ + 2.055892396621704, + 2.0292765501403807, + 2.023764776611328, + 2.020959409866333, + 2.019423359222412, + 2.0197315069580077, + 2.023359367675781, + 2.017872388153076, + 2.01921712928772, + 2.0194658319854737, + 2.021274960708618, + 2.016373544845581, + 2.0175488451766967, + 2.0179581134796143, + 2.0176988045501707, + 2.0177309605407716, + 2.0153829962921144, + 2.013690803070068, + 2.016160803833008, + 2.012104736251831, + 2.0164508349990844, + 2.0172074625396728, + 2.011329041824341, + 2.014233197860718, + 2.0119160061264036, + 2.0112428046417237, + 2.0135288095092774, + 2.0137764200592043, + 2.0114110033416748, + 2.011166734046936, + 2.01347174949646, + 2.0128866384887694, + 2.012690868988037, + 2.0142732004547117, + 2.013253126296997, + 2.012407520980835, + 2.0118109189605713, + 2.012256015167236, + 2.0096606398773194, + 2.010287212905884, + 2.0091940085601805, + 2.0101572361755373, + 2.0091212350845336, + 2.010151270904541, + 2.0109262997817994, + 2.0077846411514284, + 2.0088822582626342, + 2.0098557024383545, + 2.0110063369750977, + 2.0083373790740966, + 2.0075834423828125, + 2.0072854569244383, + 2.0076236277771, + 2.009549726829529, + 2.00914709564209, + 2.0072284757232666, + 2.0073054156112673, + 2.008326266860962, + 2.0065047761535646, + 2.0040750775527956, + 2.008966516571045, + 2.006659435195923, + 2.006130950393677, + 2.0071768866729736, + 2.004858699607849, + 2.005933465194702, + 2.0051698098754884, + 2.0040941329193114, + 2.004839565887451, + 2.004348826370239, + 2.0043614904785154, + 2.005439692611694, + 2.0047981397247314, + 2.0036350199127195, + 2.0039494177627564, + 2.002428635940552, + 2.002635501022339, + 2.005249846954346, + 2.0045922426605225, + 1.9999085303497315, + 2.0022091399383544, + 2.001223135147095, + 2.005691502914429, + 2.0016508586883544, + 2.0019130290222167, + 2.0011878201293944, + 2.002061458091736, + 2.001959662628174, + 2.0005823556518556, + 2.003897890167236, + 2.003386359901428, + 2.0019060565185547, + 2.0028662380981443, + 2.000936403427124, + 2.003748550567627, + 2.00183758392334, + 2.001099390411377, + 2.002016563873291, + 2.001500345993042, + 2.000833380355835 + ], + "train_acc": [ + 0.2468, + 0.25656, + 0.2583, + 0.25842, + 0.26294, + 0.26512, + 0.25982, + 0.26482, + 0.26072, + 0.26388, + 0.25908, + 0.26332, + 0.26268, + 0.26474, + 0.26364, + 0.26604, + 0.2647, + 0.26542, + 0.26462, + 0.26776, + 0.26296, + 0.26282, + 0.26768, + 0.2662, + 0.26584, + 0.26868, + 0.26712, + 0.2637, + 0.26642, + 0.2643, + 0.26304, + 0.2664, + 0.26832, + 0.2695, + 0.26582, + 0.26628, + 0.2661, + 0.26608, + 0.26796, + 0.26702, + 0.26834, + 0.26798, + 0.27016, + 0.26738, + 0.2666, + 0.26772, + 0.26924, + 0.2708, + 0.26744, + 0.26734, + 0.27232, + 0.26954, + 0.27186, + 0.2691, + 0.26756, + 0.27156, + 0.26944, + 0.26982, + 0.27, + 0.2734, + 0.27014, + 0.27428, + 0.2721, + 0.27192, + 0.27394, + 0.27134, + 0.2706, + 0.27214, + 0.2724, + 0.27452, + 0.27194, + 0.27366, + 0.273, + 0.27294, + 0.2731, + 0.27446, + 0.27392, + 0.2735, + 0.274, + 0.2742, + 0.2727, + 0.27306, + 0.27192, + 0.27572, + 0.27528, + 0.27414, + 0.2743, + 0.27318, + 0.27448, + 0.27334, + 0.27238, + 0.27438, + 0.27446, + 0.27388, + 0.27336, + 0.27486, + 0.27176, + 0.27446, + 0.2743, + 0.27204 + ], + "test_acc": [ + 0.2713, + 0.2844, + 0.2811, + 0.28, + 0.299, + 0.2643, + 0.2824, + 0.2917, + 0.2912, + 0.2738, + 0.2633, + 0.2873, + 0.285, + 0.2787, + 0.2918, + 0.2776, + 0.2763, + 0.278, + 0.2677, + 0.2808, + 0.2944, + 0.2953, + 0.2923, + 0.2954, + 0.297, + 0.2825, + 0.2932, + 0.2826, + 0.2908, + 0.285, + 0.2799, + 0.2848, + 0.3029, + 0.2813, + 0.2915, + 0.2709, + 0.3065, + 0.2788, + 0.3023, + 0.2961, + 0.2864, + 0.2937, + 0.297, + 0.3001, + 0.2957, + 0.282, + 0.2855, + 0.2917, + 0.2897, + 0.2983, + 0.2881, + 0.2843, + 0.2775, + 0.2932, + 0.2953, + 0.2891, + 0.3012, + 0.2843, + 0.2914, + 0.2863, + 0.2978, + 0.2948, + 0.2863, + 0.2944, + 0.2897, + 0.2924, + 0.2925, + 0.2939, + 0.2888, + 0.2956, + 0.2964, + 0.2878, + 0.2855, + 0.2904, + 0.2999, + 0.2861, + 0.3025, + 0.2935, + 0.2953, + 0.2878, + 0.2974, + 0.2959, + 0.2944, + 0.2924, + 0.2937, + 0.2953, + 0.2911, + 0.2938, + 0.2924, + 0.2938, + 0.2953, + 0.2933, + 0.2955, + 0.2954, + 0.2939, + 0.2937, + 0.2938, + 0.2936, + 0.2933, + 0.2933 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.3805140256881714, + -0.00048614124534651637 + ], + "perturbation_rho": [ + 0.010780533775687218, + 0.0 + ], + "nudging": { + "0.001": [ + -3.3294782042503357e-07, + 0.0 + ], + "0.003": [ + -1.0631047189235687e-06, + 0.0 + ], + "0.01": [ + -3.623776137828827e-06, + 9.313225746154785e-10 + ] + }, + "hidden_norms_per_layer": [ + 54183.453125, + 1543298944.0, + 3004247040.0 + ], + "bp_grad_norms_per_layer": [ + 2.45587500558031e-07, + 3.692772754249063e-10, + 3.6931127600503544e-10 + ] + }, + "drift": { + "embed.weight": 334.1717985048247, + "embed.bias": 247.7536312263247, + "blocks.0.ln.weight": 9.54033246951961, + "blocks.0.w1.weight": 315.1784989948421, + "blocks.0.w1.bias": 269.25844995073356, + "blocks.0.w2.weight": 501.0628341707343, + "blocks.1.ln.weight": 8.010501646129491, + "blocks.1.w1.weight": 317.0441501524571, + "blocks.1.w1.bias": 304.79370018295725, + "blocks.1.w2.weight": 308.3494986335005, + "out_ln.weight": 0.4575791541009348, + "out_head.weight": 6.637383076518475, + "out_head.bias": 3.6615792171842636 + } + }, + "fa": { + "log": { + "train_loss": [ + 2.065024294166565, + 1.9630456279754638, + 1.9233733417129517, + 1.9067592349243163, + 1.8861662637329102, + 1.8703109120941162, + 1.8611061660766601, + 1.8445787530899047, + 1.829258919067383, + 1.8199622161102296, + 1.8095393975448608, + 1.7991895624542236, + 1.79670791015625, + 1.7896576220321656, + 1.7787932138061524, + 1.777765901145935, + 1.768475433731079, + 1.7715507403945923, + 1.7699084145736694, + 1.7577085567474364, + 1.7492800643539428, + 1.7376883664703369, + 1.7303459451293945, + 1.7293071484375, + 1.7250730394744873, + 1.726899693222046, + 1.7227447848129271, + 1.7317372454452515, + 1.7304015692138672, + 1.7312020352172852, + 1.7351370712280274, + 1.7342145778656006, + 1.7334492336654663, + 1.731919374732971, + 1.7354538122940064, + 1.7322556600952148, + 1.7360534030914307, + 1.7412740663909911, + 1.7402722408676148, + 1.7424089098358155, + 1.7433867425918579, + 1.7484364804077148, + 1.7482806644058229, + 1.7441494891738891, + 1.7457399251937866, + 1.740269787902832, + 1.7429518072128296, + 1.7410654845428466, + 1.7409823212432862, + 1.7343881818008422, + 1.736907575340271, + 1.7340854137802124, + 1.734343325843811, + 1.7312401904296875, + 1.7296781457138062, + 1.7250156705474853, + 1.7303392902374268, + 1.7267954447174072, + 1.7268179355621338, + 1.7248962731552124, + 1.7265133374786377, + 1.725437378578186, + 1.7230116376495361, + 1.721951872406006, + 1.7212245053482056, + 1.7194156966781615, + 1.7177197817993164, + 1.7192226972198486, + 1.7195494704437255, + 1.7167850009536743, + 1.7179081740570068, + 1.7162539065551758, + 1.7143080168914795, + 1.7166276223373413, + 1.716199371986389, + 1.7125089855957032, + 1.7071118188858032, + 1.7140238445281983, + 1.711059020729065, + 1.7108189041137696, + 1.7138464722061157, + 1.712218090133667, + 1.7137628644561766, + 1.7120113299179076, + 1.7139518783950807, + 1.7121368927383422, + 1.7085959339523316, + 1.7080107479095459, + 1.7105122137069702, + 1.7120901413345337, + 1.7093008170318604, + 1.707778765335083, + 1.7079006521987916, + 1.7071793605804444, + 1.7064016004180909, + 1.7067470293426514, + 1.7087606598281861, + 1.7090342914581298, + 1.707086050338745, + 1.7054454077911376 + ], + "train_acc": [ + 0.24472, + 0.28828, + 0.3077, + 0.31704, + 0.32668, + 0.33122, + 0.3323, + 0.3406, + 0.34542, + 0.35004, + 0.35242, + 0.3556, + 0.35868, + 0.36042, + 0.36382, + 0.36434, + 0.3649, + 0.36774, + 0.36866, + 0.36968, + 0.37606, + 0.3764, + 0.3827, + 0.38044, + 0.38462, + 0.38274, + 0.38134, + 0.3805, + 0.38172, + 0.38162, + 0.37954, + 0.3812, + 0.38154, + 0.38246, + 0.38214, + 0.38156, + 0.38276, + 0.37756, + 0.37994, + 0.37818, + 0.37948, + 0.3745, + 0.3761, + 0.37776, + 0.37658, + 0.37964, + 0.3789, + 0.37938, + 0.37994, + 0.38366, + 0.38024, + 0.38026, + 0.38234, + 0.38264, + 0.38382, + 0.38478, + 0.3855, + 0.38412, + 0.38446, + 0.38598, + 0.38618, + 0.38722, + 0.38892, + 0.3878, + 0.38716, + 0.38748, + 0.38934, + 0.3868, + 0.391, + 0.39034, + 0.39048, + 0.39066, + 0.39448, + 0.3907, + 0.39146, + 0.39476, + 0.39424, + 0.39456, + 0.39384, + 0.3942, + 0.39406, + 0.39414, + 0.3935, + 0.39276, + 0.39352, + 0.3918, + 0.3955, + 0.39626, + 0.39398, + 0.39516, + 0.3936, + 0.39472, + 0.39608, + 0.39546, + 0.3953, + 0.3935, + 0.39494, + 0.39556, + 0.39782, + 0.39818 + ], + "test_acc": [ + 0.2947, + 0.3403, + 0.3462, + 0.3468, + 0.3593, + 0.3653, + 0.3723, + 0.3689, + 0.372, + 0.3699, + 0.3635, + 0.3648, + 0.3749, + 0.3716, + 0.3759, + 0.3936, + 0.3903, + 0.3867, + 0.3853, + 0.3955, + 0.3909, + 0.4035, + 0.3969, + 0.3965, + 0.3878, + 0.3929, + 0.3895, + 0.3756, + 0.3801, + 0.377, + 0.3725, + 0.3941, + 0.3851, + 0.3949, + 0.3941, + 0.3753, + 0.3733, + 0.3731, + 0.3846, + 0.3734, + 0.3695, + 0.3857, + 0.3871, + 0.3798, + 0.3841, + 0.3771, + 0.3762, + 0.3814, + 0.3893, + 0.3712, + 0.3673, + 0.3771, + 0.3882, + 0.3816, + 0.3894, + 0.3825, + 0.3915, + 0.369, + 0.3847, + 0.3726, + 0.3876, + 0.3789, + 0.3679, + 0.3797, + 0.3785, + 0.3897, + 0.3758, + 0.3883, + 0.3789, + 0.3812, + 0.375, + 0.3779, + 0.3876, + 0.3884, + 0.3853, + 0.3865, + 0.3874, + 0.3859, + 0.3907, + 0.3826, + 0.385, + 0.3929, + 0.3856, + 0.3809, + 0.385, + 0.3849, + 0.3824, + 0.3854, + 0.3838, + 0.3857, + 0.3835, + 0.3842, + 0.385, + 0.3866, + 0.3864, + 0.3868, + 0.3865, + 0.3866, + 0.3865, + 0.3865 + ] + }, + "diagnostics": { + "bp_cosine": [ + 0.017966898158192635, + 0.9611225724220276 + ], + "perturbation_rho": [ + -0.022423196583986282, + 0.05839487165212631 + ], + "nudging": { + "0.001": [ + -1.0927324183285236e-06, + -6.873218808323145e-06 + ], + "0.003": [ + -3.30101465806365e-06, + -2.0737992599606514e-05 + ], + "0.01": [ + -1.1010735761374235e-05, + -6.911164382472634e-05 + ] + }, + "hidden_norms_per_layer": [ + 5436.04931640625, + 220695.28125, + 94910.3203125 + ], + "bp_grad_norms_per_layer": [ + 2.4236895114881918e-05, + 2.0322845557529945e-06, + 1.8303358046978246e-06 + ] + }, + "drift": { + "embed.weight": 32.57084729521678, + "embed.bias": 26.337782289300907, + "blocks.0.ln.weight": 1.3633438568396286, + "blocks.0.w1.weight": 19.737032593158407, + "blocks.0.w1.bias": 13.272555669066517, + "blocks.0.w2.weight": 55.66342599708415, + "blocks.1.ln.weight": 1.0296837730331478, + "blocks.1.w1.weight": 17.104661462082266, + "blocks.1.w1.bias": 9.996125311409836, + "blocks.1.w2.weight": 40.18024027628224, + "out_ln.weight": 0.49660679931516427, + "out_head.weight": 3.626674560113674, + "out_head.bias": 8.095867414428609 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 512, + "num_blocks": 2, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 6 + ], + "gpu": 0, + "output_dir": "results/fa_dfa_d512_L2_seed6", + "methods": [ + "fa", + "dfa" + ], + "random_targets": false, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
