diff options
Diffstat (limited to 'results/fa_random_targets_s42/results_cifar10.json')
| -rw-r--r-- | results/fa_random_targets_s42/results_cifar10.json | 411 |
1 files changed, 411 insertions, 0 deletions
diff --git a/results/fa_random_targets_s42/results_cifar10.json b/results/fa_random_targets_s42/results_cifar10.json new file mode 100644 index 0000000..33fa066 --- /dev/null +++ b/results/fa_random_targets_s42/results_cifar10.json @@ -0,0 +1,411 @@ +{ + "42": { + "fa": { + "log": { + "train_loss": [ + 2.3210656842803954, + 2.3150660639953613, + 2.31394060256958, + 2.3137241358184815, + 2.313226750564575, + 2.312898317718506, + 2.3115276292419433, + 2.3112998097229003, + 2.312373881149292, + 2.3112880519104, + 2.3110179233551027, + 2.3094827233886717, + 2.3097055834197997, + 2.309138665313721, + 2.308755371398926, + 2.309352218093872, + 2.3081418705749512, + 2.3084949157714845, + 2.307779687347412, + 2.3071102055358885, + 2.3067180699920655, + 2.306768290481567, + 2.306924085235596, + 2.3063941722869874, + 2.306285163803101, + 2.3056750212860107, + 2.3055725598907473, + 2.3055327081298826, + 2.3053424534606934, + 2.3050209490966798, + 2.3051358866882325, + 2.304873356246948, + 2.3045516327667235, + 2.3042913507080076, + 2.304434557800293, + 2.3042074402618407, + 2.3039160931396485, + 2.304433411102295, + 2.3036191528320313, + 2.3038957733154297, + 2.303670624084473, + 2.303965150299072, + 2.303804924468994, + 2.3035577531433105, + 2.303584457550049, + 2.303571176300049, + 2.30339740234375, + 2.303557454452515, + 2.30346072013855, + 2.3033780017852785, + 2.303559310379028, + 2.3033258779144288, + 2.3033027320098878, + 2.303322297897339, + 2.30284891708374, + 2.3031199270629883, + 2.302974216156006, + 2.3031179604339598, + 2.303074387893677, + 2.3032363694763185, + 2.3030751721191405, + 2.3031637412261965, + 2.3029984189605712, + 2.302961895904541, + 2.3029372912597657, + 2.30282003036499, + 2.3028841104888915, + 2.302927931060791, + 2.30283846572876, + 2.3028817950439455, + 2.302871095428467, + 2.302848546066284, + 2.3027211415863036, + 2.302883378829956, + 2.3028133658599854, + 2.302789750442505, + 2.30266556968689, + 2.3026871818542483, + 2.3026958183288575, + 2.3027067826080323, + 2.302647667160034, + 2.3026781449890135, + 2.3026719428253175, + 2.302752258377075, + 2.3025668229675293, + 2.3027340324401857, + 2.3026700817871095, + 2.3026870487976074, + 2.3026517832946776, + 2.302639422836304, + 2.3026284925842284, + 2.302678219604492, + 2.3025743629455566, + 2.302645079803467, + 2.3026254082489013, + 2.3025657051086426, + 2.302568560562134, + 2.302596629562378, + 2.3026467196655274, + 2.30262910446167 + ], + "train_acc": [ + 0.09916, + 0.09876, + 0.10146, + 0.09992, + 0.10196, + 0.09982, + 0.09806, + 0.10266, + 0.10208, + 0.10162, + 0.10026, + 0.09852, + 0.10096, + 0.09824, + 0.09968, + 0.09992, + 0.10076, + 0.09998, + 0.09878, + 0.10038, + 0.1028, + 0.1005, + 0.09974, + 0.10234, + 0.10008, + 0.10142, + 0.10072, + 0.09942, + 0.09986, + 0.09736, + 0.09932, + 0.09888, + 0.10114, + 0.10054, + 0.09992, + 0.09942, + 0.09802, + 0.09746, + 0.09936, + 0.10052, + 0.09982, + 0.0983, + 0.09972, + 0.0996, + 0.09914, + 0.09954, + 0.1011, + 0.09934, + 0.09846, + 0.10064, + 0.09888, + 0.10058, + 0.10134, + 0.10024, + 0.10182, + 0.1007, + 0.10096, + 0.10038, + 0.1018, + 0.09818, + 0.10196, + 0.10002, + 0.10066, + 0.1021, + 0.09886, + 0.10106, + 0.09934, + 0.0975, + 0.10084, + 0.09938, + 0.1002, + 0.09842, + 0.1023, + 0.09958, + 0.10186, + 0.1014, + 0.10052, + 0.09892, + 0.09954, + 0.10054, + 0.09992, + 0.09962, + 0.10002, + 0.10092, + 0.10188, + 0.099, + 0.10124, + 0.09706, + 0.10042, + 0.10008, + 0.09796, + 0.09966, + 0.10016, + 0.09854, + 0.0991, + 0.10094, + 0.10254, + 0.09996, + 0.09714, + 0.09882 + ], + "test_acc": [ + 0.0948, + 0.0811, + 0.1058, + 0.0925, + 0.1061, + 0.0856, + 0.1171, + 0.1042, + 0.0998, + 0.0894, + 0.0985, + 0.0732, + 0.0858, + 0.0861, + 0.1274, + 0.0628, + 0.1051, + 0.104, + 0.1127, + 0.1045, + 0.1051, + 0.1183, + 0.0754, + 0.0837, + 0.0762, + 0.1063, + 0.1, + 0.0952, + 0.0933, + 0.1226, + 0.1009, + 0.1043, + 0.117, + 0.0946, + 0.0931, + 0.1133, + 0.0955, + 0.0995, + 0.0942, + 0.0837, + 0.109, + 0.1136, + 0.0937, + 0.0749, + 0.1135, + 0.1174, + 0.086, + 0.0883, + 0.108, + 0.0945, + 0.1034, + 0.0948, + 0.0933, + 0.1122, + 0.0924, + 0.0801, + 0.0856, + 0.0858, + 0.1102, + 0.1195, + 0.1005, + 0.0939, + 0.0985, + 0.0976, + 0.091, + 0.0991, + 0.0951, + 0.1015, + 0.0989, + 0.1104, + 0.0934, + 0.0977, + 0.1057, + 0.0996, + 0.0998, + 0.0893, + 0.1136, + 0.1194, + 0.1184, + 0.0927, + 0.1011, + 0.1005, + 0.0986, + 0.0947, + 0.1008, + 0.1149, + 0.1071, + 0.0997, + 0.0718, + 0.117, + 0.1241, + 0.1006, + 0.1178, + 0.0988, + 0.0993, + 0.1143, + 0.117, + 0.1217, + 0.1193, + 0.12 + ] + }, + "diagnostics": { + "bp_cosine": [ + -0.25835472345352173, + -0.36130592226982117, + -0.2657647430896759, + 0.9999802708625793 + ], + "perturbation_rho": [ + -0.043529167771339417, + 0.022320769727230072, + 0.011527110822498798, + 0.0071525974199175835 + ], + "nudging": { + "0.001": [ + 1.0617077350616455e-07, + 1.210719347000122e-07, + 9.499490261077881e-08, + -3.259629011154175e-07 + ], + "0.003": [ + 3.129243850708008e-07, + 3.7997961044311523e-07, + 2.682209014892578e-07, + -1.0058283805847168e-06 + ], + "0.01": [ + 1.0654330253601074e-06, + 1.2777745723724365e-06, + 8.754432201385498e-07, + -3.335997462272644e-06 + ] + }, + "hidden_norms_per_layer": [ + 1076.538818359375, + 51151.71875, + 101311.3046875, + 119784.4453125, + 128818.7890625 + ], + "bp_grad_norms_per_layer": [ + 2.6915265038951475e-07, + 2.3872169663263776e-07, + 2.386778135132772e-07, + 2.389696476257086e-07, + 2.3893238676464534e-07 + ] + }, + "drift": { + "embed.weight": 9.80184818135659, + "embed.bias": 19.49465769896296, + "blocks.0.ln.weight": 0.26961779594421387, + "blocks.0.w1.weight": 9.358735259494848, + "blocks.0.w1.bias": 12.749895988211446, + "blocks.0.w2.weight": 19.870291739972853, + "blocks.1.ln.weight": 0.3701913058757782, + "blocks.1.w1.weight": 9.472528827416744, + "blocks.1.w1.bias": 11.79483149750118, + "blocks.1.w2.weight": 14.954104550351216, + "blocks.2.ln.weight": 0.3377458453178406, + "blocks.2.w1.weight": 7.33340319144077, + "blocks.2.w1.bias": 9.089785454164343, + "blocks.2.w2.weight": 12.405169546116843, + "blocks.3.ln.weight": 0.49049311876296997, + "blocks.3.w1.weight": 5.387752188715276, + "blocks.3.w1.bias": 5.9034627839649305, + "blocks.3.w2.weight": 7.60319140703279, + "out_ln.weight": 0.5721396803855896, + "out_head.weight": 0.9433164083950665, + "out_head.bias": 0.4188211351080402 + } + } + }, + "config": { + "dataset": "cifar10", + "d_hidden": 256, + "num_blocks": 4, + "batch_size": 128, + "epochs": 100, + "lr": 0.001, + "lr_fb": 0.001, + "wd": 0.01, + "lam": 0.1, + "K": 4, + "sigma_bridge": 0.05, + "ema_momentum": 0.995, + "term_grad_weight": 1.0, + "seeds": [ + 42 + ], + "gpu": 0, + "output_dir": "results/fa_random_targets_s42", + "methods": [ + "fa" + ], + "random_targets": true, + "penalty_lam": 0.0, + "num_classes": 10 + } +}
\ No newline at end of file |
