diff options
Diffstat (limited to 'results/h2_smoke_w0.2/snapshot_evolution_s42.json')
| -rw-r--r-- | results/h2_smoke_w0.2/snapshot_evolution_s42.json | 237 |
1 files changed, 237 insertions, 0 deletions
diff --git a/results/h2_smoke_w0.2/snapshot_evolution_s42.json b/results/h2_smoke_w0.2/snapshot_evolution_s42.json new file mode 100644 index 0000000..a98f5da --- /dev/null +++ b/results/h2_smoke_w0.2/snapshot_evolution_s42.json @@ -0,0 +1,237 @@ +{ + "config": { + "output_dir": "results/h2_smoke_w0.2", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.2 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 17.12088966369629, + 17.690689086914062, + 18.420406341552734, + 18.75864601135254 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010638737585395575, + 0.00045698368921875954, + 0.0003363286959938705, + 0.0002763723023235798, + 0.0002378255157964304 + ], + "bp_grad_norms_F": [ + 0.03763078525662422, + 0.015000421553850174, + 0.010959738865494728, + 0.008936461992561817, + 0.007658911868929863 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0859375, + "loss_eval": 2.4382002353668213, + "epoch": 0 + }, + { + "hidden_norms": [ + 85.67359161376953, + 53.38432693481445, + 47.44037628173828, + 55.29991149902344, + 67.34859466552734 + ], + "bp_grad_norms_per_sample_med": [ + 8.009114390006289e-05, + 7.683139119762927e-05, + 7.53635322325863e-05, + 7.400008325930685e-05, + 7.128623110475019e-05 + ], + "bp_grad_norms_F": [ + 0.0027135731652379036, + 0.0025544750969856977, + 0.0024875544477254152, + 0.0024266208056360483, + 0.0023267678916454315 + ], + "gamma_dfa": NaN, + "acc_eval": 0.083984375, + "loss_eval": 2.4839837551116943, + "epoch": 1 + }, + { + "hidden_norms": [ + 103.92682647705078, + 59.23755645751953, + 52.980411529541016, + 64.2865982055664, + 78.33065032958984 + ], + "bp_grad_norms_per_sample_med": [ + 6.883802416268736e-05, + 6.662087980657816e-05, + 6.507965008495376e-05, + 6.394806405296549e-05, + 6.143032078398392e-05 + ], + "bp_grad_norms_F": [ + 0.0023220409639179707, + 0.002212206134572625, + 0.0021602711640298367, + 0.0021026749163866043, + 0.002004916314035654 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.4874913692474365, + "epoch": 2 + }, + { + "hidden_norms": [ + 99.67398834228516, + 58.03565216064453, + 49.116390228271484, + 60.295406341552734, + 73.20696258544922 + ], + "bp_grad_norms_per_sample_med": [ + 7.312109664781019e-05, + 7.063996599754319e-05, + 6.898775609442964e-05, + 6.728436710545793e-05, + 6.445571489166468e-05 + ], + "bp_grad_norms_F": [ + 0.002473062602803111, + 0.0023518132511526346, + 0.0022898896131664515, + 0.002222386421635747, + 0.002102817641571164 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.4926531314849854, + "epoch": 3 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 17.12088966369629, + 17.690689086914062, + 18.420406341552734, + 18.75864601135254 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010638737585395575, + 0.00045698368921875954, + 0.0003363286959938705, + 0.0002763723023235798, + 0.0002378255157964304 + ], + "bp_grad_norms_F": [ + 0.03763078525662422, + 0.015000421553850174, + 0.010959738865494728, + 0.008936461992561817, + 0.007658911868929863 + ], + "gamma_dfa": 0.0037797510012751445, + "acc_eval": 0.0859375, + "loss_eval": 2.4382002353668213, + "epoch": 0 + }, + { + "hidden_norms": [ + 1258.0216064453125, + 5942.1240234375, + 4878.22021484375, + 5972.6494140625, + 4135.04931640625 + ], + "bp_grad_norms_per_sample_med": [ + 1.158710347226588e-06, + 8.974735692390823e-07, + 8.935384698816051e-07, + 8.949773473432288e-07, + 8.903299999474257e-07 + ], + "bp_grad_norms_F": [ + 6.218944326974452e-05, + 4.8492554924450815e-05, + 4.7771758545422927e-05, + 4.744856778415851e-05, + 4.708760025096126e-05 + ], + "gamma_dfa": 0.039906812366098166, + "acc_eval": 0.1259765625, + "loss_eval": 2.2913613319396973, + "epoch": 1 + }, + { + "hidden_norms": [ + 2455.668212890625, + 26613.791015625, + 20806.90234375, + 23305.125, + 14706.8408203125 + ], + "bp_grad_norms_per_sample_med": [ + 3.5421919619693654e-07, + 2.1852616782780387e-07, + 2.1860738286250125e-07, + 2.179439917426862e-07, + 2.1746768652519677e-07 + ], + "bp_grad_norms_F": [ + 3.6695244489237666e-05, + 1.5090728993527591e-05, + 1.4612215636589099e-05, + 1.4485378414974548e-05, + 1.4331568308989517e-05 + ], + "gamma_dfa": 0.03681188588961959, + "acc_eval": 0.1416015625, + "loss_eval": 2.3159337043762207, + "epoch": 2 + }, + { + "hidden_norms": [ + 2871.099853515625, + 38200.73828125, + 28961.662109375, + 32314.5390625, + 19539.51953125 + ], + "bp_grad_norms_per_sample_med": [ + 2.831942822467681e-07, + 1.5707844625012513e-07, + 1.5655700735806022e-07, + 1.5635474426289875e-07, + 1.559963891395455e-07 + ], + "bp_grad_norms_F": [ + 2.7198082534596324e-05, + 1.122839967138134e-05, + 1.0740075595094822e-05, + 1.0607479453028645e-05, + 1.046583474817453e-05 + ], + "gamma_dfa": 0.036901777144521475, + "acc_eval": 0.1435546875, + "loss_eval": 2.321805477142334, + "epoch": 3 + } + ] +}
\ No newline at end of file |
