diff options
Diffstat (limited to 'results/h2_smoke_w0.5/snapshot_evolution_s42.json')
| -rw-r--r-- | results/h2_smoke_w0.5/snapshot_evolution_s42.json | 237 |
1 files changed, 237 insertions, 0 deletions
diff --git a/results/h2_smoke_w0.5/snapshot_evolution_s42.json b/results/h2_smoke_w0.5/snapshot_evolution_s42.json new file mode 100644 index 0000000..8c75ebd --- /dev/null +++ b/results/h2_smoke_w0.5/snapshot_evolution_s42.json @@ -0,0 +1,237 @@ +{ + "config": { + "output_dir": "results/h2_smoke_w0.5", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 42.802223205566406, + 44.22697067260742, + 46.05121994018555, + 46.896766662597656 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010791289387270808, + 0.0002035950165009126, + 0.00014324457151815295, + 0.00011542177526280284, + 9.846547618508339e-05 + ], + "bp_grad_norms_F": [ + 0.0380445197224617, + 0.00666962843388319, + 0.0046500470489263535, + 0.003719294909387827, + 0.003155440790578723 + ], + "gamma_dfa": NaN, + "acc_eval": 0.080078125, + "loss_eval": 2.446239709854126, + "epoch": 0 + }, + { + "hidden_norms": [ + 86.00836944580078, + 130.30899047851562, + 107.6886215209961, + 127.31951141357422, + 155.31224060058594 + ], + "bp_grad_norms_per_sample_med": [ + 5.636421337840147e-05, + 4.504464232013561e-05, + 4.254864325048402e-05, + 4.0549883124185726e-05, + 3.8371628761524335e-05 + ], + "bp_grad_norms_F": [ + 0.0019479888724163175, + 0.0014867106219753623, + 0.0013919975608587265, + 0.001322419848293066, + 0.0012390650808811188 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1435546875, + "loss_eval": 2.293787717819214, + "epoch": 1 + }, + { + "hidden_norms": [ + 103.2545166015625, + 142.36724853515625, + 117.42737579345703, + 145.57473754882812, + 174.0562744140625 + ], + "bp_grad_norms_per_sample_med": [ + 5.0501937948865816e-05, + 4.213622378301807e-05, + 3.962606206187047e-05, + 3.741410546354018e-05, + 3.486485002213158e-05 + ], + "bp_grad_norms_F": [ + 0.001744136679917574, + 0.0013844756176695228, + 0.0012931021628901362, + 0.0012163385981693864, + 0.0011240089079365134 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1640625, + "loss_eval": 2.2804112434387207, + "epoch": 2 + }, + { + "hidden_norms": [ + 99.97102355957031, + 140.33131408691406, + 110.34066772460938, + 136.7115936279297, + 163.25784301757812 + ], + "bp_grad_norms_per_sample_med": [ + 5.4715037549613044e-05, + 4.477328184293583e-05, + 4.2219675378873944e-05, + 3.9974820538191125e-05, + 3.672601087600924e-05 + ], + "bp_grad_norms_F": [ + 0.0019211760954931378, + 0.0015042650047689676, + 0.0013935193419456482, + 0.0013014256255701184, + 0.0011887947330251336 + ], + "gamma_dfa": NaN, + "acc_eval": 0.1630859375, + "loss_eval": 2.294424057006836, + "epoch": 3 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 42.802223205566406, + 44.22697067260742, + 46.05121994018555, + 46.896766662597656 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010791289387270808, + 0.0002035950165009126, + 0.00014324457151815295, + 0.00011542177526280284, + 9.846547618508339e-05 + ], + "bp_grad_norms_F": [ + 0.0380445197224617, + 0.00666962843388319, + 0.0046500470489263535, + 0.003719294909387827, + 0.003155440790578723 + ], + "gamma_dfa": 0.004864378133788705, + "acc_eval": 0.080078125, + "loss_eval": 2.446239709854126, + "epoch": 0 + }, + { + "hidden_norms": [ + 1180.2318115234375, + 5768.2900390625, + 5472.90234375, + 6369.3427734375, + 5295.2470703125 + ], + "bp_grad_norms_per_sample_med": [ + 1.2146981589467032e-06, + 8.634061714474228e-07, + 8.587696811446222e-07, + 8.589160529481887e-07, + 8.53334995554178e-07 + ], + "bp_grad_norms_F": [ + 6.592504360014573e-05, + 4.607137088896707e-05, + 4.4360855099512264e-05, + 4.341698149801232e-05, + 4.290258584660478e-05 + ], + "gamma_dfa": 0.0467059058137238, + "acc_eval": 0.15625, + "loss_eval": 2.2713985443115234, + "epoch": 1 + }, + { + "hidden_norms": [ + 2312.98193359375, + 25168.3515625, + 22182.9609375, + 23364.205078125, + 16927.552734375 + ], + "bp_grad_norms_per_sample_med": [ + 4.0056002603705565e-07, + 2.224278716767003e-07, + 2.2240433850129193e-07, + 2.2153939482905116e-07, + 2.2145297862152802e-07 + ], + "bp_grad_norms_F": [ + 3.370734702912159e-05, + 1.619783870410174e-05, + 1.508272544015199e-05, + 1.4707649825140834e-05, + 1.4549447769240942e-05 + ], + "gamma_dfa": 0.04014483268838376, + "acc_eval": 0.1513671875, + "loss_eval": 2.315417528152466, + "epoch": 2 + }, + { + "hidden_norms": [ + 2703.50634765625, + 35877.58203125, + 30404.849609375, + 31748.2421875, + 22049.421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.239594548176683e-07, + 1.6274317715669895e-07, + 1.625548691208678e-07, + 1.6296479543598252e-07, + 1.628933432584745e-07 + ], + "bp_grad_norms_F": [ + 2.923223473771941e-05, + 1.1944111065531615e-05, + 1.1137096407765057e-05, + 1.09043749034754e-05, + 1.0791579370561522e-05 + ], + "gamma_dfa": 0.039210652525071055, + "acc_eval": 0.1484375, + "loss_eval": 2.3342530727386475, + "epoch": 3 + } + ] +}
\ No newline at end of file |
