{ "config": { "output_dir": "results/h2_smoke_w0.5", "epochs": 3, "lr": 0.001, "wd": 0.01, "seed": 42, "depth": 4, "d_hidden": 256, "log_every": 1, "no_residual_add": true, "w2_std": 0.5 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.718070030212402, 42.802223205566406, 44.22697067260742, 46.05121994018555, 46.896766662597656 ], "bp_grad_norms_per_sample_med": [ 0.0010791289387270808, 0.0002035950165009126, 0.00014324457151815295, 0.00011542177526280284, 9.846547618508339e-05 ], "bp_grad_norms_F": [ 0.0380445197224617, 0.00666962843388319, 0.0046500470489263535, 0.003719294909387827, 0.003155440790578723 ], "gamma_dfa": NaN, "acc_eval": 0.080078125, "loss_eval": 2.446239709854126, "epoch": 0 }, { "hidden_norms": [ 86.00836944580078, 130.30899047851562, 107.6886215209961, 127.31951141357422, 155.31224060058594 ], "bp_grad_norms_per_sample_med": [ 5.636421337840147e-05, 4.504464232013561e-05, 4.254864325048402e-05, 4.0549883124185726e-05, 3.8371628761524335e-05 ], "bp_grad_norms_F": [ 0.0019479888724163175, 0.0014867106219753623, 0.0013919975608587265, 0.001322419848293066, 0.0012390650808811188 ], "gamma_dfa": NaN, "acc_eval": 0.1435546875, "loss_eval": 2.293787717819214, "epoch": 1 }, { "hidden_norms": [ 103.2545166015625, 142.36724853515625, 117.42737579345703, 145.57473754882812, 174.0562744140625 ], "bp_grad_norms_per_sample_med": [ 5.0501937948865816e-05, 4.213622378301807e-05, 3.962606206187047e-05, 3.741410546354018e-05, 3.486485002213158e-05 ], "bp_grad_norms_F": [ 0.001744136679917574, 0.0013844756176695228, 0.0012931021628901362, 0.0012163385981693864, 0.0011240089079365134 ], "gamma_dfa": NaN, "acc_eval": 0.1640625, "loss_eval": 2.2804112434387207, "epoch": 2 }, { "hidden_norms": [ 99.97102355957031, 140.33131408691406, 110.34066772460938, 136.7115936279297, 163.25784301757812 ], "bp_grad_norms_per_sample_med": [ 5.4715037549613044e-05, 4.477328184293583e-05, 4.2219675378873944e-05, 3.9974820538191125e-05, 3.672601087600924e-05 ], "bp_grad_norms_F": [ 0.0019211760954931378, 0.0015042650047689676, 0.0013935193419456482, 0.0013014256255701184, 0.0011887947330251336 ], "gamma_dfa": NaN, "acc_eval": 0.1630859375, "loss_eval": 2.294424057006836, "epoch": 3 } ], "dfa_log": [ { "hidden_norms": [ 8.718070030212402, 42.802223205566406, 44.22697067260742, 46.05121994018555, 46.896766662597656 ], "bp_grad_norms_per_sample_med": [ 0.0010791289387270808, 0.0002035950165009126, 0.00014324457151815295, 0.00011542177526280284, 9.846547618508339e-05 ], "bp_grad_norms_F": [ 0.0380445197224617, 0.00666962843388319, 0.0046500470489263535, 0.003719294909387827, 0.003155440790578723 ], "gamma_dfa": 0.004864378133788705, "acc_eval": 0.080078125, "loss_eval": 2.446239709854126, "epoch": 0 }, { "hidden_norms": [ 1180.2318115234375, 5768.2900390625, 5472.90234375, 6369.3427734375, 5295.2470703125 ], "bp_grad_norms_per_sample_med": [ 1.2146981589467032e-06, 8.634061714474228e-07, 8.587696811446222e-07, 8.589160529481887e-07, 8.53334995554178e-07 ], "bp_grad_norms_F": [ 6.592504360014573e-05, 4.607137088896707e-05, 4.4360855099512264e-05, 4.341698149801232e-05, 4.290258584660478e-05 ], "gamma_dfa": 0.0467059058137238, "acc_eval": 0.15625, "loss_eval": 2.2713985443115234, "epoch": 1 }, { "hidden_norms": [ 2312.98193359375, 25168.3515625, 22182.9609375, 23364.205078125, 16927.552734375 ], "bp_grad_norms_per_sample_med": [ 4.0056002603705565e-07, 2.224278716767003e-07, 2.2240433850129193e-07, 2.2153939482905116e-07, 2.2145297862152802e-07 ], "bp_grad_norms_F": [ 3.370734702912159e-05, 1.619783870410174e-05, 1.508272544015199e-05, 1.4707649825140834e-05, 1.4549447769240942e-05 ], "gamma_dfa": 0.04014483268838376, "acc_eval": 0.1513671875, "loss_eval": 2.315417528152466, "epoch": 2 }, { "hidden_norms": [ 2703.50634765625, 35877.58203125, 30404.849609375, 31748.2421875, 22049.421875 ], "bp_grad_norms_per_sample_med": [ 3.239594548176683e-07, 1.6274317715669895e-07, 1.625548691208678e-07, 1.6296479543598252e-07, 1.628933432584745e-07 ], "bp_grad_norms_F": [ 2.923223473771941e-05, 1.1944111065531615e-05, 1.1137096407765057e-05, 1.09043749034754e-05, 1.0791579370561522e-05 ], "gamma_dfa": 0.039210652525071055, "acc_eval": 0.1484375, "loss_eval": 2.3342530727386475, "epoch": 3 } ] }