{ "config": { "output_dir": "results/h2_smoke_w0.2", "epochs": 3, "lr": 0.001, "wd": 0.01, "seed": 42, "depth": 4, "d_hidden": 256, "log_every": 1, "no_residual_add": true, "w2_std": 0.2 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.718070030212402, 17.12088966369629, 17.690689086914062, 18.420406341552734, 18.75864601135254 ], "bp_grad_norms_per_sample_med": [ 0.0010638737585395575, 0.00045698368921875954, 0.0003363286959938705, 0.0002763723023235798, 0.0002378255157964304 ], "bp_grad_norms_F": [ 0.03763078525662422, 0.015000421553850174, 0.010959738865494728, 0.008936461992561817, 0.007658911868929863 ], "gamma_dfa": NaN, "acc_eval": 0.0859375, "loss_eval": 2.4382002353668213, "epoch": 0 }, { "hidden_norms": [ 85.67359161376953, 53.38432693481445, 47.44037628173828, 55.29991149902344, 67.34859466552734 ], "bp_grad_norms_per_sample_med": [ 8.009114390006289e-05, 7.683139119762927e-05, 7.53635322325863e-05, 7.400008325930685e-05, 7.128623110475019e-05 ], "bp_grad_norms_F": [ 0.0027135731652379036, 0.0025544750969856977, 0.0024875544477254152, 0.0024266208056360483, 0.0023267678916454315 ], "gamma_dfa": NaN, "acc_eval": 0.083984375, "loss_eval": 2.4839837551116943, "epoch": 1 }, { "hidden_norms": [ 103.92682647705078, 59.23755645751953, 52.980411529541016, 64.2865982055664, 78.33065032958984 ], "bp_grad_norms_per_sample_med": [ 6.883802416268736e-05, 6.662087980657816e-05, 6.507965008495376e-05, 6.394806405296549e-05, 6.143032078398392e-05 ], "bp_grad_norms_F": [ 0.0023220409639179707, 0.002212206134572625, 0.0021602711640298367, 0.0021026749163866043, 0.002004916314035654 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 2.4874913692474365, "epoch": 2 }, { "hidden_norms": [ 99.67398834228516, 58.03565216064453, 49.116390228271484, 60.295406341552734, 73.20696258544922 ], "bp_grad_norms_per_sample_med": [ 7.312109664781019e-05, 7.063996599754319e-05, 6.898775609442964e-05, 6.728436710545793e-05, 6.445571489166468e-05 ], "bp_grad_norms_F": [ 0.002473062602803111, 0.0023518132511526346, 0.0022898896131664515, 0.002222386421635747, 0.002102817641571164 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.4926531314849854, "epoch": 3 } ], "dfa_log": [ { "hidden_norms": [ 8.718070030212402, 17.12088966369629, 17.690689086914062, 18.420406341552734, 18.75864601135254 ], "bp_grad_norms_per_sample_med": [ 0.0010638737585395575, 0.00045698368921875954, 0.0003363286959938705, 0.0002763723023235798, 0.0002378255157964304 ], "bp_grad_norms_F": [ 0.03763078525662422, 0.015000421553850174, 0.010959738865494728, 0.008936461992561817, 0.007658911868929863 ], "gamma_dfa": 0.0037797510012751445, "acc_eval": 0.0859375, "loss_eval": 2.4382002353668213, "epoch": 0 }, { "hidden_norms": [ 1258.0216064453125, 5942.1240234375, 4878.22021484375, 5972.6494140625, 4135.04931640625 ], "bp_grad_norms_per_sample_med": [ 1.158710347226588e-06, 8.974735692390823e-07, 8.935384698816051e-07, 8.949773473432288e-07, 8.903299999474257e-07 ], "bp_grad_norms_F": [ 6.218944326974452e-05, 4.8492554924450815e-05, 4.7771758545422927e-05, 4.744856778415851e-05, 4.708760025096126e-05 ], "gamma_dfa": 0.039906812366098166, "acc_eval": 0.1259765625, "loss_eval": 2.2913613319396973, "epoch": 1 }, { "hidden_norms": [ 2455.668212890625, 26613.791015625, 20806.90234375, 23305.125, 14706.8408203125 ], "bp_grad_norms_per_sample_med": [ 3.5421919619693654e-07, 2.1852616782780387e-07, 2.1860738286250125e-07, 2.179439917426862e-07, 2.1746768652519677e-07 ], "bp_grad_norms_F": [ 3.6695244489237666e-05, 1.5090728993527591e-05, 1.4612215636589099e-05, 1.4485378414974548e-05, 1.4331568308989517e-05 ], "gamma_dfa": 0.03681188588961959, "acc_eval": 0.1416015625, "loss_eval": 2.3159337043762207, "epoch": 2 }, { "hidden_norms": [ 2871.099853515625, 38200.73828125, 28961.662109375, 32314.5390625, 19539.51953125 ], "bp_grad_norms_per_sample_med": [ 2.831942822467681e-07, 1.5707844625012513e-07, 1.5655700735806022e-07, 1.5635474426289875e-07, 1.559963891395455e-07 ], "bp_grad_norms_F": [ 2.7198082534596324e-05, 1.122839967138134e-05, 1.0740075595094822e-05, 1.0607479453028645e-05, 1.046583474817453e-05 ], "gamma_dfa": 0.036901777144521475, "acc_eval": 0.1435546875, "loss_eval": 2.321805477142334, "epoch": 3 } ] }