{ "config": { "output_dir": "results/h2_smoke_w0.1", "epochs": 3, "lr": 0.001, "wd": 0.01, "seed": 42, "depth": 4, "d_hidden": 256, "log_every": 1, "no_residual_add": true, "w2_std": 0.1 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.718070030212402, 8.560444831848145, 8.845171928405762, 9.21005916595459, 9.379204750061035 ], "bp_grad_norms_per_sample_med": [ 0.001055641332641244, 0.0007215326768346131, 0.0005827629356645048, 0.0004979022196494043, 0.00043998067849315703 ], "bp_grad_norms_F": [ 0.036981210112571716, 0.023669881746172905, 0.018871067091822624, 0.016073165461421013, 0.014115042984485626 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 2.4311001300811768, "epoch": 0 }, { "hidden_norms": [ 85.71797180175781, 28.746126174926758, 27.666101455688477, 31.958999633789062, 39.62472915649414 ], "bp_grad_norms_per_sample_med": [ 8.686084765940905e-05, 8.580532448831946e-05, 8.54266545502469e-05, 8.48824274726212e-05, 8.353861630894244e-05 ], "bp_grad_norms_F": [ 0.003033322049304843, 0.002979709068313241, 0.0029494145419448614, 0.002918587066233158, 0.0028573593590408564 ], "gamma_dfa": NaN, "acc_eval": 0.05859375, "loss_eval": 2.529827356338501, "epoch": 1 }, { "hidden_norms": [ 103.60254669189453, 33.103458404541016, 32.14752197265625, 38.19721984863281, 48.121864318847656 ], "bp_grad_norms_per_sample_med": [ 7.112277671694756e-05, 7.050936983432621e-05, 7.047054532449692e-05, 6.984646461205557e-05, 6.839916750323027e-05 ], "bp_grad_norms_F": [ 0.002462180098518729, 0.0024272387381643057, 0.002406709361821413, 0.002380331512540579, 0.0023274135310202837 ], "gamma_dfa": NaN, "acc_eval": 0.0703125, "loss_eval": 2.518604278564453, "epoch": 2 }, { "hidden_norms": [ 99.88206481933594, 32.27016830444336, 29.376516342163086, 35.85775375366211, 44.175907135009766 ], "bp_grad_norms_per_sample_med": [ 7.549120346084237e-05, 7.506681140512228e-05, 7.482277578674257e-05, 7.426074444083497e-05, 7.269046182045713e-05 ], "bp_grad_norms_F": [ 0.002598837483674288, 0.00256195105612278, 0.002536388346925378, 0.0025058977771550417, 0.002439383417367935 ], "gamma_dfa": NaN, "acc_eval": 0.072265625, "loss_eval": 2.5117571353912354, "epoch": 3 } ], "dfa_log": [ { "hidden_norms": [ 8.718070030212402, 8.560444831848145, 8.845171928405762, 9.21005916595459, 9.379204750061035 ], "bp_grad_norms_per_sample_med": [ 0.001055641332641244, 0.0007215326768346131, 0.0005827629356645048, 0.0004979022196494043, 0.00043998067849315703 ], "bp_grad_norms_F": [ 0.036981210112571716, 0.023669881746172905, 0.018871067091822624, 0.016073165461421013, 0.014115042984485626 ], "gamma_dfa": 0.0034602322848513722, "acc_eval": 0.09375, "loss_eval": 2.4311001300811768, "epoch": 0 }, { "hidden_norms": [ 1321.57177734375, 5876.37109375, 5211.20947265625, 5922.93798828125, 3697.69580078125 ], "bp_grad_norms_per_sample_med": [ 1.0980336355714826e-06, 8.924058079173847e-07, 8.845478305374854e-07, 8.81322591794742e-07, 8.844919534567453e-07 ], "bp_grad_norms_F": [ 7.150410965550691e-05, 5.026865619583987e-05, 4.9243793910136446e-05, 4.888495459454134e-05, 4.859357068198733e-05 ], "gamma_dfa": 0.03524830285459757, "acc_eval": 0.1181640625, "loss_eval": 2.2935099601745605, "epoch": 1 }, { "hidden_norms": [ 2543.9384765625, 26885.123046875, 22657.53515625, 23760.638671875, 13455.5205078125 ], "bp_grad_norms_per_sample_med": [ 3.232785559248441e-07, 2.0931234701038193e-07, 2.086635788600688e-07, 2.0885721596641815e-07, 2.086642325593857e-07 ], "bp_grad_norms_F": [ 3.009554711752571e-05, 1.4969685253163334e-05, 1.4619089597545099e-05, 1.4558195289282594e-05, 1.4452642062678933e-05 ], "gamma_dfa": 0.03537877253256738, "acc_eval": 0.1201171875, "loss_eval": 2.3101487159729004, "epoch": 2 }, { "hidden_norms": [ 2961.771484375, 39258.7265625, 31789.115234375, 32956.20703125, 18197.2578125 ], "bp_grad_norms_per_sample_med": [ 2.570918979927228e-07, 1.4994434138770885e-07, 1.4976241402564483e-07, 1.4952657068079134e-07, 1.4944804149763513e-07 ], "bp_grad_norms_F": [ 2.3238537323777564e-05, 1.1003003237419762e-05, 1.0661849046300631e-05, 1.0592500984785147e-05, 1.0497028597455937e-05 ], "gamma_dfa": 0.03636467596516013, "acc_eval": 0.12109375, "loss_eval": 2.3122406005859375, "epoch": 3 } ] }