diff options
Diffstat (limited to 'results/h2_smoke_w0.1/snapshot_evolution_s42.json')
| -rw-r--r-- | results/h2_smoke_w0.1/snapshot_evolution_s42.json | 237 |
1 files changed, 237 insertions, 0 deletions
diff --git a/results/h2_smoke_w0.1/snapshot_evolution_s42.json b/results/h2_smoke_w0.1/snapshot_evolution_s42.json new file mode 100644 index 0000000..d085d3c --- /dev/null +++ b/results/h2_smoke_w0.1/snapshot_evolution_s42.json @@ -0,0 +1,237 @@ +{ + "config": { + "output_dir": "results/h2_smoke_w0.1", + "epochs": 3, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.560444831848145, + 8.845171928405762, + 9.21005916595459, + 9.379204750061035 + ], + "bp_grad_norms_per_sample_med": [ + 0.001055641332641244, + 0.0007215326768346131, + 0.0005827629356645048, + 0.0004979022196494043, + 0.00043998067849315703 + ], + "bp_grad_norms_F": [ + 0.036981210112571716, + 0.023669881746172905, + 0.018871067091822624, + 0.016073165461421013, + 0.014115042984485626 + ], + "gamma_dfa": NaN, + "acc_eval": 0.09375, + "loss_eval": 2.4311001300811768, + "epoch": 0 + }, + { + "hidden_norms": [ + 85.71797180175781, + 28.746126174926758, + 27.666101455688477, + 31.958999633789062, + 39.62472915649414 + ], + "bp_grad_norms_per_sample_med": [ + 8.686084765940905e-05, + 8.580532448831946e-05, + 8.54266545502469e-05, + 8.48824274726212e-05, + 8.353861630894244e-05 + ], + "bp_grad_norms_F": [ + 0.003033322049304843, + 0.002979709068313241, + 0.0029494145419448614, + 0.002918587066233158, + 0.0028573593590408564 + ], + "gamma_dfa": NaN, + "acc_eval": 0.05859375, + "loss_eval": 2.529827356338501, + "epoch": 1 + }, + { + "hidden_norms": [ + 103.60254669189453, + 33.103458404541016, + 32.14752197265625, + 38.19721984863281, + 48.121864318847656 + ], + "bp_grad_norms_per_sample_med": [ + 7.112277671694756e-05, + 7.050936983432621e-05, + 7.047054532449692e-05, + 6.984646461205557e-05, + 6.839916750323027e-05 + ], + "bp_grad_norms_F": [ + 0.002462180098518729, + 0.0024272387381643057, + 0.002406709361821413, + 0.002380331512540579, + 0.0023274135310202837 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0703125, + "loss_eval": 2.518604278564453, + "epoch": 2 + }, + { + "hidden_norms": [ + 99.88206481933594, + 32.27016830444336, + 29.376516342163086, + 35.85775375366211, + 44.175907135009766 + ], + "bp_grad_norms_per_sample_med": [ + 7.549120346084237e-05, + 7.506681140512228e-05, + 7.482277578674257e-05, + 7.426074444083497e-05, + 7.269046182045713e-05 + ], + "bp_grad_norms_F": [ + 0.002598837483674288, + 0.00256195105612278, + 0.002536388346925378, + 0.0025058977771550417, + 0.002439383417367935 + ], + "gamma_dfa": NaN, + "acc_eval": 0.072265625, + "loss_eval": 2.5117571353912354, + "epoch": 3 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.560444831848145, + 8.845171928405762, + 9.21005916595459, + 9.379204750061035 + ], + "bp_grad_norms_per_sample_med": [ + 0.001055641332641244, + 0.0007215326768346131, + 0.0005827629356645048, + 0.0004979022196494043, + 0.00043998067849315703 + ], + "bp_grad_norms_F": [ + 0.036981210112571716, + 0.023669881746172905, + 0.018871067091822624, + 0.016073165461421013, + 0.014115042984485626 + ], + "gamma_dfa": 0.0034602322848513722, + "acc_eval": 0.09375, + "loss_eval": 2.4311001300811768, + "epoch": 0 + }, + { + "hidden_norms": [ + 1321.57177734375, + 5876.37109375, + 5211.20947265625, + 5922.93798828125, + 3697.69580078125 + ], + "bp_grad_norms_per_sample_med": [ + 1.0980336355714826e-06, + 8.924058079173847e-07, + 8.845478305374854e-07, + 8.81322591794742e-07, + 8.844919534567453e-07 + ], + "bp_grad_norms_F": [ + 7.150410965550691e-05, + 5.026865619583987e-05, + 4.9243793910136446e-05, + 4.888495459454134e-05, + 4.859357068198733e-05 + ], + "gamma_dfa": 0.03524830285459757, + "acc_eval": 0.1181640625, + "loss_eval": 2.2935099601745605, + "epoch": 1 + }, + { + "hidden_norms": [ + 2543.9384765625, + 26885.123046875, + 22657.53515625, + 23760.638671875, + 13455.5205078125 + ], + "bp_grad_norms_per_sample_med": [ + 3.232785559248441e-07, + 2.0931234701038193e-07, + 2.086635788600688e-07, + 2.0885721596641815e-07, + 2.086642325593857e-07 + ], + "bp_grad_norms_F": [ + 3.009554711752571e-05, + 1.4969685253163334e-05, + 1.4619089597545099e-05, + 1.4558195289282594e-05, + 1.4452642062678933e-05 + ], + "gamma_dfa": 0.03537877253256738, + "acc_eval": 0.1201171875, + "loss_eval": 2.3101487159729004, + "epoch": 2 + }, + { + "hidden_norms": [ + 2961.771484375, + 39258.7265625, + 31789.115234375, + 32956.20703125, + 18197.2578125 + ], + "bp_grad_norms_per_sample_med": [ + 2.570918979927228e-07, + 1.4994434138770885e-07, + 1.4976241402564483e-07, + 1.4952657068079134e-07, + 1.4944804149763513e-07 + ], + "bp_grad_norms_F": [ + 2.3238537323777564e-05, + 1.1003003237419762e-05, + 1.0661849046300631e-05, + 1.0592500984785147e-05, + 1.0497028597455937e-05 + ], + "gamma_dfa": 0.03636467596516013, + "acc_eval": 0.12109375, + "loss_eval": 2.3122406005859375, + "epoch": 3 + } + ] +}
\ No newline at end of file |
