summaryrefslogtreecommitdiff
path: root/results/snapshot_synth_v1
diff options
context:
space:
mode:
authorYurenHao0426 <Blackhao0426@gmail.com>2026-06-14 04:06:32 -0500
committerYurenHao0426 <Blackhao0426@gmail.com>2026-06-14 04:06:32 -0500
commitaa73718eb6427d7da3b9cb416275802d90c4b2ed (patch)
treeb68b0a664fb650744ef934a1c22abd740a7b62a6 /results/snapshot_synth_v1
parent827c658fa9a750f3c6ebdb87703762f10f69f6ff (diff)
Add new experiment scripts, figures, and paper assets; untrack pyc/build artifactsHEADmaster
Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
Diffstat (limited to 'results/snapshot_synth_v1')
-rw-r--r--results/snapshot_synth_v1/run_a1.0_s42.log44
-rw-r--r--results/snapshot_synth_v1/snapshot_fa_canonical_s42.json2276
-rw-r--r--results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json2276
-rw-r--r--results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json4960
4 files changed, 9556 insertions, 0 deletions
diff --git a/results/snapshot_synth_v1/run_a1.0_s42.log b/results/snapshot_synth_v1/run_a1.0_s42.log
new file mode 100644
index 0000000..d1e834a
--- /dev/null
+++ b/results/snapshot_synth_v1/run_a1.0_s42.log
@@ -0,0 +1,44 @@
+device=cuda:0, alpha=1.0, depth=4, d_hidden=128, epochs=80, seed=42
+train: torch.Size([12800, 128]), test eval buffer: torch.Size([2000, 128])
+
+=== BP training ===
+ [BP] Ep 0: ||h_L||=1.140e+01 ||g||=2.816e-04 acc=0.0845
+ [BP] Ep 1: ||h_L||=1.393e+01 ||g||=3.616e-04 acc=0.7095
+ [BP] Ep 5: ||h_L||=2.067e+01 ||g||=2.195e-04 acc=0.7855
+ [BP] Ep 10: ||h_L||=2.332e+01 ||g||=1.576e-04 acc=0.7915
+ [BP] Ep 15: ||h_L||=2.609e+01 ||g||=9.301e-05 acc=0.8000
+ [BP] Ep 20: ||h_L||=2.880e+01 ||g||=4.764e-05 acc=0.7950
+ [BP] Ep 25: ||h_L||=3.096e+01 ||g||=3.036e-05 acc=0.7995
+ [BP] Ep 30: ||h_L||=3.235e+01 ||g||=1.972e-05 acc=0.7975
+ [BP] Ep 35: ||h_L||=3.329e+01 ||g||=1.527e-05 acc=0.8000
+ [BP] Ep 40: ||h_L||=3.398e+01 ||g||=1.181e-05 acc=0.7975
+ [BP] Ep 45: ||h_L||=3.449e+01 ||g||=1.028e-05 acc=0.7980
+ [BP] Ep 50: ||h_L||=3.489e+01 ||g||=9.180e-06 acc=0.7980
+ [BP] Ep 55: ||h_L||=3.516e+01 ||g||=8.594e-06 acc=0.7975
+ [BP] Ep 60: ||h_L||=3.538e+01 ||g||=8.124e-06 acc=0.7960
+ [BP] Ep 65: ||h_L||=3.553e+01 ||g||=7.551e-06 acc=0.7960
+ [BP] Ep 70: ||h_L||=3.561e+01 ||g||=7.443e-06 acc=0.7960
+ [BP] Ep 75: ||h_L||=3.565e+01 ||g||=7.344e-06 acc=0.7960
+ [BP] Ep 80: ||h_L||=3.565e+01 ||g||=7.323e-06 acc=0.7960
+
+=== DFA training ===
+ [DFA] Ep 0: ||h_L||=1.140e+01 ||g||=2.816e-04 acc=0.0845
+ [DFA] Ep 1: ||h_L||=1.244e+01 ||g||=2.737e-04 acc=0.3775 γ_dfa=0.1151
+ [DFA] Ep 5: ||h_L||=5.072e+01 ||g||=1.943e-04 acc=0.7350 γ_dfa=0.1674
+ [DFA] Ep 10: ||h_L||=1.381e+02 ||g||=1.229e-04 acc=0.7175 γ_dfa=0.1132
+ [DFA] Ep 15: ||h_L||=2.302e+02 ||g||=1.030e-04 acc=0.7110 γ_dfa=0.0913
+ [DFA] Ep 20: ||h_L||=3.213e+02 ||g||=1.112e-04 acc=0.7070 γ_dfa=0.0795
+ [DFA] Ep 25: ||h_L||=4.041e+02 ||g||=1.027e-04 acc=0.7035 γ_dfa=0.0709
+ [DFA] Ep 30: ||h_L||=4.810e+02 ||g||=1.014e-04 acc=0.6845 γ_dfa=0.0650
+ [DFA] Ep 35: ||h_L||=5.483e+02 ||g||=1.116e-04 acc=0.6955 γ_dfa=0.0630
+ [DFA] Ep 40: ||h_L||=6.078e+02 ||g||=1.203e-04 acc=0.6880 γ_dfa=0.0578
+ [DFA] Ep 45: ||h_L||=6.578e+02 ||g||=1.118e-04 acc=0.6845 γ_dfa=0.0563
+ [DFA] Ep 50: ||h_L||=6.988e+02 ||g||=1.262e-04 acc=0.6945 γ_dfa=0.0562
+ [DFA] Ep 55: ||h_L||=7.301e+02 ||g||=1.428e-04 acc=0.6720 γ_dfa=0.0559
+ [DFA] Ep 60: ||h_L||=7.519e+02 ||g||=1.238e-04 acc=0.6910 γ_dfa=0.0542
+ [DFA] Ep 65: ||h_L||=7.678e+02 ||g||=1.230e-04 acc=0.6895 γ_dfa=0.0530
+ [DFA] Ep 70: ||h_L||=7.757e+02 ||g||=1.224e-04 acc=0.6950 γ_dfa=0.0530
+ [DFA] Ep 75: ||h_L||=7.791e+02 ||g||=1.214e-04 acc=0.6915 γ_dfa=0.0526
+ [DFA] Ep 80: ||h_L||=7.797e+02 ||g||=1.203e-04 acc=0.6930 γ_dfa=0.0526
+
+Saved results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json
diff --git a/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json b/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json
new file mode 100644
index 0000000..6ff85e7
--- /dev/null
+++ b/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json
@@ -0,0 +1,2276 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.290447235107422,
+ 11.313605308532715,
+ 11.351215362548828,
+ 11.398087501525879
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028353024390526116,
+ 0.0002828188880812377,
+ 0.00028162598027847707,
+ 0.0002799496578518301,
+ 0.0002791006409097463
+ ],
+ "bp_grad_F": [
+ 0.012684082612395287,
+ 0.01264861598610878,
+ 0.012589854188263416,
+ 0.012511610053479671,
+ 0.012471316382288933
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.08450000733137131,
+ "loss_eval": 2.4790313243865967,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.457883834838867,
+ 11.697802543640137,
+ 12.001762390136719,
+ 12.303658485412598
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004113642207812518,
+ 0.00037613665335811675,
+ 0.0003495849668979645,
+ 0.0003221812949050218,
+ 0.00025295966770499945
+ ],
+ "bp_grad_F": [
+ 0.018967075273394585,
+ 0.017186719924211502,
+ 0.015851320698857307,
+ 0.01445167325437069,
+ 0.011211601085960865
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5270000100135803,
+ "loss_eval": 1.4865981340408325,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.734084129333496,
+ 12.481009483337402,
+ 13.659913063049316,
+ 15.730950355529785
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007782558677718043,
+ 0.0006171928835101426,
+ 0.0004891889402642846,
+ 0.00038687532651238143,
+ 0.000231728219659999
+ ],
+ "bp_grad_F": [
+ 0.04103676602244377,
+ 0.03172670304775238,
+ 0.024926593527197838,
+ 0.019472092390060425,
+ 0.011657902970910072
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6360000371932983,
+ "loss_eval": 0.965207040309906,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.973358154296875,
+ 13.411399841308594,
+ 16.07562255859375,
+ 20.911983489990234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008172825910151005,
+ 0.0005784342647530138,
+ 0.000417369301430881,
+ 0.0003010776126757264,
+ 0.000168764207046479
+ ],
+ "bp_grad_F": [
+ 0.05745441094040871,
+ 0.04039904102683067,
+ 0.028755735605955124,
+ 0.020857004448771477,
+ 0.011488317511975765
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.687000036239624,
+ "loss_eval": 0.8154960870742798,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.203580856323242,
+ 14.659997940063477,
+ 19.929065704345703,
+ 27.998876571655273
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007437548483721912,
+ 0.00048129685455933213,
+ 0.00031908220262266695,
+ 0.00022696926316712052,
+ 0.00012886490731034428
+ ],
+ "bp_grad_F": [
+ 0.06721046566963196,
+ 0.043338593095541,
+ 0.028462719172239304,
+ 0.019943350926041603,
+ 0.01114331278949976
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.703000009059906,
+ "loss_eval": 0.7722610831260681,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.476441383361816,
+ 16.378177642822266,
+ 25.748563766479492,
+ 36.580970764160156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007116686902008951,
+ 0.00042677627061493695,
+ 0.0002665013598743826,
+ 0.00019125515245832503,
+ 0.0001178958555101417
+ ],
+ "bp_grad_F": [
+ 0.06977967172861099,
+ 0.04175141453742981,
+ 0.02600390836596489,
+ 0.018256530165672302,
+ 0.010964884422719479
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7070000171661377,
+ "loss_eval": 0.7697932720184326,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.808075904846191,
+ 19.022871017456055,
+ 33.50295639038086,
+ 45.75634002685547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000760514521971345,
+ 0.000416931085055694,
+ 0.0002524603623896837,
+ 0.00018262627418152988,
+ 0.0001200677506858483
+ ],
+ "bp_grad_F": [
+ 0.0695224478840828,
+ 0.03927718475461006,
+ 0.023749928921461105,
+ 0.01698874868452549,
+ 0.011118472553789616
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7035000324249268,
+ "loss_eval": 0.7977719902992249,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.191008567810059,
+ 22.44864273071289,
+ 42.65863800048828,
+ 54.38147735595703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007628297316841781,
+ 0.0003877072886098176,
+ 0.00022262487618718296,
+ 0.00016918807523325086,
+ 0.0001183631393359974
+ ],
+ "bp_grad_F": [
+ 0.06797165423631668,
+ 0.03639831766486168,
+ 0.02157149650156498,
+ 0.015874147415161133,
+ 0.011150078848004341
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.70250004529953,
+ "loss_eval": 0.8099735975265503,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.587474822998047,
+ 26.61025619506836,
+ 51.025230407714844,
+ 61.79695129394531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007774661062285304,
+ 0.00037008023355156183,
+ 0.00019806883938144892,
+ 0.0001550534798298031,
+ 0.00011658846779027954
+ ],
+ "bp_grad_F": [
+ 0.06822231411933899,
+ 0.03484996780753136,
+ 0.02039053477346897,
+ 0.015457017347216606,
+ 0.011438230983912945
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6920000314712524,
+ "loss_eval": 0.8282882571220398,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.02984619140625,
+ 31.27604866027832,
+ 59.14579391479492,
+ 68.8819580078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000821497815195471,
+ 0.000388532382203266,
+ 0.0002036481600953266,
+ 0.0001647671015234664,
+ 0.00012798182433471084
+ ],
+ "bp_grad_F": [
+ 0.06896942853927612,
+ 0.03378934785723686,
+ 0.019570810720324516,
+ 0.015211639925837517,
+ 0.01168233621865511
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6785000562667847,
+ "loss_eval": 0.8751994967460632,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.566975593566895,
+ 37.15107345581055,
+ 66.83728790283203,
+ 76.04595184326172
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008561373106203973,
+ 0.00037220801459625363,
+ 0.00018477423873264343,
+ 0.0001600280374987051,
+ 0.00012663347297348082
+ ],
+ "bp_grad_F": [
+ 0.06949204951524734,
+ 0.033161722123622894,
+ 0.019245225936174393,
+ 0.015247669070959091,
+ 0.012057062238454819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6585000157356262,
+ "loss_eval": 0.9142682552337646,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.22678279876709,
+ 44.73517990112305,
+ 74.21520233154297,
+ 82.72914123535156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008647029753774405,
+ 0.0003551499976310879,
+ 0.00016902851348277181,
+ 0.00014951576304156333,
+ 0.0001220703707076609
+ ],
+ "bp_grad_F": [
+ 0.06799578666687012,
+ 0.03190648928284645,
+ 0.018390726298093796,
+ 0.015047998167574406,
+ 0.01216125674545765
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6635000109672546,
+ "loss_eval": 0.9312959313392639,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.982205390930176,
+ 53.03363037109375,
+ 81.01543426513672,
+ 88.02293395996094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008814894827082753,
+ 0.0003609499253798276,
+ 0.00016691464406903833,
+ 0.00015374798385892063,
+ 0.00012832213542424142
+ ],
+ "bp_grad_F": [
+ 0.06737235933542252,
+ 0.030633311718702316,
+ 0.017514588311314583,
+ 0.014722960069775581,
+ 0.012166885659098625
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6665000319480896,
+ "loss_eval": 0.9171096086502075,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 17.348485946655273,
+ 65.39360046386719,
+ 94.1773452758789,
+ 97.79885864257812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008671359973959625,
+ 0.0003543675411492586,
+ 0.00017760474293027073,
+ 0.00016833240806590766,
+ 0.0001419015898136422
+ ],
+ "bp_grad_F": [
+ 0.06303472071886063,
+ 0.027784455567598343,
+ 0.016537917777895927,
+ 0.01453208364546299,
+ 0.012470746412873268
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6520000100135803,
+ "loss_eval": 0.9543019533157349,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 19.79836082458496,
+ 82.84272003173828,
+ 118.11077880859375,
+ 117.29456329345703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000835613114759326,
+ 0.00034002913162112236,
+ 0.00017855060286819935,
+ 0.00017689696687739342,
+ 0.0001562273973831907
+ ],
+ "bp_grad_F": [
+ 0.05830768123269081,
+ 0.025488071143627167,
+ 0.01599927246570587,
+ 0.014500983990728855,
+ 0.012853534892201424
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6320000290870667,
+ "loss_eval": 0.9986603260040283,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 24.028667449951172,
+ 104.24053192138672,
+ 151.45233154296875,
+ 148.85594177246094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008604780305176973,
+ 0.0003412840305827558,
+ 0.00020471647439990193,
+ 0.00020128543837927282,
+ 0.00018673941667657346
+ ],
+ "bp_grad_F": [
+ 0.05637207254767418,
+ 0.023704711347818375,
+ 0.016045723110437393,
+ 0.015071108937263489,
+ 0.013779145665466785
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6110000014305115,
+ "loss_eval": 1.08339262008667,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 31.199304580688477,
+ 135.36643981933594,
+ 190.8426971435547,
+ 189.1505126953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000760686700232327,
+ 0.0002976131218019873,
+ 0.00019266465096734464,
+ 0.0001927861594595015,
+ 0.0001783591287676245
+ ],
+ "bp_grad_F": [
+ 0.04442710801959038,
+ 0.020077738910913467,
+ 0.0149933947250247,
+ 0.014391067437827587,
+ 0.01344863511621952
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6480000019073486,
+ "loss_eval": 1.0371382236480713,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 41.846805572509766,
+ 170.3418731689453,
+ 225.09695434570312,
+ 224.6548614501953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007461759960278869,
+ 0.00026667246129363775,
+ 0.00018387376621831208,
+ 0.00018445710884407163,
+ 0.00017204758478328586
+ ],
+ "bp_grad_F": [
+ 0.039136338979005814,
+ 0.018771812319755554,
+ 0.015547079034149647,
+ 0.01513050775974989,
+ 0.01431551855057478
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6200000047683716,
+ "loss_eval": 1.1162669658660889,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 57.18465042114258,
+ 206.83914184570312,
+ 262.21197509765625,
+ 260.03485107421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007871078560128808,
+ 0.00029353986610658467,
+ 0.00022458977764472365,
+ 0.00022484370856545866,
+ 0.00021257037587929517
+ ],
+ "bp_grad_F": [
+ 0.03888345882296562,
+ 0.01824026368558407,
+ 0.015890181064605713,
+ 0.015627194195985794,
+ 0.014916189946234226
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615000128746033,
+ "loss_eval": 1.2106062173843384,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 75.66644287109375,
+ 241.24891662597656,
+ 298.0739440917969,
+ 293.95281982421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000782749499194324,
+ 0.0002943766303360462,
+ 0.00024086510529741645,
+ 0.00024184907670132816,
+ 0.0002289286785526201
+ ],
+ "bp_grad_F": [
+ 0.03717740252614021,
+ 0.01794801466166973,
+ 0.016123440116643906,
+ 0.0158899687230587,
+ 0.015260584652423859
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5680000185966492,
+ "loss_eval": 1.1780248880386353,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 97.68470764160156,
+ 276.2217712402344,
+ 334.56146240234375,
+ 329.1627502441406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007400053436867893,
+ 0.00028874175040982664,
+ 0.00024344309349544346,
+ 0.0002433314366498962,
+ 0.00023140427947510034
+ ],
+ "bp_grad_F": [
+ 0.03569746017456055,
+ 0.0169936865568161,
+ 0.015504195354878902,
+ 0.015339999459683895,
+ 0.014785589650273323
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5745000243186951,
+ "loss_eval": 1.1848244667053223,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 123.06426239013672,
+ 312.8515625,
+ 373.4215087890625,
+ 366.50213623046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007171913748607039,
+ 0.00026914477348327637,
+ 0.00023370776034425944,
+ 0.00023370303097181022,
+ 0.0002235924475826323
+ ],
+ "bp_grad_F": [
+ 0.03427436947822571,
+ 0.016933348029851913,
+ 0.015780098736286163,
+ 0.015659287571907043,
+ 0.015169495716691017
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5715000033378601,
+ "loss_eval": 1.2063732147216797,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 153.3316650390625,
+ 353.62042236328125,
+ 417.3258361816406,
+ 408.16680908203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007328973151743412,
+ 0.000268118514213711,
+ 0.00024018273688852787,
+ 0.00024114495317917317,
+ 0.0002314754092367366
+ ],
+ "bp_grad_F": [
+ 0.033994678407907486,
+ 0.016857070848345757,
+ 0.01595945656299591,
+ 0.01587284542620182,
+ 0.015459166839718819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5450000166893005,
+ "loss_eval": 1.2801684141159058,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 187.16934204101562,
+ 397.18280029296875,
+ 464.5965881347656,
+ 453.26629638671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007429302204400301,
+ 0.0002756037574727088,
+ 0.0002533047809265554,
+ 0.0002549285418353975,
+ 0.00024467214825563133
+ ],
+ "bp_grad_F": [
+ 0.03400976210832596,
+ 0.017134130001068115,
+ 0.016380103304982185,
+ 0.016292234882712364,
+ 0.015935255214571953
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5055000185966492,
+ "loss_eval": 1.4238585233688354,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 221.9723663330078,
+ 441.26580810546875,
+ 512.8148193359375,
+ 498.7379455566406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006891476223245263,
+ 0.00027131737442687154,
+ 0.0002505357551854104,
+ 0.000251909252256155,
+ 0.0002428782609058544
+ ],
+ "bp_grad_F": [
+ 0.032484397292137146,
+ 0.01684476062655449,
+ 0.01627412810921669,
+ 0.016195174306631088,
+ 0.015904447063803673
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5290000438690186,
+ "loss_eval": 1.3381338119506836,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 256.86456298828125,
+ 485.2987060546875,
+ 561.24755859375,
+ 544.2046508789062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007065363461151719,
+ 0.0002826322161126882,
+ 0.00026495553902350366,
+ 0.0002664696949068457,
+ 0.0002584822941571474
+ ],
+ "bp_grad_F": [
+ 0.032581742852926254,
+ 0.017135880887508392,
+ 0.01663898676633835,
+ 0.01656418852508068,
+ 0.016318844631314278
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.468500018119812,
+ "loss_eval": 1.4673320055007935,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 290.3281555175781,
+ 528.4644165039062,
+ 609.61181640625,
+ 589.482421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007876601885072887,
+ 0.000328866473864764,
+ 0.0003142827481497079,
+ 0.0003149702097289264,
+ 0.00030780391534790397
+ ],
+ "bp_grad_F": [
+ 0.0356873981654644,
+ 0.01825507916510105,
+ 0.01779749058187008,
+ 0.017760321497917175,
+ 0.0175130907446146
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.82278311252594,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 324.2997131347656,
+ 572.9197387695312,
+ 659.7073364257812,
+ 635.6883544921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006818437832407653,
+ 0.000307896378217265,
+ 0.0002974055823870003,
+ 0.000297438440611586,
+ 0.0002942352439276874
+ ],
+ "bp_grad_F": [
+ 0.03148573637008667,
+ 0.017155593261122704,
+ 0.016821201890707016,
+ 0.01674988865852356,
+ 0.016609078273177147
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4540000259876251,
+ "loss_eval": 1.4913204908370972,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 357.986572265625,
+ 616.8123168945312,
+ 709.2523193359375,
+ 681.3218994140625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006822228315286338,
+ 0.00030397844966501,
+ 0.0002927799359895289,
+ 0.0002928805770352483,
+ 0.0002893624478019774
+ ],
+ "bp_grad_F": [
+ 0.03142063319683075,
+ 0.017380017787218094,
+ 0.017113016918301582,
+ 0.017052780836820602,
+ 0.01693262904882431
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.42250001430511475,
+ "loss_eval": 1.574558138847351,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 391.00396728515625,
+ 660.1432495117188,
+ 758.46875,
+ 726.479248046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006576834712177515,
+ 0.00029913688194938004,
+ 0.0002909695322159678,
+ 0.00029160548001527786,
+ 0.0002882194530684501
+ ],
+ "bp_grad_F": [
+ 0.03063797578215599,
+ 0.01751694455742836,
+ 0.017304742708802223,
+ 0.017256034538149834,
+ 0.017157413065433502
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41700002551078796,
+ "loss_eval": 1.5943682193756104,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 423.0135803222656,
+ 702.8653564453125,
+ 807.1064453125,
+ 771.0443115234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007106211851350963,
+ 0.00032867168192751706,
+ 0.0003195058961864561,
+ 0.0003205789253115654,
+ 0.00031724729342386127
+ ],
+ "bp_grad_F": [
+ 0.032083574682474136,
+ 0.018385307863354683,
+ 0.01818086951971054,
+ 0.018159352242946625,
+ 0.01808425784111023
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3240000009536743,
+ "loss_eval": 1.9495495557785034,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 453.1861267089844,
+ 743.7100219726562,
+ 853.8812255859375,
+ 813.7102661132812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006489204824902117,
+ 0.0002889770839828998,
+ 0.00028184326947666705,
+ 0.00028282302082516253,
+ 0.00027834190404973924
+ ],
+ "bp_grad_F": [
+ 0.029847772791981697,
+ 0.017620669677853584,
+ 0.017466910183429718,
+ 0.01743420958518982,
+ 0.017375603318214417
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3970000147819519,
+ "loss_eval": 1.6998002529144287,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 480.8240661621094,
+ 781.491943359375,
+ 897.1333618164062,
+ 853.1820678710938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006337798549793661,
+ 0.0003062748000957072,
+ 0.0003002039447892457,
+ 0.00030039221746847034,
+ 0.0002973877126350999
+ ],
+ "bp_grad_F": [
+ 0.029168229550123215,
+ 0.017783651128411293,
+ 0.017649564892053604,
+ 0.017613932490348816,
+ 0.01756826601922512
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3865000307559967,
+ "loss_eval": 1.7693381309509277,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 505.9931945800781,
+ 816.3653564453125,
+ 937.6511840820312,
+ 890.0263061523438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006363698630593717,
+ 0.000327500601997599,
+ 0.0003217202320229262,
+ 0.0003208804700989276,
+ 0.0003201036306563765
+ ],
+ "bp_grad_F": [
+ 0.029376372694969177,
+ 0.018225492909550667,
+ 0.01810493879020214,
+ 0.01805899664759636,
+ 0.018048716709017754
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3400000035762787,
+ "loss_eval": 1.777511477470398,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 530.9385375976562,
+ 850.9844970703125,
+ 977.412841796875,
+ 926.3417358398438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006240232032723725,
+ 0.00032233193633146584,
+ 0.00031883586780168116,
+ 0.0003202730731572956,
+ 0.0003188494883943349
+ ],
+ "bp_grad_F": [
+ 0.028516914695501328,
+ 0.018217962235212326,
+ 0.018127964809536934,
+ 0.018103662878274918,
+ 0.018076416105031967
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.36250001192092896,
+ "loss_eval": 1.7461223602294922,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 555.9691162109375,
+ 885.6592407226562,
+ 1017.6103515625,
+ 962.8530883789062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005949487676844001,
+ 0.0003172095457557589,
+ 0.00031312211649492383,
+ 0.0003130651020910591,
+ 0.0003118007443845272
+ ],
+ "bp_grad_F": [
+ 0.027917204424738884,
+ 0.018052855506539345,
+ 0.017963001504540443,
+ 0.01793370023369789,
+ 0.017934400588274002
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3775000274181366,
+ "loss_eval": 1.7961357831954956,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 580.1717529296875,
+ 919.149169921875,
+ 1056.32470703125,
+ 998.1345825195312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006010148790664971,
+ 0.0003237369528505951,
+ 0.00031987245893105865,
+ 0.00031991174910217524,
+ 0.0003188104019500315
+ ],
+ "bp_grad_F": [
+ 0.027771273627877235,
+ 0.017915818840265274,
+ 0.017828019335865974,
+ 0.017802555114030838,
+ 0.017808666452765465
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.37400001287460327,
+ "loss_eval": 1.8124159574508667,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 602.5966186523438,
+ 950.484619140625,
+ 1092.6507568359375,
+ 1031.02294921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005852986359968781,
+ 0.0003249783185310662,
+ 0.00032142180134542286,
+ 0.0003207105037290603,
+ 0.00032108003506436944
+ ],
+ "bp_grad_F": [
+ 0.02701820805668831,
+ 0.01796947605907917,
+ 0.017892232164740562,
+ 0.017859354615211487,
+ 0.01788966730237007
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34950003027915955,
+ "loss_eval": 1.7797815799713135,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 624.4447021484375,
+ 981.1150512695312,
+ 1127.90234375,
+ 1063.09228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005775236058980227,
+ 0.0003046133788302541,
+ 0.00030120721203275025,
+ 0.00030136521672829986,
+ 0.00029937425279058516
+ ],
+ "bp_grad_F": [
+ 0.026447290554642677,
+ 0.017799606546759605,
+ 0.017730647698044777,
+ 0.017701666802167892,
+ 0.017717311158776283
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3630000054836273,
+ "loss_eval": 1.7884948253631592,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 644.9402465820312,
+ 1010.1371459960938,
+ 1161.7808837890625,
+ 1093.9410400390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000567529525142163,
+ 0.00032071411260403693,
+ 0.0003186226240359247,
+ 0.0003186469548381865,
+ 0.000316357531119138
+ ],
+ "bp_grad_F": [
+ 0.02652687579393387,
+ 0.018418341875076294,
+ 0.018360882997512817,
+ 0.018340308219194412,
+ 0.018352536484599113
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3375000059604645,
+ "loss_eval": 1.894034743309021,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 664.6719970703125,
+ 1038.15478515625,
+ 1194.3914794921875,
+ 1123.5455322265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005615526461042464,
+ 0.0003110080724582076,
+ 0.00030868081375956535,
+ 0.00030884178704582155,
+ 0.0003081669274251908
+ ],
+ "bp_grad_F": [
+ 0.025895435363054276,
+ 0.01783018186688423,
+ 0.017772147431969643,
+ 0.017754852771759033,
+ 0.01777641288936138
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3395000100135803,
+ "loss_eval": 1.9033000469207764,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 683.78173828125,
+ 1065.281005859375,
+ 1225.9638671875,
+ 1152.131591796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005448339506983757,
+ 0.0003069988451898098,
+ 0.0003048715298064053,
+ 0.0003052430984098464,
+ 0.00030476890970021486
+ ],
+ "bp_grad_F": [
+ 0.025077223777770996,
+ 0.017541181296110153,
+ 0.017490437254309654,
+ 0.01747160218656063,
+ 0.017498185858130455
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3840000033378601,
+ "loss_eval": 1.7054094076156616,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 701.634033203125,
+ 1090.699462890625,
+ 1255.5677490234375,
+ 1178.950927734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005554261151701212,
+ 0.0003436058177612722,
+ 0.0003414751263335347,
+ 0.0003412873193155974,
+ 0.0003412757650949061
+ ],
+ "bp_grad_F": [
+ 0.025991667062044144,
+ 0.018797792494297028,
+ 0.01875895820558071,
+ 0.018737811595201492,
+ 0.01877579651772976
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.2985000014305115,
+ "loss_eval": 1.9454095363616943,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 718.1909790039062,
+ 1114.3717041015625,
+ 1283.2196044921875,
+ 1204.0418701171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005466453148983419,
+ 0.00032576482044532895,
+ 0.00032447546254843473,
+ 0.0003244927211198956,
+ 0.0003245829720981419
+ ],
+ "bp_grad_F": [
+ 0.025174839422106743,
+ 0.01795799843966961,
+ 0.01791331358253956,
+ 0.017896415665745735,
+ 0.017930971458554268
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3190000057220459,
+ "loss_eval": 1.9117376804351807,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 734.4074096679688,
+ 1137.696044921875,
+ 1310.3448486328125,
+ 1228.5693359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005316757597029209,
+ 0.00032565969740971923,
+ 0.00032383095822297037,
+ 0.00032448669662699103,
+ 0.0003247321583330631
+ ],
+ "bp_grad_F": [
+ 0.024759862571954727,
+ 0.01794862188398838,
+ 0.01790694147348404,
+ 0.017891528084874153,
+ 0.017931628972291946
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3320000171661377,
+ "loss_eval": 1.8898653984069824,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 749.4878540039062,
+ 1159.565185546875,
+ 1335.8013916015625,
+ 1251.6041259765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005168311763554811,
+ 0.00031509375548921525,
+ 0.0003133788122795522,
+ 0.0003133984573651105,
+ 0.0003139932523481548
+ ],
+ "bp_grad_F": [
+ 0.0242743082344532,
+ 0.01778865046799183,
+ 0.0177480336278677,
+ 0.017732009291648865,
+ 0.01776931621134281
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3360000252723694,
+ "loss_eval": 1.809171199798584,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 763.5787353515625,
+ 1180.0230712890625,
+ 1359.6865234375,
+ 1273.1715087890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005242779734544456,
+ 0.0003271555178798735,
+ 0.00032485066913068295,
+ 0.0003253788163419813,
+ 0.00032494115293957293
+ ],
+ "bp_grad_F": [
+ 0.024425320327281952,
+ 0.01821528747677803,
+ 0.018175508826971054,
+ 0.018160372972488403,
+ 0.01819770224392414
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3290000259876251,
+ "loss_eval": 1.8727153539657593,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 777.29833984375,
+ 1199.8975830078125,
+ 1382.7962646484375,
+ 1294.0777587890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005091701750643551,
+ 0.0003165322996210307,
+ 0.00031451781978830695,
+ 0.00031486450461670756,
+ 0.00031427579233422875
+ ],
+ "bp_grad_F": [
+ 0.023803148418664932,
+ 0.017688797786831856,
+ 0.017653871327638626,
+ 0.01764090545475483,
+ 0.017672821879386902
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3570000231266022,
+ "loss_eval": 1.7817366123199463,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 789.7103881835938,
+ 1218.070556640625,
+ 1403.869384765625,
+ 1313.1611328125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000508163939230144,
+ 0.00031658579246141016,
+ 0.0003145384253002703,
+ 0.0003149410185869783,
+ 0.000314467353746295
+ ],
+ "bp_grad_F": [
+ 0.023785017430782318,
+ 0.017845386639237404,
+ 0.01781085878610611,
+ 0.017796490341424942,
+ 0.017827292904257774
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3255000114440918,
+ "loss_eval": 1.9139658212661743,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 801.9373779296875,
+ 1235.8994140625,
+ 1424.5323486328125,
+ 1331.8375244140625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004862714558839798,
+ 0.0002926513261627406,
+ 0.0002908864407800138,
+ 0.0002910781477112323,
+ 0.0002900509862229228
+ ],
+ "bp_grad_F": [
+ 0.023361189290881157,
+ 0.01766069605946541,
+ 0.01763027161359787,
+ 0.017619280144572258,
+ 0.017652587965130806
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.36100003123283386,
+ "loss_eval": 1.8068753480911255,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 813.853515625,
+ 1253.337890625,
+ 1444.873779296875,
+ 1350.2630615234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00048765321844257414,
+ 0.000307347479974851,
+ 0.00030599997262470424,
+ 0.000306078844005242,
+ 0.000305346620734781
+ ],
+ "bp_grad_F": [
+ 0.023688213899731636,
+ 0.01818004995584488,
+ 0.018153388053178787,
+ 0.018142297863960266,
+ 0.018173247575759888
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3360000252723694,
+ "loss_eval": 1.8813791275024414,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 824.7192993164062,
+ 1269.39208984375,
+ 1463.5384521484375,
+ 1367.15625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004835445433855057,
+ 0.0003096247965004295,
+ 0.0003079361922573298,
+ 0.00030804326524958014,
+ 0.0003073872940149158
+ ],
+ "bp_grad_F": [
+ 0.02330639213323593,
+ 0.01797325722873211,
+ 0.0179448202252388,
+ 0.017932146787643433,
+ 0.0179706122726202
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34150001406669617,
+ "loss_eval": 1.8429521322250366,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 834.9524536132812,
+ 1284.4827880859375,
+ 1481.0673828125,
+ 1383.0155029296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047791830729693174,
+ 0.0003027814091183245,
+ 0.0003019821015186608,
+ 0.0003020255535375327,
+ 0.0003012260131072253
+ ],
+ "bp_grad_F": [
+ 0.02303098328411579,
+ 0.01771283708512783,
+ 0.01768432930111885,
+ 0.017673376947641373,
+ 0.01770668476819992
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34850001335144043,
+ "loss_eval": 1.8080617189407349,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 844.5447998046875,
+ 1298.628662109375,
+ 1497.57373046875,
+ 1397.9241943359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000483115843962878,
+ 0.0003182529762852937,
+ 0.00031743990257382393,
+ 0.0003175203746650368,
+ 0.0003175794845446944
+ ],
+ "bp_grad_F": [
+ 0.02306683361530304,
+ 0.01790531352162361,
+ 0.017880147323012352,
+ 0.017869742587208748,
+ 0.017903709784150124
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.33100003004074097,
+ "loss_eval": 1.8166543245315552,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 853.7017822265625,
+ 1312.1446533203125,
+ 1513.2933349609375,
+ 1412.1080322265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047640595585107803,
+ 0.00031948628020472825,
+ 0.00031817753915674984,
+ 0.00031873476109467447,
+ 0.0003185000387020409
+ ],
+ "bp_grad_F": [
+ 0.022898783907294273,
+ 0.017956143245100975,
+ 0.017929796129465103,
+ 0.017917128279805183,
+ 0.017962384968996048
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.33800002932548523,
+ "loss_eval": 1.8004838228225708,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 862.0558471679688,
+ 1324.4920654296875,
+ 1527.697509765625,
+ 1425.1290283203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004698090488091111,
+ 0.00029860963695682585,
+ 0.0002971645735669881,
+ 0.0002974079397972673,
+ 0.00029624722083099186
+ ],
+ "bp_grad_F": [
+ 0.022676818072795868,
+ 0.01772218942642212,
+ 0.017698047682642937,
+ 0.017688868567347527,
+ 0.01772254891693592
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3530000150203705,
+ "loss_eval": 1.8075289726257324,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 869.9756469726562,
+ 1336.185791015625,
+ 1541.3792724609375,
+ 1437.4677734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004706987820100039,
+ 0.0003098493325524032,
+ 0.0003085599164478481,
+ 0.0003086493816226721,
+ 0.0003082384937442839
+ ],
+ "bp_grad_F": [
+ 0.022675253450870514,
+ 0.01779225468635559,
+ 0.017767589539289474,
+ 0.017757505178451538,
+ 0.017791779711842537
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34150001406669617,
+ "loss_eval": 1.827038288116455,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 877.3834838867188,
+ 1347.156982421875,
+ 1554.1087646484375,
+ 1448.9537353515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000473314750706777,
+ 0.00030716857872903347,
+ 0.0003054763947147876,
+ 0.0003060955787077546,
+ 0.0003047685313504189
+ ],
+ "bp_grad_F": [
+ 0.02272479608654976,
+ 0.01781822182238102,
+ 0.017794664949178696,
+ 0.01778644695878029,
+ 0.01781868003308773
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.32450002431869507,
+ "loss_eval": 1.8790045976638794,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 884.1793212890625,
+ 1357.25146484375,
+ 1565.88232421875,
+ 1459.538818359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046717250370420516,
+ 0.00030950061045587063,
+ 0.000308411312289536,
+ 0.00030838610837236047,
+ 0.00030820758547633886
+ ],
+ "bp_grad_F": [
+ 0.02260792814195156,
+ 0.017898347228765488,
+ 0.017876161262392998,
+ 0.017865851521492004,
+ 0.01790330745279789
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3225000202655792,
+ "loss_eval": 1.8583427667617798,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 890.4108276367188,
+ 1366.517333984375,
+ 1576.69921875,
+ 1469.300537109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004612848279066384,
+ 0.00030920191784389317,
+ 0.0003086488868575543,
+ 0.0003085103817284107,
+ 0.0003084034251514822
+ ],
+ "bp_grad_F": [
+ 0.022702287882566452,
+ 0.018074622377753258,
+ 0.01805359311401844,
+ 0.018043993040919304,
+ 0.018074078485369682
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.33250001072883606,
+ "loss_eval": 1.8819878101348877,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 896.1082763671875,
+ 1374.973388671875,
+ 1586.524169921875,
+ 1478.1490478515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046731752809137106,
+ 0.0003127296222373843,
+ 0.00031115938327275217,
+ 0.0003112337435595691,
+ 0.00031117399339564145
+ ],
+ "bp_grad_F": [
+ 0.022609086707234383,
+ 0.018025977537035942,
+ 0.01800408773124218,
+ 0.017995676025748253,
+ 0.018028175458312035
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3150000274181366,
+ "loss_eval": 1.8731034994125366,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 901.4246826171875,
+ 1382.871337890625,
+ 1595.7164306640625,
+ 1486.465576171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004559764638543129,
+ 0.00029873938183300197,
+ 0.00029821961652487516,
+ 0.0002982193836942315,
+ 0.0002976148098241538
+ ],
+ "bp_grad_F": [
+ 0.022443631663918495,
+ 0.017807144671678543,
+ 0.01778426393866539,
+ 0.017775312066078186,
+ 0.017809107899665833
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3190000057220459,
+ "loss_eval": 1.9132741689682007,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 906.219970703125,
+ 1389.97998046875,
+ 1603.95458984375,
+ 1493.869384765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00045692393905483186,
+ 0.000307796144625172,
+ 0.0003068537334911525,
+ 0.0003067644138354808,
+ 0.0003064550110138953
+ ],
+ "bp_grad_F": [
+ 0.022245025262236595,
+ 0.017795003950595856,
+ 0.0177734587341547,
+ 0.017764581367373466,
+ 0.017800522968173027
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3270000219345093,
+ "loss_eval": 1.8190391063690186,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 910.5570678710938,
+ 1396.3927001953125,
+ 1611.4957275390625,
+ 1500.6524658203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00045115925604477525,
+ 0.00029847086989320815,
+ 0.0002977230178657919,
+ 0.0002977572148665786,
+ 0.0002975583774968982
+ ],
+ "bp_grad_F": [
+ 0.02203645370900631,
+ 0.017681924626231194,
+ 0.01766141690313816,
+ 0.017652763053774834,
+ 0.0176865067332983
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35500001907348633,
+ "loss_eval": 1.7965762615203857,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 914.5003662109375,
+ 1402.2757568359375,
+ 1618.2999267578125,
+ 1506.7991943359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004569143056869507,
+ 0.00029972344054840505,
+ 0.0002987241605296731,
+ 0.0002987434563692659,
+ 0.00029907189309597015
+ ],
+ "bp_grad_F": [
+ 0.022272884845733643,
+ 0.01781252957880497,
+ 0.017791228368878365,
+ 0.017782466486096382,
+ 0.017818717285990715
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.328000009059906,
+ "loss_eval": 1.8610442876815796,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 918.0006103515625,
+ 1407.5118408203125,
+ 1624.3853759765625,
+ 1512.30029296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00045414711348712444,
+ 0.00030931030050851405,
+ 0.0003081976028624922,
+ 0.0003081892791669816,
+ 0.0003081847680732608
+ ],
+ "bp_grad_F": [
+ 0.022085461765527725,
+ 0.01779778115451336,
+ 0.017776912078261375,
+ 0.017768092453479767,
+ 0.01780613884329796
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34300002455711365,
+ "loss_eval": 1.804802417755127,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 921.121826171875,
+ 1412.175537109375,
+ 1629.830810546875,
+ 1517.2005615234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004531690792646259,
+ 0.00031135816243477166,
+ 0.00031044447678141296,
+ 0.00031072759884409606,
+ 0.0003106470685452223
+ ],
+ "bp_grad_F": [
+ 0.022044293582439423,
+ 0.017750630155205727,
+ 0.017730476334691048,
+ 0.017722314223647118,
+ 0.017757223919034004
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34150001406669617,
+ "loss_eval": 1.8111987113952637,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 923.8903198242188,
+ 1416.300048828125,
+ 1634.646484375,
+ 1521.5411376953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004468595434445888,
+ 0.0003022409218829125,
+ 0.00030127677018754184,
+ 0.00030117464484646916,
+ 0.00030144210904836655
+ ],
+ "bp_grad_F": [
+ 0.02193099819123745,
+ 0.017699316143989563,
+ 0.017679594457149506,
+ 0.017671333625912666,
+ 0.017706507816910744
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3525000214576721,
+ "loss_eval": 1.797281265258789,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 926.2950439453125,
+ 1419.8856201171875,
+ 1638.8184814453125,
+ 1525.284423828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044905568938702345,
+ 0.00030229080584831536,
+ 0.00030173707637004554,
+ 0.0003015522670466453,
+ 0.0003012538072653115
+ ],
+ "bp_grad_F": [
+ 0.021881939843297005,
+ 0.017657367512583733,
+ 0.017637958750128746,
+ 0.017629873007535934,
+ 0.01766354590654373
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34800001978874207,
+ "loss_eval": 1.8036439418792725,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 928.36181640625,
+ 1422.943359375,
+ 1642.3917236328125,
+ 1528.47705078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004465414967853576,
+ 0.00030299098580144346,
+ 0.00030190899269655347,
+ 0.00030191292171366513,
+ 0.000301982625387609
+ ],
+ "bp_grad_F": [
+ 0.02188783325254917,
+ 0.01768629439175129,
+ 0.01766696758568287,
+ 0.017658723518252373,
+ 0.017692700028419495
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.359000027179718,
+ "loss_eval": 1.7996938228607178,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 930.1182861328125,
+ 1425.561279296875,
+ 1645.422607421875,
+ 1531.2088623046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004439539334271103,
+ 0.00030093194800429046,
+ 0.00030001465347595513,
+ 0.0003001568838953972,
+ 0.0002998457639478147
+ ],
+ "bp_grad_F": [
+ 0.021926432847976685,
+ 0.01775786094367504,
+ 0.017738472670316696,
+ 0.01773017831146717,
+ 0.01776653714478016
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.8030681610107422,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 931.579345703125,
+ 1427.7337646484375,
+ 1647.9693603515625,
+ 1533.509033203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044511700980365276,
+ 0.00030080872238613665,
+ 0.00030003004940226674,
+ 0.0003000932920258492,
+ 0.00029993904172442853
+ ],
+ "bp_grad_F": [
+ 0.021828416734933853,
+ 0.017681054770946503,
+ 0.017661932855844498,
+ 0.017653752118349075,
+ 0.017688728868961334
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.7960853576660156,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 932.7696533203125,
+ 1429.520751953125,
+ 1650.0577392578125,
+ 1535.389892578125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004446738166734576,
+ 0.0003006414044648409,
+ 0.00030009649344719946,
+ 0.0003001675067935139,
+ 0.00029965140856802464
+ ],
+ "bp_grad_F": [
+ 0.021837500855326653,
+ 0.01768680103123188,
+ 0.017667656764388084,
+ 0.017659684643149376,
+ 0.017694275826215744
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35450002551078796,
+ "loss_eval": 1.8004000186920166,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 933.7157592773438,
+ 1430.9381103515625,
+ 1651.7154541015625,
+ 1536.879638671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044473307207226753,
+ 0.00030047594918869436,
+ 0.0002997968113049865,
+ 0.00029963525594212115,
+ 0.00029955641366541386
+ ],
+ "bp_grad_F": [
+ 0.0217889491468668,
+ 0.01765742339193821,
+ 0.01763851009309292,
+ 0.01763063855469227,
+ 0.017664924263954163
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3555000126361847,
+ "loss_eval": 1.7942780256271362,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 934.4593505859375,
+ 1432.0382080078125,
+ 1652.9989013671875,
+ 1538.0234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004453740257304162,
+ 0.0003002033627126366,
+ 0.00029949398594908416,
+ 0.00029964259010739625,
+ 0.0002993734087795019
+ ],
+ "bp_grad_F": [
+ 0.021799130365252495,
+ 0.017666727304458618,
+ 0.0176478810608387,
+ 0.017639974132180214,
+ 0.017674267292022705
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34550002217292786,
+ "loss_eval": 1.800949215888977,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 934.9984741210938,
+ 1432.84814453125,
+ 1653.939697265625,
+ 1538.8624267578125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044546957360580564,
+ 0.0003038236463908106,
+ 0.000302964064758271,
+ 0.00030298702768050134,
+ 0.00030283271917141974
+ ],
+ "bp_grad_F": [
+ 0.021853182464838028,
+ 0.017717286944389343,
+ 0.017698239535093307,
+ 0.017690137028694153,
+ 0.01772582344710827
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35600000619888306,
+ "loss_eval": 1.800832986831665,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.3856201171875,
+ 1433.427490234375,
+ 1654.6126708984375,
+ 1539.4669189453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044487748527899384,
+ 0.00030164900817908347,
+ 0.00030081532895565033,
+ 0.00030082385637797415,
+ 0.000300481216982007
+ ],
+ "bp_grad_F": [
+ 0.02177177555859089,
+ 0.017657004296779633,
+ 0.017638202756643295,
+ 0.017630264163017273,
+ 0.01766461506485939
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3490000069141388,
+ "loss_eval": 1.794891119003296,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.636474609375,
+ 1433.79345703125,
+ 1655.038330078125,
+ 1539.8505859375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004437313473317772,
+ 0.00030232034623622894,
+ 0.0003012971137650311,
+ 0.00030129036167636514,
+ 0.00030084658646956086
+ ],
+ "bp_grad_F": [
+ 0.021787401288747787,
+ 0.0176764614880085,
+ 0.017657602205872536,
+ 0.017649594694375992,
+ 0.017684470862150192
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35350000858306885,
+ "loss_eval": 1.7952260971069336,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.7716064453125,
+ 1433.996826171875,
+ 1655.2738037109375,
+ 1540.06298828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044510490261018276,
+ 0.0003025131591130048,
+ 0.00030167156364768744,
+ 0.0003019055584445596,
+ 0.00030186952790245414
+ ],
+ "bp_grad_F": [
+ 0.02179691381752491,
+ 0.017687244340777397,
+ 0.017668338492512703,
+ 0.017660312354564667,
+ 0.01769554615020752
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.7945536375045776,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.8350830078125,
+ 1434.09326171875,
+ 1655.3861083984375,
+ 1540.164794921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044426857493817806,
+ 0.0003006447514053434,
+ 0.0002995560353156179,
+ 0.0002996143593918532,
+ 0.0002996891853399575
+ ],
+ "bp_grad_F": [
+ 0.02177303098142147,
+ 0.017660290002822876,
+ 0.017641469836235046,
+ 0.017633574083447456,
+ 0.01766815222799778
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35850000381469727,
+ "loss_eval": 1.7939436435699463,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.8506469726562,
+ 1434.11669921875,
+ 1655.4130859375,
+ 1540.189208984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044382456690073013,
+ 0.0003010118380188942,
+ 0.0003002960584126413,
+ 0.00030042475555092096,
+ 0.00029991925111971796
+ ],
+ "bp_grad_F": [
+ 0.021775126457214355,
+ 0.01766343042254448,
+ 0.017644599080085754,
+ 0.017636677250266075,
+ 0.017671329900622368
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3595000207424164,
+ "loss_eval": 1.7936068773269653,
+ "epoch": 80
+ }
+ ],
+ "seed": 42,
+ "alpha": 1.0,
+ "depth": 4,
+ "d_hidden": 128
+} \ No newline at end of file
diff --git a/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json b/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json
new file mode 100644
index 0000000..438739c
--- /dev/null
+++ b/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json
@@ -0,0 +1,2276 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.290447235107422,
+ 11.313605308532715,
+ 11.351215362548828,
+ 11.398087501525879
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028353024390526116,
+ 0.0002828188880812377,
+ 0.00028162598027847707,
+ 0.0002799496578518301,
+ 0.0002791006409097463
+ ],
+ "bp_grad_F": [
+ 0.012684082612395287,
+ 0.01264861598610878,
+ 0.012589854188263416,
+ 0.012511610053479671,
+ 0.012471316382288933
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.08450000733137131,
+ "loss_eval": 2.4790313243865967,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.460872650146484,
+ 11.70040512084961,
+ 12.004783630371094,
+ 12.311223030090332
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004118149809073657,
+ 0.0003761148836929351,
+ 0.00034950554254464805,
+ 0.00032246875343844295,
+ 0.0002528287877794355
+ ],
+ "bp_grad_F": [
+ 0.018988799303770065,
+ 0.017196672037243843,
+ 0.015853216871619225,
+ 0.014456234872341156,
+ 0.011207858100533485
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5265000462532043,
+ "loss_eval": 1.4851115942001343,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.751569747924805,
+ 12.541290283203125,
+ 13.77841567993164,
+ 15.976567268371582
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007904200465418398,
+ 0.0006201046635396779,
+ 0.0004867047828156501,
+ 0.0003823215956799686,
+ 0.00022867691586725414
+ ],
+ "bp_grad_F": [
+ 0.041881538927555084,
+ 0.03210915997624397,
+ 0.025059428066015244,
+ 0.01950555481016636,
+ 0.011618814431130886
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6350000500679016,
+ "loss_eval": 0.959205687046051,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.018173217773438,
+ 13.625839233398438,
+ 16.65739631652832,
+ 22.032325744628906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008111135102808475,
+ 0.0005643682088702917,
+ 0.0004009789554402232,
+ 0.00029031067970208824,
+ 0.00016489777772221714
+ ],
+ "bp_grad_F": [
+ 0.059235598891973495,
+ 0.040808264166116714,
+ 0.02855612151324749,
+ 0.020608671009540558,
+ 0.011410079896450043
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6855000257492065,
+ "loss_eval": 0.818859875202179,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.308274269104004,
+ 15.27676010131836,
+ 21.78426170349121,
+ 30.742971420288086
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007430269033648074,
+ 0.000469190941657871,
+ 0.00030379975214600563,
+ 0.00021638885664287955,
+ 0.00012503107427619398
+ ],
+ "bp_grad_F": [
+ 0.06859903037548065,
+ 0.04267093911767006,
+ 0.027331173419952393,
+ 0.01921078749001026,
+ 0.01109629962593317
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6940000057220459,
+ "loss_eval": 0.7901937365531921,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.659590721130371,
+ 17.736019134521484,
+ 29.108901977539062,
+ 40.405487060546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007397185545414686,
+ 0.0004240924317855388,
+ 0.00025522997020743787,
+ 0.00018211310089100152,
+ 0.00011715881555574015
+ ],
+ "bp_grad_F": [
+ 0.07044756412506104,
+ 0.040140341967344284,
+ 0.024354523047804832,
+ 0.017343631014227867,
+ 0.01095715630799532
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6975000500679016,
+ "loss_eval": 0.8005170822143555,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.09460735321045,
+ 21.214082717895508,
+ 38.0382194519043,
+ 49.941673278808594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007781236781738698,
+ 0.00040500680916011333,
+ 0.00022763953893445432,
+ 0.00017000116349663585,
+ 0.0001182492560474202
+ ],
+ "bp_grad_F": [
+ 0.0692453384399414,
+ 0.037047095596790314,
+ 0.021944386884570122,
+ 0.016124187037348747,
+ 0.011101995594799519
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6925000548362732,
+ "loss_eval": 0.8182728290557861,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.613083839416504,
+ 25.80984878540039,
+ 47.72332763671875,
+ 58.812931060791016
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007534404867328703,
+ 0.00035873899469152093,
+ 0.00019843837071675807,
+ 0.00015793486090842634,
+ 0.00011804765381384641
+ ],
+ "bp_grad_F": [
+ 0.06768736243247986,
+ 0.034021928906440735,
+ 0.019909236580133438,
+ 0.015198245644569397,
+ 0.011175908148288727
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6945000290870667,
+ "loss_eval": 0.8370131254196167,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.181544303894043,
+ 31.215173721313477,
+ 57.29954147338867,
+ 67.44005584716797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008308067917823792,
+ 0.0003639743954408914,
+ 0.00018776576325763017,
+ 0.00015568821982014924,
+ 0.00012153007264714688
+ ],
+ "bp_grad_F": [
+ 0.0664583221077919,
+ 0.03186826407909393,
+ 0.018696729093790054,
+ 0.014834162779152393,
+ 0.011486423201858997
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6775000095367432,
+ "loss_eval": 0.8666528463363647,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.879924774169922,
+ 37.906219482421875,
+ 67.32949829101562,
+ 75.90506744384766
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000856662227306515,
+ 0.0003640915092546493,
+ 0.0001897388428915292,
+ 0.00016743727610446513,
+ 0.00013579493679571897
+ ],
+ "bp_grad_F": [
+ 0.06490001082420349,
+ 0.0302249975502491,
+ 0.018041465431451797,
+ 0.014820784330368042,
+ 0.011990511789917946
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6565000414848328,
+ "loss_eval": 0.9446665048599243,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.732318878173828,
+ 45.59952163696289,
+ 76.33224487304688,
+ 84.44403076171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008764212252572179,
+ 0.00035432647564448416,
+ 0.00017862815002445132,
+ 0.00016163433610927314,
+ 0.0001364263880532235
+ ],
+ "bp_grad_F": [
+ 0.06546498835086823,
+ 0.02990337274968624,
+ 0.01799662783741951,
+ 0.015155031345784664,
+ 0.012622621841728687
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6390000581741333,
+ "loss_eval": 1.0291955471038818,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 16.836196899414062,
+ 55.33602523803711,
+ 84.32881164550781,
+ 92.9534912109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000854950922075659,
+ 0.00036200409522280097,
+ 0.00018266236293129623,
+ 0.0001705951290205121,
+ 0.00014654053666163236
+ ],
+ "bp_grad_F": [
+ 0.06433594971895218,
+ 0.0289771668612957,
+ 0.017391620203852654,
+ 0.015173865482211113,
+ 0.012928354553878307
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6330000162124634,
+ "loss_eval": 1.076339840888977,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 19.05539894104004,
+ 69.66182708740234,
+ 97.1963119506836,
+ 102.74567413330078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008397337514907122,
+ 0.00034183592651970685,
+ 0.00018204437219537795,
+ 0.00017718512390274554,
+ 0.0001551504828967154
+ ],
+ "bp_grad_F": [
+ 0.062221452593803406,
+ 0.027522921562194824,
+ 0.01681770198047161,
+ 0.01498384214937687,
+ 0.013089192099869251
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.643500030040741,
+ "loss_eval": 1.0531169176101685,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 23.65813636779785,
+ 86.25741577148438,
+ 120.24312591552734,
+ 124.2949447631836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008297308231703937,
+ 0.0003140757908113301,
+ 0.00017996964743360877,
+ 0.00017669204680714756,
+ 0.00015717324276920408
+ ],
+ "bp_grad_F": [
+ 0.06484393030405045,
+ 0.028613954782485962,
+ 0.01715104468166828,
+ 0.01567785255610943,
+ 0.014462707564234734
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6255000233650208,
+ "loss_eval": 1.3249526023864746,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 30.92644500732422,
+ 102.1397705078125,
+ 147.9296417236328,
+ 157.7542266845703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008446995634585619,
+ 0.000312876160023734,
+ 0.00019047399109695107,
+ 0.00018901094153989106,
+ 0.00017103466961998492
+ ],
+ "bp_grad_F": [
+ 0.063303142786026,
+ 0.02876628190279007,
+ 0.01635562814772129,
+ 0.015436392277479172,
+ 0.014697290025651455
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6045000553131104,
+ "loss_eval": 1.394450306892395,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 40.05237579345703,
+ 123.65401458740234,
+ 173.33119201660156,
+ 188.9973907470703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008657039143145084,
+ 0.0003323613782413304,
+ 0.0002161249576602131,
+ 0.0002138354757335037,
+ 0.00019650986359920353
+ ],
+ "bp_grad_F": [
+ 0.054496586322784424,
+ 0.025836922228336334,
+ 0.0159344132989645,
+ 0.015238149091601372,
+ 0.014629158191382885
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5950000286102295,
+ "loss_eval": 1.1977143287658691,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 50.589420318603516,
+ 147.02255249023438,
+ 197.975830078125,
+ 217.0601806640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008191568194888532,
+ 0.00030697352485731244,
+ 0.00021884859597776085,
+ 0.00021713844034820795,
+ 0.00020184220920782536
+ ],
+ "bp_grad_F": [
+ 0.04439451918005943,
+ 0.021627753973007202,
+ 0.015079431235790253,
+ 0.0144795598462224,
+ 0.014037052169442177
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6115000247955322,
+ "loss_eval": 1.1207692623138428,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 61.36143112182617,
+ 169.08056640625,
+ 221.02748107910156,
+ 240.8756561279297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007864299113862216,
+ 0.0002859561063814908,
+ 0.0002155074180336669,
+ 0.00021533406106755137,
+ 0.00020066267461515963
+ ],
+ "bp_grad_F": [
+ 0.04005742073059082,
+ 0.01873522810637951,
+ 0.014609597623348236,
+ 0.014084910042583942,
+ 0.013653460890054703
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6175000071525574,
+ "loss_eval": 1.059693694114685,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 72.36003875732422,
+ 188.58563232421875,
+ 241.86294555664062,
+ 258.58087158203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007837018347345293,
+ 0.0002863232512027025,
+ 0.00022506402456201613,
+ 0.00022481133055407554,
+ 0.00021070068760309368
+ ],
+ "bp_grad_F": [
+ 0.039807844907045364,
+ 0.01775156892836094,
+ 0.01470963191241026,
+ 0.014359688386321068,
+ 0.01395167876034975
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6025000214576721,
+ "loss_eval": 1.1027324199676514,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 81.18446350097656,
+ 200.67935180664062,
+ 257.0839538574219,
+ 267.81317138671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00082020164700225,
+ 0.0003102799819316715,
+ 0.0002470446634106338,
+ 0.0002463961427565664,
+ 0.00023495900677517056
+ ],
+ "bp_grad_F": [
+ 0.041444260627031326,
+ 0.01803578995168209,
+ 0.014944672584533691,
+ 0.014712288975715637,
+ 0.014517528004944324
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5820000171661377,
+ "loss_eval": 1.146970272064209,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 91.12315368652344,
+ 208.71234130859375,
+ 269.7666931152344,
+ 278.79949951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008638632134534419,
+ 0.0003278621006757021,
+ 0.00026185397291556,
+ 0.00026034258189611137,
+ 0.0002510476915631443
+ ],
+ "bp_grad_F": [
+ 0.04429177567362785,
+ 0.018727537244558334,
+ 0.015489915385842323,
+ 0.01529665943235159,
+ 0.015330186113715172
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5394999980926514,
+ "loss_eval": 1.2919961214065552,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 104.20027160644531,
+ 224.12327575683594,
+ 292.86212158203125,
+ 302.2417297363281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008091026684269309,
+ 0.0002788364654406905,
+ 0.0002307023387402296,
+ 0.0002291825512656942,
+ 0.0002224020572612062
+ ],
+ "bp_grad_F": [
+ 0.043314289301633835,
+ 0.018204446882009506,
+ 0.01538326870650053,
+ 0.015148352831602097,
+ 0.015248478390276432
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615000128746033,
+ "loss_eval": 1.3774936199188232,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 119.46916198730469,
+ 246.84373474121094,
+ 322.8492736816406,
+ 331.5632019042969
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007946055266074836,
+ 0.0002993302186951041,
+ 0.0002581049920991063,
+ 0.00025690835900604725,
+ 0.00025083290529437363
+ ],
+ "bp_grad_F": [
+ 0.04004265367984772,
+ 0.017564039677381516,
+ 0.015413369052112103,
+ 0.01514766737818718,
+ 0.015221393667161465
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5430000424385071,
+ "loss_eval": 1.3054314851760864,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 136.81655883789062,
+ 275.0496826171875,
+ 359.30596923828125,
+ 365.4009704589844
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007907089893706143,
+ 0.00031880626920610666,
+ 0.00028100365307182074,
+ 0.0002786303812172264,
+ 0.00027127860812470317
+ ],
+ "bp_grad_F": [
+ 0.03825194016098976,
+ 0.017261793836951256,
+ 0.01555734220892191,
+ 0.01527914684265852,
+ 0.015313600189983845
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5270000100135803,
+ "loss_eval": 1.3047609329223633,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 154.3377227783203,
+ 303.1491394042969,
+ 395.8551330566406,
+ 398.4109191894531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007455120794475079,
+ 0.0002850848250091076,
+ 0.00025729817571118474,
+ 0.00025698516401462257,
+ 0.0002516870736144483
+ ],
+ "bp_grad_F": [
+ 0.03626802936196327,
+ 0.01676987297832966,
+ 0.015425236895680428,
+ 0.015152523294091225,
+ 0.015204805880784988
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5555000305175781,
+ "loss_eval": 1.2945412397384644,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 172.51333618164062,
+ 332.53106689453125,
+ 434.6177978515625,
+ 432.9015197753906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007499566418118775,
+ 0.00028473397833295166,
+ 0.0002601774758659303,
+ 0.0002574811805970967,
+ 0.00025375629775226116
+ ],
+ "bp_grad_F": [
+ 0.035628896206617355,
+ 0.016559967771172523,
+ 0.015500359237194061,
+ 0.015283019281923771,
+ 0.01530501153320074
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5250000357627869,
+ "loss_eval": 1.348174810409546,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 191.6818084716797,
+ 362.3817138671875,
+ 473.73529052734375,
+ 468.3863830566406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00077909289393574,
+ 0.0003061260504182428,
+ 0.0002848915464710444,
+ 0.000283668254269287,
+ 0.00027828654856421053
+ ],
+ "bp_grad_F": [
+ 0.03710347041487694,
+ 0.01679745502769947,
+ 0.01587643474340439,
+ 0.01569107361137867,
+ 0.015713181346654892
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.48750001192092896,
+ "loss_eval": 1.513879418373108,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 212.49392700195312,
+ 393.7915954589844,
+ 515.7852172851562,
+ 507.1173095703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007443951326422393,
+ 0.000309632858261466,
+ 0.00028767462936230004,
+ 0.0002863617264665663,
+ 0.00028263547574169934
+ ],
+ "bp_grad_F": [
+ 0.034536320716142654,
+ 0.01654498465359211,
+ 0.015813451260328293,
+ 0.015621310099959373,
+ 0.0156637541949749
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5090000033378601,
+ "loss_eval": 1.345898151397705,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 231.91209411621094,
+ 422.3776550292969,
+ 553.1364135742188,
+ 540.5762329101562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007372196414507926,
+ 0.0002908413589466363,
+ 0.00027582875918596983,
+ 0.0002760514325927943,
+ 0.00027193804271519184
+ ],
+ "bp_grad_F": [
+ 0.034806184470653534,
+ 0.01654907502233982,
+ 0.01595865748822689,
+ 0.01580234244465828,
+ 0.01584061235189438
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4970000088214874,
+ "loss_eval": 1.4695581197738647,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 251.87222290039062,
+ 452.5732116699219,
+ 591.4275512695312,
+ 574.1845703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007362416945397854,
+ 0.0002964947489090264,
+ 0.0002815316547639668,
+ 0.0002831071906257421,
+ 0.0002781452494673431
+ ],
+ "bp_grad_F": [
+ 0.034162748605012894,
+ 0.016219308599829674,
+ 0.01574064791202545,
+ 0.015600688755512238,
+ 0.015627028420567513
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.48100003600120544,
+ "loss_eval": 1.4220975637435913,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 272.3019104003906,
+ 483.1678161621094,
+ 631.2042846679688,
+ 609.8804931640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007130270241759717,
+ 0.0003075756540056318,
+ 0.00029428518610075116,
+ 0.00029221284785307944,
+ 0.0002892380871344358
+ ],
+ "bp_grad_F": [
+ 0.033144623041152954,
+ 0.01614796556532383,
+ 0.015754450112581253,
+ 0.015617748722434044,
+ 0.015651794150471687
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.49550002813339233,
+ "loss_eval": 1.398095726966858,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 293.1174621582031,
+ 513.9456176757812,
+ 671.4954223632812,
+ 646.9434204101562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007292498485185206,
+ 0.0003146968665532768,
+ 0.0003013227542396635,
+ 0.000301573658362031,
+ 0.00029794115107506514
+ ],
+ "bp_grad_F": [
+ 0.033789947628974915,
+ 0.016436096280813217,
+ 0.016089752316474915,
+ 0.015960095450282097,
+ 0.0159769207239151
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4570000171661377,
+ "loss_eval": 1.5174756050109863,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 312.291748046875,
+ 542.6367797851562,
+ 708.0426025390625,
+ 679.9037475585938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007159899105317891,
+ 0.0003197023761458695,
+ 0.00030903122387826443,
+ 0.0003080730966757983,
+ 0.00030512994271703064
+ ],
+ "bp_grad_F": [
+ 0.03305007144808769,
+ 0.016458848491311073,
+ 0.0161746796220541,
+ 0.01604822278022766,
+ 0.016068853437900543
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.45350003242492676,
+ "loss_eval": 1.4785963296890259,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 330.2493896484375,
+ 569.4765625,
+ 741.90380859375,
+ 710.49609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007181349792517722,
+ 0.0003215835604351014,
+ 0.00031238331575877964,
+ 0.00031264303834177554,
+ 0.0003104021889157593
+ ],
+ "bp_grad_F": [
+ 0.0329170823097229,
+ 0.016988366842269897,
+ 0.01674317568540573,
+ 0.01661907136440277,
+ 0.01665792241692543
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4320000112056732,
+ "loss_eval": 1.545434594154358,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 348.3463439941406,
+ 596.8388061523438,
+ 776.8276977539062,
+ 742.1928100585938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006930733215995133,
+ 0.0003099350433330983,
+ 0.0003020780859515071,
+ 0.0003008935309480876,
+ 0.00029881703085266054
+ ],
+ "bp_grad_F": [
+ 0.03210154175758362,
+ 0.0165875144302845,
+ 0.016380906105041504,
+ 0.016269827261567116,
+ 0.01630542054772377
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.46150001883506775,
+ "loss_eval": 1.4990708827972412,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 367.8572998046875,
+ 624.6773071289062,
+ 813.023193359375,
+ 774.825439453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006842412985861301,
+ 0.00032654378446750343,
+ 0.00031924000359140337,
+ 0.0003176531463395804,
+ 0.00031533741275779903
+ ],
+ "bp_grad_F": [
+ 0.03194142132997513,
+ 0.016769496724009514,
+ 0.01658361405134201,
+ 0.016465021297335625,
+ 0.016491062939167023
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4345000088214874,
+ "loss_eval": 1.5226876735687256,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 386.9555969238281,
+ 652.0831298828125,
+ 847.6653442382812,
+ 805.962158203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007009130204096437,
+ 0.00033408711897209287,
+ 0.00032650009961798787,
+ 0.00032573731732554734,
+ 0.00032366803498007357
+ ],
+ "bp_grad_F": [
+ 0.032547831535339355,
+ 0.01727951131761074,
+ 0.017110776156187057,
+ 0.017009133473038673,
+ 0.017040319740772247
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4025000333786011,
+ "loss_eval": 1.6661202907562256,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 405.57061767578125,
+ 678.9530639648438,
+ 881.5497436523438,
+ 835.913330078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006714131450280547,
+ 0.00031647825380787253,
+ 0.0003093808190897107,
+ 0.00030856815283186734,
+ 0.00030731584411114454
+ ],
+ "bp_grad_F": [
+ 0.030830882489681244,
+ 0.016467954963445663,
+ 0.016322584822773933,
+ 0.016228536143898964,
+ 0.01625511236488819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.44850000739097595,
+ "loss_eval": 1.5340722799301147,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 423.3720703125,
+ 705.0136108398438,
+ 914.5001831054688,
+ 865.4478759765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006793327047489583,
+ 0.0003244458057451993,
+ 0.0003182501532137394,
+ 0.00031923994538374245,
+ 0.00031612347811460495
+ ],
+ "bp_grad_F": [
+ 0.03101767599582672,
+ 0.01673293113708496,
+ 0.01659614033997059,
+ 0.016509832814335823,
+ 0.01653491146862507
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.42000001668930054,
+ "loss_eval": 1.6198900938034058,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 440.53741455078125,
+ 729.8703002929688,
+ 945.1349487304688,
+ 892.7785034179688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006624915986321867,
+ 0.00031068388489075005,
+ 0.00030363586847670376,
+ 0.00030243129003793,
+ 0.00030108148348517716
+ ],
+ "bp_grad_F": [
+ 0.030339404940605164,
+ 0.01675509847700596,
+ 0.016639690846204758,
+ 0.01655009388923645,
+ 0.016594169661402702
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4280000329017639,
+ "loss_eval": 1.6058467626571655,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 457.5261535644531,
+ 754.3056640625,
+ 975.5144653320312,
+ 919.8758544921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006706257117912173,
+ 0.0003283233381807804,
+ 0.00032177154207602143,
+ 0.0003207549743819982,
+ 0.0003196784819010645
+ ],
+ "bp_grad_F": [
+ 0.03072393499314785,
+ 0.016925832256674767,
+ 0.01681169681251049,
+ 0.01673683524131775,
+ 0.016768047586083412
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.39000001549720764,
+ "loss_eval": 1.7052431106567383,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 474.70233154296875,
+ 778.4963989257812,
+ 1005.5798950195312,
+ 947.08251953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006340838735923171,
+ 0.00030884164152666926,
+ 0.000303937413264066,
+ 0.00030318956123664975,
+ 0.0003018545394297689
+ ],
+ "bp_grad_F": [
+ 0.02923908829689026,
+ 0.016514884307980537,
+ 0.016419367864727974,
+ 0.016349095851182938,
+ 0.0163878221064806
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4390000104904175,
+ "loss_eval": 1.564381718635559,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 489.3309631347656,
+ 799.4293823242188,
+ 1031.868408203125,
+ 970.6136474609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006363792927004397,
+ 0.00032453436870127916,
+ 0.000319232844049111,
+ 0.0003183995431754738,
+ 0.00031706615118309855
+ ],
+ "bp_grad_F": [
+ 0.02950570173561573,
+ 0.016813522204756737,
+ 0.016721611842513084,
+ 0.016652515158057213,
+ 0.016693497076630592
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.42100003361701965,
+ "loss_eval": 1.605594515800476,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 502.8161315917969,
+ 819.462890625,
+ 1056.7576904296875,
+ 992.5881958007812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006477028946392238,
+ 0.00033125586924143136,
+ 0.0003257581265643239,
+ 0.000326100125676021,
+ 0.00032460023066960275
+ ],
+ "bp_grad_F": [
+ 0.029688136652112007,
+ 0.01694806106388569,
+ 0.01685865968465805,
+ 0.016797136515378952,
+ 0.016836510971188545
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3830000162124634,
+ "loss_eval": 1.673546552658081,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 517.00634765625,
+ 839.9920654296875,
+ 1082.26025390625,
+ 1015.0608520507812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006337560480460525,
+ 0.0003340205585118383,
+ 0.00032972541521303356,
+ 0.00032889688736759126,
+ 0.0003277511859778315
+ ],
+ "bp_grad_F": [
+ 0.029322637245059013,
+ 0.01695762574672699,
+ 0.016879092901945114,
+ 0.01681896671652794,
+ 0.016858574002981186
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.38350000977516174,
+ "loss_eval": 1.6975816488265991,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 529.66064453125,
+ 858.3285522460938,
+ 1104.83544921875,
+ 1035.074951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006231985753402114,
+ 0.00033350964076817036,
+ 0.00032944625127129257,
+ 0.00032876565819606185,
+ 0.00032806835952214897
+ ],
+ "bp_grad_F": [
+ 0.029069310054183006,
+ 0.016890447586774826,
+ 0.016818689182400703,
+ 0.016763897612690926,
+ 0.016804050654172897
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3930000066757202,
+ "loss_eval": 1.676193356513977,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 541.9931030273438,
+ 875.95556640625,
+ 1126.6197509765625,
+ 1054.3516845703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006226357654668391,
+ 0.00032438969356007874,
+ 0.0003203299711458385,
+ 0.0003203903906978667,
+ 0.00031863307231105864
+ ],
+ "bp_grad_F": [
+ 0.028472919017076492,
+ 0.016746005043387413,
+ 0.016683315858244896,
+ 0.016633223742246628,
+ 0.016673142090439796
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4165000319480896,
+ "loss_eval": 1.6569225788116455,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 555.5247802734375,
+ 895.108642578125,
+ 1150.2750244140625,
+ 1075.3402099609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006058313883841038,
+ 0.00031499756732955575,
+ 0.00031102998764254153,
+ 0.0003108317614533007,
+ 0.00030999473528936505
+ ],
+ "bp_grad_F": [
+ 0.028057299554347992,
+ 0.016642672941088676,
+ 0.016584018245339394,
+ 0.016536688432097435,
+ 0.016577772796154022
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41850000619888306,
+ "loss_eval": 1.622230887413025,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 566.745361328125,
+ 911.0077514648438,
+ 1169.5748291015625,
+ 1092.4599609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000616180885117501,
+ 0.0003297157527413219,
+ 0.00032601068960502744,
+ 0.0003262106911279261,
+ 0.00032522634137421846
+ ],
+ "bp_grad_F": [
+ 0.02835526503622532,
+ 0.016961509361863136,
+ 0.016903148964047432,
+ 0.01685917004942894,
+ 0.01690032333135605
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.39250001311302185,
+ "loss_eval": 1.714435338973999,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 578.6380004882812,
+ 927.9735107421875,
+ 1190.5294189453125,
+ 1111.001220703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006051660166122019,
+ 0.0003138712199870497,
+ 0.0003094248822890222,
+ 0.000309422001009807,
+ 0.0003081281029153615
+ ],
+ "bp_grad_F": [
+ 0.027995921671390533,
+ 0.016778133809566498,
+ 0.016729604452848434,
+ 0.01668645441532135,
+ 0.016727875918149948
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40450000762939453,
+ "loss_eval": 1.6801645755767822,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 591.34326171875,
+ 945.9314575195312,
+ 1212.5030517578125,
+ 1130.69580078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000600961095187813,
+ 0.00032534165075048804,
+ 0.0003221939841751009,
+ 0.00032207692856900394,
+ 0.00032122948323376477
+ ],
+ "bp_grad_F": [
+ 0.027977745980024338,
+ 0.017148323357105255,
+ 0.017105158418416977,
+ 0.017058631405234337,
+ 0.01710781268775463
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3930000066757202,
+ "loss_eval": 1.7086997032165527,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 602.791015625,
+ 962.1253051757812,
+ 1232.407958984375,
+ 1148.6063232421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005954196094535291,
+ 0.00032203743467107415,
+ 0.0003193309239577502,
+ 0.00031976529862731695,
+ 0.00031836770358495414
+ ],
+ "bp_grad_F": [
+ 0.027640262618660927,
+ 0.016875414177775383,
+ 0.01683391071856022,
+ 0.016794128343462944,
+ 0.016835639253258705
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.38750001788139343,
+ "loss_eval": 1.7161617279052734,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 613.0055541992188,
+ 976.7833251953125,
+ 1250.490966796875,
+ 1164.8575439453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005885999999009073,
+ 0.00031236460199579597,
+ 0.00030869650072418153,
+ 0.00030896696262061596,
+ 0.0003076815919484943
+ ],
+ "bp_grad_F": [
+ 0.027101732790470123,
+ 0.01670675352215767,
+ 0.016670193523168564,
+ 0.01663014106452465,
+ 0.016672657802700996
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41100001335144043,
+ "loss_eval": 1.6481956243515015,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 622.8380126953125,
+ 990.931640625,
+ 1267.7691650390625,
+ 1180.291015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000587237358558923,
+ 0.0003190709976479411,
+ 0.0003160224005114287,
+ 0.00031612091697752476,
+ 0.00031501890043728054
+ ],
+ "bp_grad_F": [
+ 0.027042290195822716,
+ 0.016803324222564697,
+ 0.016769535839557648,
+ 0.016731148585677147,
+ 0.016775181517004967
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40450000762939453,
+ "loss_eval": 1.6591061353683472,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 632.4323120117188,
+ 1004.666259765625,
+ 1284.4637451171875,
+ 1195.189697265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005885775317437947,
+ 0.0003397047985345125,
+ 0.0003383393050171435,
+ 0.00033765248372219503,
+ 0.00033701834036037326
+ ],
+ "bp_grad_F": [
+ 0.027301670983433723,
+ 0.017337650060653687,
+ 0.017313728109002113,
+ 0.017269184812903404,
+ 0.0173148512840271
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3565000295639038,
+ "loss_eval": 1.7250425815582275,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 639.983154296875,
+ 1015.8214721679688,
+ 1297.94091796875,
+ 1207.160400390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005771536380052567,
+ 0.00031455705175176263,
+ 0.0003114652936346829,
+ 0.0003115544968750328,
+ 0.00031060961191542447
+ ],
+ "bp_grad_F": [
+ 0.026900731027126312,
+ 0.01682351529598236,
+ 0.01679442636668682,
+ 0.016759345307946205,
+ 0.016801798716187477
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.398000031709671,
+ "loss_eval": 1.6931191682815552,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 648.44189453125,
+ 1027.905517578125,
+ 1312.5484619140625,
+ 1220.3349609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005807234556414187,
+ 0.0003243165265303105,
+ 0.00032131426269188523,
+ 0.0003215263714082539,
+ 0.0003202861698810011
+ ],
+ "bp_grad_F": [
+ 0.02689860761165619,
+ 0.016972798854112625,
+ 0.016945669427514076,
+ 0.016909556463360786,
+ 0.01695423573255539
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3850000202655792,
+ "loss_eval": 1.713501214981079,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 656.1256103515625,
+ 1038.9337158203125,
+ 1326.0384521484375,
+ 1232.491455078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005809550639241934,
+ 0.0003213974996469915,
+ 0.0003191177383996546,
+ 0.0003187706752214581,
+ 0.0003176441532559693
+ ],
+ "bp_grad_F": [
+ 0.026944397017359734,
+ 0.016979368403553963,
+ 0.01695428043603897,
+ 0.01692255586385727,
+ 0.016963332891464233
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3800000250339508,
+ "loss_eval": 1.7483241558074951,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 663.1458740234375,
+ 1049.1085205078125,
+ 1338.4049072265625,
+ 1243.709228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005775660974904895,
+ 0.00032701215241104364,
+ 0.000323877960909158,
+ 0.00032368660322390497,
+ 0.00032316104625351727
+ ],
+ "bp_grad_F": [
+ 0.026842813938856125,
+ 0.017009008675813675,
+ 0.016984863206744194,
+ 0.016950154677033424,
+ 0.016992947086691856
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.36650002002716064,
+ "loss_eval": 1.7447302341461182,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 669.32080078125,
+ 1058.1265869140625,
+ 1349.383544921875,
+ 1253.68603515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005691531114280224,
+ 0.0003169954870827496,
+ 0.0003141614724881947,
+ 0.00031412398675456643,
+ 0.00031352281803265214
+ ],
+ "bp_grad_F": [
+ 0.026560034602880478,
+ 0.01695145107805729,
+ 0.016930771991610527,
+ 0.016894754022359848,
+ 0.016942735761404037
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3830000162124634,
+ "loss_eval": 1.7227482795715332,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 675.035888671875,
+ 1066.407958984375,
+ 1359.420654296875,
+ 1262.8460693359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000574529985897243,
+ 0.000330567971104756,
+ 0.0003291864413768053,
+ 0.0003286501159891486,
+ 0.00032822080538608134
+ ],
+ "bp_grad_F": [
+ 0.02670128643512726,
+ 0.017140112817287445,
+ 0.017120162025094032,
+ 0.01708981581032276,
+ 0.017130881547927856
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.37800002098083496,
+ "loss_eval": 1.7512460947036743,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 680.7155151367188,
+ 1074.5833740234375,
+ 1369.3917236328125,
+ 1271.9488525390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005727651296183467,
+ 0.00031855711131356657,
+ 0.0003159786283504218,
+ 0.00031576541368849576,
+ 0.0003150397096760571
+ ],
+ "bp_grad_F": [
+ 0.02646380476653576,
+ 0.016906103119254112,
+ 0.016886914148926735,
+ 0.016857335343956947,
+ 0.016896924003958702
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.39100003242492676,
+ "loss_eval": 1.7765766382217407,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 685.6483154296875,
+ 1081.7335205078125,
+ 1378.0848388671875,
+ 1279.824462890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005669392994605005,
+ 0.00032193740480579436,
+ 0.0003195095050614327,
+ 0.00031930883415043354,
+ 0.00031847937498241663
+ ],
+ "bp_grad_F": [
+ 0.02628612145781517,
+ 0.01694479025900364,
+ 0.016926957294344902,
+ 0.016897274181246758,
+ 0.016937877982854843
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.38200002908706665,
+ "loss_eval": 1.6996668577194214,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 690.3829345703125,
+ 1088.4320068359375,
+ 1386.209228515625,
+ 1287.180908203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005609798245131969,
+ 0.0003164574736729264,
+ 0.00031414616387337446,
+ 0.0003141844645142555,
+ 0.0003133733116555959
+ ],
+ "bp_grad_F": [
+ 0.025919275358319283,
+ 0.01681407354772091,
+ 0.016797930002212524,
+ 0.01676807552576065,
+ 0.016810856759548187
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4035000205039978,
+ "loss_eval": 1.6783148050308228,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 694.658935546875,
+ 1094.5535888671875,
+ 1393.6761474609375,
+ 1293.9659423828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005624280893243849,
+ 0.00031574408058077097,
+ 0.0003139691543765366,
+ 0.00031461575417779386,
+ 0.00031346286414191127
+ ],
+ "bp_grad_F": [
+ 0.02617610991001129,
+ 0.016873449087142944,
+ 0.016857409849762917,
+ 0.01682792603969574,
+ 0.016867902129888535
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3830000162124634,
+ "loss_eval": 1.7127265930175781,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 698.4141235351562,
+ 1099.921875,
+ 1400.2060546875,
+ 1299.92919921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005497613456100225,
+ 0.00031591873266734183,
+ 0.00031333384686149657,
+ 0.00031392619712278247,
+ 0.00031339324777945876
+ ],
+ "bp_grad_F": [
+ 0.025806115940213203,
+ 0.016780776903033257,
+ 0.016766363754868507,
+ 0.016736920922994614,
+ 0.01677793264389038
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4165000319480896,
+ "loss_eval": 1.6823266744613647,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 701.8402099609375,
+ 1104.8636474609375,
+ 1406.2545166015625,
+ 1305.4110107421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005536439130082726,
+ 0.0003222717496100813,
+ 0.0003193898010067642,
+ 0.0003197654150426388,
+ 0.00031906200456433
+ ],
+ "bp_grad_F": [
+ 0.02591872774064541,
+ 0.016899071633815765,
+ 0.01688431203365326,
+ 0.01685412786900997,
+ 0.016896730288863182
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3895000219345093,
+ "loss_eval": 1.6973413228988647,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 704.84814453125,
+ 1109.2054443359375,
+ 1411.5528564453125,
+ 1310.220458984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005509129259735346,
+ 0.0003127358213532716,
+ 0.00031018650042824447,
+ 0.00031017058063298464,
+ 0.0003093581763096154
+ ],
+ "bp_grad_F": [
+ 0.02567744068801403,
+ 0.01674523949623108,
+ 0.01673281565308571,
+ 0.016704324632883072,
+ 0.01674455776810646
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40400001406669617,
+ "loss_eval": 1.6765486001968384,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 707.4666137695312,
+ 1112.9517822265625,
+ 1416.120361328125,
+ 1314.365478515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005525590386241674,
+ 0.0003146192757412791,
+ 0.000312337331706658,
+ 0.0003126179799437523,
+ 0.00031193779432214797
+ ],
+ "bp_grad_F": [
+ 0.025625307112932205,
+ 0.016738714650273323,
+ 0.01672603376209736,
+ 0.016697421669960022,
+ 0.016738519072532654
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.406000018119812,
+ "loss_eval": 1.681616187095642,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 709.6942749023438,
+ 1116.1553955078125,
+ 1420.0328369140625,
+ 1317.9129638671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005520040867850184,
+ 0.0003149699477944523,
+ 0.0003132218262180686,
+ 0.00031297295936383307,
+ 0.0003122398047707975
+ ],
+ "bp_grad_F": [
+ 0.02563839592039585,
+ 0.01678294688463211,
+ 0.016770213842391968,
+ 0.01674121432006359,
+ 0.01678287237882614
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3985000252723694,
+ "loss_eval": 1.6824655532836914,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 711.4514770507812,
+ 1118.6820068359375,
+ 1423.118408203125,
+ 1320.7220458984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005478749517351389,
+ 0.0003126654773950577,
+ 0.00031092006247490644,
+ 0.0003107163356617093,
+ 0.00030992255778983235
+ ],
+ "bp_grad_F": [
+ 0.025653105229139328,
+ 0.016804352402687073,
+ 0.01679334044456482,
+ 0.016765642911195755,
+ 0.016805216670036316
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3970000147819519,
+ "loss_eval": 1.6816198825836182,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 712.941162109375,
+ 1120.8258056640625,
+ 1425.7293701171875,
+ 1323.110595703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005502297426573932,
+ 0.00031594440224580467,
+ 0.00031323955045081675,
+ 0.0003133862919639796,
+ 0.00031268122256733477
+ ],
+ "bp_grad_F": [
+ 0.025557825341820717,
+ 0.01675795204937458,
+ 0.01674625650048256,
+ 0.01671820878982544,
+ 0.016758527606725693
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4025000333786011,
+ "loss_eval": 1.6777657270431519,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 714.2026977539062,
+ 1122.637451171875,
+ 1427.94921875,
+ 1325.1287841796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005491463234648108,
+ 0.0003148230316583067,
+ 0.00031261687399819493,
+ 0.0003126751398667693,
+ 0.00031198892975226045
+ ],
+ "bp_grad_F": [
+ 0.025629354640841484,
+ 0.016796274110674858,
+ 0.016784505918622017,
+ 0.016756094992160797,
+ 0.01679658703505993
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3985000252723694,
+ "loss_eval": 1.6832109689712524,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 715.1837158203125,
+ 1124.0401611328125,
+ 1429.676025390625,
+ 1326.6959228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005472805933095515,
+ 0.00031123129883781075,
+ 0.0003085967618972063,
+ 0.00030910191708244383,
+ 0.00030826785950921476
+ ],
+ "bp_grad_F": [
+ 0.025491509586572647,
+ 0.01673061214387417,
+ 0.016719412058591843,
+ 0.01669108308851719,
+ 0.016732096672058105
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41350001096725464,
+ "loss_eval": 1.6768076419830322,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 715.9666137695312,
+ 1125.15869140625,
+ 1431.054931640625,
+ 1327.940185546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005469402531161904,
+ 0.0003141815832350403,
+ 0.0003117373853456229,
+ 0.0003121092449873686,
+ 0.00031146654509939253
+ ],
+ "bp_grad_F": [
+ 0.02553613670170307,
+ 0.016766469925642014,
+ 0.016755321994423866,
+ 0.01672743633389473,
+ 0.01676766574382782
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40050002932548523,
+ "loss_eval": 1.6803343296051025,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 716.54345703125,
+ 1125.9932861328125,
+ 1432.0760498046875,
+ 1328.8612060546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000544340000487864,
+ 0.0003152569697704166,
+ 0.00031408306676894426,
+ 0.00031385221518576145,
+ 0.0003130683908239007
+ ],
+ "bp_grad_F": [
+ 0.025559071451425552,
+ 0.016799958422780037,
+ 0.01678895764052868,
+ 0.016760708764195442,
+ 0.01680118963122368
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40050002932548523,
+ "loss_eval": 1.6816425323486328,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 716.944580078125,
+ 1126.5697021484375,
+ 1432.786376953125,
+ 1329.5032958984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005474911304190755,
+ 0.00031179687357507646,
+ 0.0003097430744674057,
+ 0.00030947139021009207,
+ 0.00030854580109007657
+ ],
+ "bp_grad_F": [
+ 0.025479920208454132,
+ 0.01673789508640766,
+ 0.016726836562156677,
+ 0.016698846593499184,
+ 0.01673932373523712
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4010000228881836,
+ "loss_eval": 1.6769893169403076,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.2020263671875,
+ 1126.9422607421875,
+ 1433.2410888671875,
+ 1329.9195556640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000546319643035531,
+ 0.00031345203751698136,
+ 0.000311522395350039,
+ 0.000311847630655393,
+ 0.0003111722180619836
+ ],
+ "bp_grad_F": [
+ 0.025481175631284714,
+ 0.01675844006240368,
+ 0.016747308894991875,
+ 0.016719479113817215,
+ 0.0167598407715559
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4075000286102295,
+ "loss_eval": 1.6769570112228394,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.3436889648438,
+ 1127.1475830078125,
+ 1433.49072265625,
+ 1330.1451416015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005438647349365056,
+ 0.00031364860478788614,
+ 0.0003113296115770936,
+ 0.0003115428553428501,
+ 0.00031094413134269416
+ ],
+ "bp_grad_F": [
+ 0.025495020672678947,
+ 0.016764776781201363,
+ 0.016753805801272392,
+ 0.016725784167647362,
+ 0.016766248270869255
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40800002217292786,
+ "loss_eval": 1.6758222579956055,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.4073486328125,
+ 1127.239501953125,
+ 1433.60302734375,
+ 1330.2476806640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005444776033982635,
+ 0.0003124381182715297,
+ 0.0003098779125139117,
+ 0.0003102763439528644,
+ 0.0003094278508797288
+ ],
+ "bp_grad_F": [
+ 0.025471549481153488,
+ 0.016743116080760956,
+ 0.016732197254896164,
+ 0.016704153269529343,
+ 0.016744764521718025
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41450002789497375,
+ "loss_eval": 1.675687551498413,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.4231567382812,
+ 1127.262451171875,
+ 1433.6309814453125,
+ 1330.273193359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005445098504424095,
+ 0.0003131923731416464,
+ 0.00031077052699401975,
+ 0.0003107219818048179,
+ 0.00031013842090032995
+ ],
+ "bp_grad_F": [
+ 0.02547312155365944,
+ 0.016745658591389656,
+ 0.016734709963202477,
+ 0.016706665977835655,
+ 0.016747286543250084
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4140000343322754,
+ "loss_eval": 1.6754448413848877,
+ "epoch": 80
+ }
+ ],
+ "seed": 42,
+ "alpha": 1.0,
+ "depth": 4,
+ "d_hidden": 128
+} \ No newline at end of file
diff --git a/results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json b/results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json
new file mode 100644
index 0000000..9972e9a
--- /dev/null
+++ b/results/snapshot_synth_v1/snapshot_synth_a1.0_L4_s42.json
@@ -0,0 +1,4960 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_synth_v1",
+ "epochs": 80,
+ "alpha": 1.0,
+ "depth": 4,
+ "seed": 42,
+ "d_hidden": 128,
+ "lr": 0.001,
+ "wd": 0.01
+ },
+ "depth": 4,
+ "d_hidden": 128,
+ "num_classes": 10,
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.290447235107422,
+ 11.313605308532715,
+ 11.351215362548828,
+ 11.398087501525879
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028353024390526116,
+ 0.0002828188880812377,
+ 0.00028162598027847707,
+ 0.0002799496578518301,
+ 0.0002791006409097463
+ ],
+ "bp_grad_F": [
+ 0.012684082612395287,
+ 0.01264861598610878,
+ 0.012589854188263416,
+ 0.012511610053479671,
+ 0.012471316382288933
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.08450000733137131,
+ "loss_eval": 2.4790313243865967,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.301911354064941,
+ 11.659679412841797,
+ 12.48208999633789,
+ 13.934065818786621
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006583131616935134,
+ 0.0004948809510096908,
+ 0.00036159728188067675,
+ 0.00026353230350650847,
+ 0.00020344744552858174
+ ],
+ "bp_grad_F": [
+ 0.03319504112005234,
+ 0.0246991366147995,
+ 0.017943235114216805,
+ 0.012967471033334732,
+ 0.009912492707371712
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7095000147819519,
+ "loss_eval": 0.8666461110115051,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.28874397277832,
+ 12.022683143615723,
+ 13.943255424499512,
+ 17.510770797729492
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007016682648099959,
+ 0.00048243277706205845,
+ 0.00031948124524205923,
+ 0.00020489063172135502,
+ 0.00014097581151872873
+ ],
+ "bp_grad_F": [
+ 0.05366413667798042,
+ 0.03651106730103493,
+ 0.023700030520558357,
+ 0.015033061616122723,
+ 0.010093427263200283
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7725000381469727,
+ "loss_eval": 0.6004051566123962,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.268131256103516,
+ 12.138687133789062,
+ 14.603575706481934,
+ 19.109115600585938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000659371551591903,
+ 0.0004339825245551765,
+ 0.00027271744329482317,
+ 0.0001733575772959739,
+ 0.0001116431230911985
+ ],
+ "bp_grad_F": [
+ 0.06363420188426971,
+ 0.04213711991906166,
+ 0.0264370646327734,
+ 0.016141116619110107,
+ 0.010473517701029778
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7745000123977661,
+ "loss_eval": 0.5640328526496887,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.245299339294434,
+ 12.213927268981934,
+ 14.944411277770996,
+ 19.937482833862305
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000589758506976068,
+ 0.00038736555143259466,
+ 0.000245077651925385,
+ 0.00015142903430387378,
+ 9.591270645614713e-05
+ ],
+ "bp_grad_F": [
+ 0.06846851110458374,
+ 0.04497711360454559,
+ 0.027850953862071037,
+ 0.01671868935227394,
+ 0.01068752072751522
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7835000157356262,
+ "loss_eval": 0.5508342981338501,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.22258186340332,
+ 12.241990089416504,
+ 15.219721794128418,
+ 20.66508674621582
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005271711852401495,
+ 0.00034995534224435687,
+ 0.00021946353081148118,
+ 0.00013214732462074608,
+ 8.23614391265437e-05
+ ],
+ "bp_grad_F": [
+ 0.07378005236387253,
+ 0.04831067472696304,
+ 0.02961091324687004,
+ 0.01746201328933239,
+ 0.010955682955682278
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7855000495910645,
+ "loss_eval": 0.5423576831817627,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.190115928649902,
+ 12.27110481262207,
+ 15.450979232788086,
+ 21.203943252563477
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005092737264931202,
+ 0.00033784759580157697,
+ 0.00020663061877712607,
+ 0.0001207139139296487,
+ 7.417408050969243e-05
+ ],
+ "bp_grad_F": [
+ 0.07774882018566132,
+ 0.051034994423389435,
+ 0.031082650646567345,
+ 0.018063966184854507,
+ 0.01114849466830492
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7845000624656677,
+ "loss_eval": 0.5346181392669678,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.167141914367676,
+ 12.275080680847168,
+ 15.592608451843262,
+ 21.725374221801758
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005083799478597939,
+ 0.00033595148124732077,
+ 0.0002061770501313731,
+ 0.00011957385140703991,
+ 7.27532897144556e-05
+ ],
+ "bp_grad_F": [
+ 0.08175421506166458,
+ 0.053990282118320465,
+ 0.03277580440044403,
+ 0.01879614032804966,
+ 0.011419840157032013
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7905000448226929,
+ "loss_eval": 0.5348329544067383,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.135689735412598,
+ 12.291831016540527,
+ 15.776432991027832,
+ 22.2913761138916
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004477855109144002,
+ 0.0003000828146468848,
+ 0.00018366402946412563,
+ 0.00010473958536749706,
+ 6.266004493227229e-05
+ ],
+ "bp_grad_F": [
+ 0.08535438776016235,
+ 0.05686107277870178,
+ 0.03441749885678291,
+ 0.019436663016676903,
+ 0.011580240912735462
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796500027179718,
+ "loss_eval": 0.5225732326507568,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.113900184631348,
+ 12.296534538269043,
+ 15.874000549316406,
+ 22.73569107055664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00041620698175393045,
+ 0.00028262173873372376,
+ 0.0001732171222101897,
+ 9.77468880591914e-05,
+ 5.725537994294427e-05
+ ],
+ "bp_grad_F": [
+ 0.09095799922943115,
+ 0.061118144541978836,
+ 0.036917947232723236,
+ 0.020527740940451622,
+ 0.011972126550972462
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7945000529289246,
+ "loss_eval": 0.5336357355117798,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.088306427001953,
+ 12.3102388381958,
+ 16.0321102142334,
+ 23.320507049560547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003761165135074407,
+ 0.0002580824075266719,
+ 0.00015763533883728087,
+ 8.57545601320453e-05,
+ 5.005364437238313e-05
+ ],
+ "bp_grad_F": [
+ 0.09630071371793747,
+ 0.06542361527681351,
+ 0.039454828947782516,
+ 0.02160210721194744,
+ 0.012356426566839218
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7915000319480896,
+ "loss_eval": 0.5405644774436951,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.062504768371582,
+ 12.296314239501953,
+ 16.1483211517334,
+ 23.885089874267578
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003359524707775563,
+ 0.00023470049200113863,
+ 0.00014604303578380495,
+ 7.898044714238495e-05,
+ 4.356990029918961e-05
+ ],
+ "bp_grad_F": [
+ 0.09961758553981781,
+ 0.06847036629915237,
+ 0.04127706214785576,
+ 0.02224603295326233,
+ 0.01243517268449068
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8020000457763672,
+ "loss_eval": 0.5290275812149048,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.040243148803711,
+ 12.293885231018066,
+ 16.26875114440918,
+ 24.44219207763672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028416418354026973,
+ 0.0001959044166142121,
+ 0.00011818648636108264,
+ 6.387147004716098e-05,
+ 3.619954804889858e-05
+ ],
+ "bp_grad_F": [
+ 0.10626755654811859,
+ 0.07399805635213852,
+ 0.044546131044626236,
+ 0.023592140525579453,
+ 0.012874037958681583
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8005000352859497,
+ "loss_eval": 0.5458852648735046,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.011943817138672,
+ 12.278276443481445,
+ 16.34218978881836,
+ 24.94852066040039
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002902932756114751,
+ 0.00020653512910939753,
+ 0.0001265774480998516,
+ 6.573591963388026e-05,
+ 3.462762470007874e-05
+ ],
+ "bp_grad_F": [
+ 0.1133178174495697,
+ 0.07985687255859375,
+ 0.048010025173425674,
+ 0.025017691776156425,
+ 0.013337739743292332
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 0.5682750940322876,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.992447853088379,
+ 12.299921035766602,
+ 16.492944717407227,
+ 25.524486541748047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00023213925305753946,
+ 0.00016858529124874622,
+ 0.00010339246364310384,
+ 5.375607725000009e-05,
+ 2.8085371013730764e-05
+ ],
+ "bp_grad_F": [
+ 0.11885266751050949,
+ 0.08489131927490234,
+ 0.051101066172122955,
+ 0.02628019079566002,
+ 0.013745996169745922
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.5884183645248413,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.968864440917969,
+ 12.2804536819458,
+ 16.559459686279297,
+ 26.08506965637207
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00020740363106597215,
+ 0.00015108383377082646,
+ 9.300659439759329e-05,
+ 4.728052954305895e-05,
+ 2.4296168703585863e-05
+ ],
+ "bp_grad_F": [
+ 0.12586721777915955,
+ 0.09100162982940674,
+ 0.0545843243598938,
+ 0.027565589174628258,
+ 0.014059619046747684
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.5945348143577576,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.95374870300293,
+ 12.280479431152344,
+ 16.662782669067383,
+ 26.677371978759766
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001737641723593697,
+ 0.00012793064524885267,
+ 7.821117469575256e-05,
+ 3.888122591888532e-05,
+ 2.000005952140782e-05
+ ],
+ "bp_grad_F": [
+ 0.1330755203962326,
+ 0.09730331599712372,
+ 0.05829176306724548,
+ 0.028968123719096184,
+ 0.014443416148424149
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7985000610351562,
+ "loss_eval": 0.6085594296455383,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.9340181350708,
+ 12.276576042175293,
+ 16.712459564208984,
+ 27.161230087280273
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001674877858022228,
+ 0.00012590538244694471,
+ 7.574073242722079e-05,
+ 3.732396726263687e-05,
+ 1.86969518836122e-05
+ ],
+ "bp_grad_F": [
+ 0.13938488066196442,
+ 0.10323134809732437,
+ 0.061863236129283905,
+ 0.0303154569119215,
+ 0.01477954164147377
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7935000658035278,
+ "loss_eval": 0.6137893199920654,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.915549278259277,
+ 12.273784637451172,
+ 16.833044052124023,
+ 27.70804214477539
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00013765814946964383,
+ 0.00010384680354036391,
+ 6.252297316677868e-05,
+ 3.0995015549706295e-05,
+ 1.5171532140811905e-05
+ ],
+ "bp_grad_F": [
+ 0.1456620693206787,
+ 0.10904198884963989,
+ 0.06525038182735443,
+ 0.03156846761703491,
+ 0.015115385875105858
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8065000176429749,
+ "loss_eval": 0.646562933921814,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.900074005126953,
+ 12.271150588989258,
+ 16.89704704284668,
+ 28.26544761657715
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00012433489609975368,
+ 9.527598012937233e-05,
+ 5.774956298409961e-05,
+ 2.7581723770708777e-05,
+ 1.282800621993374e-05
+ ],
+ "bp_grad_F": [
+ 0.15205088257789612,
+ 0.11483236402273178,
+ 0.06858030706644058,
+ 0.03275969997048378,
+ 0.015405165031552315
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8020000457763672,
+ "loss_eval": 0.6640118360519409,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.890129089355469,
+ 12.265545845031738,
+ 16.95741844177246,
+ 28.79555320739746
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010217817907687277,
+ 7.912378350738436e-05,
+ 4.763850665767677e-05,
+ 2.3046186470310204e-05,
+ 1.088724638975691e-05
+ ],
+ "bp_grad_F": [
+ 0.1597365438938141,
+ 0.12170909345149994,
+ 0.07251270860433578,
+ 0.034210700541734695,
+ 0.015816442668437958
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7950000166893005,
+ "loss_eval": 0.6770148277282715,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.874495506286621,
+ 12.249778747558594,
+ 17.042072296142578,
+ 29.30438995361328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.667076665209606e-05,
+ 7.482587534468621e-05,
+ 4.6152406866895035e-05,
+ 2.1790863684145734e-05,
+ 1.0080756510433275e-05
+ ],
+ "bp_grad_F": [
+ 0.16798135638237,
+ 0.1287383735179901,
+ 0.07646958529949188,
+ 0.03567665442824364,
+ 0.016245704144239426
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.7074151635169983,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.860309600830078,
+ 12.262276649475098,
+ 17.10471534729004,
+ 29.77037811279297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.177604468073696e-05,
+ 6.404842861229554e-05,
+ 3.929789818357676e-05,
+ 1.8207463654107414e-05,
+ 8.330911441589706e-06
+ ],
+ "bp_grad_F": [
+ 0.17336878180503845,
+ 0.13393178582191467,
+ 0.07944471389055252,
+ 0.03667045012116432,
+ 0.016434919089078903
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8005000352859497,
+ "loss_eval": 0.7185518741607666,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.851460456848145,
+ 12.24251651763916,
+ 17.171558380126953,
+ 30.212722778320312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.376902067335322e-05,
+ 5.6489287089789286e-05,
+ 3.395874227862805e-05,
+ 1.6138041246449575e-05,
+ 6.9637526394217275e-06
+ ],
+ "bp_grad_F": [
+ 0.17967616021633148,
+ 0.13954690098762512,
+ 0.08263248950242996,
+ 0.037825122475624084,
+ 0.016747957095503807
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.7408589124679565,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.842126846313477,
+ 12.243563652038574,
+ 17.238094329833984,
+ 30.57369613647461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.96977149345912e-05,
+ 5.455461359815672e-05,
+ 3.149309486616403e-05,
+ 1.4526599443343002e-05,
+ 6.351157480821712e-06
+ ],
+ "bp_grad_F": [
+ 0.1842736005783081,
+ 0.14376932382583618,
+ 0.08495213091373444,
+ 0.038578059524297714,
+ 0.01690361276268959
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.7459465265274048,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.834511756896973,
+ 12.231362342834473,
+ 17.27652931213379,
+ 30.958032608032227
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.340271647786722e-05,
+ 5.11680482304655e-05,
+ 3.0357710784301162e-05,
+ 1.3866035260434728e-05,
+ 5.900054475205252e-06
+ ],
+ "bp_grad_F": [
+ 0.1903817504644394,
+ 0.14911234378814697,
+ 0.08797255158424377,
+ 0.03965744748711586,
+ 0.01718064583837986
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.799500048160553,
+ "loss_eval": 0.7703561186790466,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.825489044189453,
+ 12.22317886352539,
+ 17.32727813720703,
+ 31.295225143432617
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 5.839894583914429e-05,
+ 4.5580356527352706e-05,
+ 2.747728103713598e-05,
+ 1.2357729247014504e-05,
+ 5.190840511204442e-06
+ ],
+ "bp_grad_F": [
+ 0.19528549909591675,
+ 0.15347032248973846,
+ 0.09032707661390305,
+ 0.04043765366077423,
+ 0.017367515712976456
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796500027179718,
+ "loss_eval": 0.7836824655532837,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.819538116455078,
+ 12.222261428833008,
+ 17.363719940185547,
+ 31.59310531616211
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 5.029122257838026e-05,
+ 3.970409306930378e-05,
+ 2.4377433874178678e-05,
+ 1.1113867913081776e-05,
+ 4.727653049485525e-06
+ ],
+ "bp_grad_F": [
+ 0.19932542741298676,
+ 0.15725064277648926,
+ 0.09246863424777985,
+ 0.0411805622279644,
+ 0.017557309940457344
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.797913134098053,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.811884880065918,
+ 12.215055465698242,
+ 17.399166107177734,
+ 31.893146514892578
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 4.582677502185106e-05,
+ 3.702253525261767e-05,
+ 2.1835987354279496e-05,
+ 9.762208719621412e-06,
+ 4.239610916556558e-06
+ ],
+ "bp_grad_F": [
+ 0.20321832597255707,
+ 0.16079877316951752,
+ 0.0944279357790947,
+ 0.04182669520378113,
+ 0.01770154759287834
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8015000224113464,
+ "loss_eval": 0.8103511929512024,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.8074951171875,
+ 12.208087921142578,
+ 17.4328670501709,
+ 32.0993537902832
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 4.3260886741336435e-05,
+ 3.466813359409571e-05,
+ 2.0653966203099117e-05,
+ 9.232544471160509e-06,
+ 3.864107839035569e-06
+ ],
+ "bp_grad_F": [
+ 0.20730803906917572,
+ 0.16447876393795013,
+ 0.09640119969844818,
+ 0.042481184005737305,
+ 0.017861463129520416
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8030000329017639,
+ "loss_eval": 0.8259979486465454,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.802508354187012,
+ 12.201593399047852,
+ 17.472795486450195,
+ 32.34526824951172
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 4.115825140615925e-05,
+ 3.3230924600502476e-05,
+ 1.9723833247553557e-05,
+ 8.868120858096518e-06,
+ 3.842445494228741e-06
+ ],
+ "bp_grad_F": [
+ 0.21079479157924652,
+ 0.16765208542346954,
+ 0.09817153960466385,
+ 0.04308956116437912,
+ 0.018017521128058434
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.835996687412262,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.79713249206543,
+ 12.19255542755127,
+ 17.48019790649414,
+ 32.53469467163086
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.9538805140182376e-05,
+ 3.1396168196806684e-05,
+ 1.915965367516037e-05,
+ 8.288401659228839e-06,
+ 3.5655145893542795e-06
+ ],
+ "bp_grad_F": [
+ 0.2140273153781891,
+ 0.1706041693687439,
+ 0.09975717961788177,
+ 0.043599311262369156,
+ 0.018129423260688782
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 0.8454185724258423,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.793066024780273,
+ 12.186600685119629,
+ 17.523115158081055,
+ 32.76158905029297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.902446405845694e-05,
+ 3.034434666915331e-05,
+ 1.7979460608330555e-05,
+ 8.018372682272457e-06,
+ 3.2052466849563643e-06
+ ],
+ "bp_grad_F": [
+ 0.217476025223732,
+ 0.17371903359889984,
+ 0.10147368907928467,
+ 0.04418298602104187,
+ 0.018276885151863098
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8025000095367432,
+ "loss_eval": 0.8576318621635437,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.788265228271484,
+ 12.18388557434082,
+ 17.53253173828125,
+ 32.96540832519531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.487027424853295e-05,
+ 2.7703388695954345e-05,
+ 1.6244883227045648e-05,
+ 6.949686849111458e-06,
+ 3.01652812595421e-06
+ ],
+ "bp_grad_F": [
+ 0.2205507904291153,
+ 0.17653042078018188,
+ 0.10301276296377182,
+ 0.04468648508191109,
+ 0.018391530960798264
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 0.8676812648773193,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.782870292663574,
+ 12.177481651306152,
+ 17.572200775146484,
+ 33.13017654418945
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.207056215615012e-05,
+ 2.538906664995011e-05,
+ 1.4797540643485263e-05,
+ 6.3980214690673165e-06,
+ 2.7153869268659037e-06
+ ],
+ "bp_grad_F": [
+ 0.22312353551387787,
+ 0.17893576622009277,
+ 0.10432329773902893,
+ 0.045110564678907394,
+ 0.018488196656107903
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8015000224113464,
+ "loss_eval": 0.8748663663864136,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.778507232666016,
+ 12.176526069641113,
+ 17.577714920043945,
+ 33.292396545410156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.117206506431103e-05,
+ 2.5556160835549235e-05,
+ 1.5269728464772925e-05,
+ 6.6313673414697405e-06,
+ 2.837193505911273e-06
+ ],
+ "bp_grad_F": [
+ 0.22575876116752625,
+ 0.18135619163513184,
+ 0.10563197731971741,
+ 0.045539867132902145,
+ 0.01859084889292717
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.8849357962608337,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.775252342224121,
+ 12.169761657714844,
+ 17.6116943359375,
+ 33.44955062866211
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0056495234020986e-05,
+ 2.4113667677738704e-05,
+ 1.408176376571646e-05,
+ 6.1218188420752995e-06,
+ 2.6174138838541694e-06
+ ],
+ "bp_grad_F": [
+ 0.2284391075372696,
+ 0.18377536535263062,
+ 0.1069609671831131,
+ 0.04599269852042198,
+ 0.018708044663071632
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8015000224113464,
+ "loss_eval": 0.8959856629371643,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.772398948669434,
+ 12.164031028747559,
+ 17.635194778442383,
+ 33.5887451171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.7790018066298217e-05,
+ 2.2673413695883937e-05,
+ 1.327950394625077e-05,
+ 5.801120551041095e-06,
+ 2.3991885882423958e-06
+ ],
+ "bp_grad_F": [
+ 0.23064540326595306,
+ 0.1858666092157364,
+ 0.10809148848056793,
+ 0.04634574428200722,
+ 0.018780354410409927
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8005000352859497,
+ "loss_eval": 0.9018086194992065,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.76898193359375,
+ 12.161084175109863,
+ 17.64798927307129,
+ 33.7384033203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.7914453312405385e-05,
+ 2.2498874386656098e-05,
+ 1.335815068159718e-05,
+ 5.8119312598137185e-06,
+ 2.478651822457323e-06
+ ],
+ "bp_grad_F": [
+ 0.2330632209777832,
+ 0.1880374252796173,
+ 0.10926036536693573,
+ 0.04673014581203461,
+ 0.01887366734445095
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.9126823544502258,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.765782356262207,
+ 12.157867431640625,
+ 17.654565811157227,
+ 33.87545394897461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.617536301841028e-05,
+ 2.155852780560963e-05,
+ 1.26063732750481e-05,
+ 5.598193638434168e-06,
+ 2.3114046143746236e-06
+ ],
+ "bp_grad_F": [
+ 0.23493894934654236,
+ 0.18982405960559845,
+ 0.11023002117872238,
+ 0.0470343716442585,
+ 0.018937399610877037
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8010000586509705,
+ "loss_eval": 0.918436586856842,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.76235294342041,
+ 12.158239364624023,
+ 17.692272186279297,
+ 33.97838592529297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.5225266654160805e-05,
+ 2.0318799215601757e-05,
+ 1.18104180728551e-05,
+ 5.113367024023319e-06,
+ 2.0679383396782214e-06
+ ],
+ "bp_grad_F": [
+ 0.23714447021484375,
+ 0.1918695867061615,
+ 0.11135337501764297,
+ 0.047415897250175476,
+ 0.019037041813135147
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.926592230796814,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.761220932006836,
+ 12.152015686035156,
+ 17.702022552490234,
+ 34.099910736083984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.4690283680683933e-05,
+ 2.0103743736399338e-05,
+ 1.1646708117041271e-05,
+ 5.211788447923027e-06,
+ 2.065433818643214e-06
+ ],
+ "bp_grad_F": [
+ 0.23883607983589172,
+ 0.1934758871793747,
+ 0.11221782118082047,
+ 0.04768490791320801,
+ 0.019090749323368073
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.799500048160553,
+ "loss_eval": 0.9292308688163757,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.758316993713379,
+ 12.149521827697754,
+ 17.706113815307617,
+ 34.19028091430664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.3211940060718916e-05,
+ 1.8614891814650036e-05,
+ 1.1040006938856095e-05,
+ 4.901159627479501e-06,
+ 2.003940153372241e-06
+ ],
+ "bp_grad_F": [
+ 0.24076926708221436,
+ 0.19526584446430206,
+ 0.1131957471370697,
+ 0.048007190227508545,
+ 0.019170215353369713
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 0.939300000667572,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.7562894821167,
+ 12.145485877990723,
+ 17.72273063659668,
+ 34.302001953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.3761875127092935e-05,
+ 1.9169772713212296e-05,
+ 1.1290117072348949e-05,
+ 4.916772468277486e-06,
+ 1.9402432371862233e-06
+ ],
+ "bp_grad_F": [
+ 0.2422482967376709,
+ 0.19667460024356842,
+ 0.11394675076007843,
+ 0.04823824390769005,
+ 0.019216476008296013
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.800000011920929,
+ "loss_eval": 0.9442830681800842,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.753690719604492,
+ 12.144105911254883,
+ 17.737106323242188,
+ 34.404640197753906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.1792104234918952e-05,
+ 1.8292348613613285e-05,
+ 1.0393917364126537e-05,
+ 4.534665094979573e-06,
+ 1.8929350744656404e-06
+ ],
+ "bp_grad_F": [
+ 0.2442140281200409,
+ 0.1984620988368988,
+ 0.11491919308900833,
+ 0.04856158792972565,
+ 0.019297350198030472
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.799500048160553,
+ "loss_eval": 0.9510068297386169,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.751104354858398,
+ 12.139998435974121,
+ 17.73967170715332,
+ 34.49326705932617
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.228700031992048e-05,
+ 1.800662539608311e-05,
+ 1.02799631349626e-05,
+ 4.365918812254677e-06,
+ 1.763435875545838e-06
+ ],
+ "bp_grad_F": [
+ 0.24558202922344208,
+ 0.19977517426013947,
+ 0.11561965942382812,
+ 0.04877489432692528,
+ 0.019342035055160522
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7980000376701355,
+ "loss_eval": 0.9541275501251221,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.748708724975586,
+ 12.140083312988281,
+ 17.75340461730957,
+ 34.58064651489258
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.0954081264790148e-05,
+ 1.69687900779536e-05,
+ 1.0029441000369843e-05,
+ 4.277889729564777e-06,
+ 1.7006685766318697e-06
+ ],
+ "bp_grad_F": [
+ 0.24700944125652313,
+ 0.20111818611621857,
+ 0.11635513603687286,
+ 0.04901802912354469,
+ 0.019400382414460182
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 0.9603452086448669,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.747987747192383,
+ 12.13515567779541,
+ 17.773204803466797,
+ 34.66823196411133
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.019237945205532e-05,
+ 1.6703623259672895e-05,
+ 9.940931704477407e-06,
+ 4.2076449062733445e-06,
+ 1.6902752122405218e-06
+ ],
+ "bp_grad_F": [
+ 0.2484009861946106,
+ 0.20242078602313995,
+ 0.11704456806182861,
+ 0.04923176020383835,
+ 0.019446346908807755
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7980000376701355,
+ "loss_eval": 0.9656705260276794,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.746366500854492,
+ 12.134767532348633,
+ 17.78083038330078,
+ 34.744384765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.9601726307882927e-05,
+ 1.625595541554503e-05,
+ 9.70309520198498e-06,
+ 4.2589249460434075e-06,
+ 1.6490113239342463e-06
+ ],
+ "bp_grad_F": [
+ 0.2497195154428482,
+ 0.20365330576896667,
+ 0.1177029013633728,
+ 0.0494362898170948,
+ 0.019490210339426994
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7985000610351562,
+ "loss_eval": 0.9694753885269165,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.745685577392578,
+ 12.132808685302734,
+ 17.785594940185547,
+ 34.818721771240234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.9891656847903505e-05,
+ 1.645386146265082e-05,
+ 9.532630429021083e-06,
+ 4.012633780803299e-06,
+ 1.5627846323695849e-06
+ ],
+ "bp_grad_F": [
+ 0.25097453594207764,
+ 0.2048366218805313,
+ 0.11835213750600815,
+ 0.04964917525649071,
+ 0.019541876390576363
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7970000505447388,
+ "loss_eval": 0.9751549363136292,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.744300842285156,
+ 12.130931854248047,
+ 17.797060012817383,
+ 34.88679885864258
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.86829984158976e-05,
+ 1.5538031220785342e-05,
+ 9.179881089949049e-06,
+ 3.900266619893955e-06,
+ 1.5405096291942755e-06
+ ],
+ "bp_grad_F": [
+ 0.2520725131034851,
+ 0.20589254796504974,
+ 0.11892128735780716,
+ 0.04982898011803627,
+ 0.0195804163813591
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7980000376701355,
+ "loss_eval": 0.9781593084335327,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.742894172668457,
+ 12.128829002380371,
+ 17.800174713134766,
+ 34.937950134277344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.839629840105772e-05,
+ 1.504779083916219e-05,
+ 8.953754331741948e-06,
+ 3.7526185678871116e-06,
+ 1.5395226000691764e-06
+ ],
+ "bp_grad_F": [
+ 0.25313958525657654,
+ 0.2068854719400406,
+ 0.11944505572319031,
+ 0.0499873124063015,
+ 0.019611038267612457
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 0.9819083213806152,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.741170883178711,
+ 12.12833309173584,
+ 17.80767822265625,
+ 35.008392333984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.8736680431175046e-05,
+ 1.5372819689218886e-05,
+ 9.080923518922646e-06,
+ 3.7873542169108987e-06,
+ 1.4909855963196605e-06
+ ],
+ "bp_grad_F": [
+ 0.2542133629322052,
+ 0.20790545642375946,
+ 0.11999284476041794,
+ 0.05016028508543968,
+ 0.019651155918836594
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.9845340847969055,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.739892959594727,
+ 12.124402046203613,
+ 17.814624786376953,
+ 35.0652961730957
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.820523539208807e-05,
+ 1.4827967788733076e-05,
+ 8.919139872887172e-06,
+ 3.8056493849580875e-06,
+ 1.4648703654529527e-06
+ ],
+ "bp_grad_F": [
+ 0.25528770685195923,
+ 0.2089182734489441,
+ 0.12054150551557541,
+ 0.05034028738737106,
+ 0.019695136696100235
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.9892162680625916,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.738609313964844,
+ 12.125777244567871,
+ 17.821733474731445,
+ 35.119747161865234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.807287299016025e-05,
+ 1.485222401242936e-05,
+ 8.809645805740729e-06,
+ 3.601295475164079e-06,
+ 1.3953541611044784e-06
+ ],
+ "bp_grad_F": [
+ 0.25628989934921265,
+ 0.2098524272441864,
+ 0.12104840576648712,
+ 0.05050570145249367,
+ 0.019734907895326614
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7970000505447388,
+ "loss_eval": 0.9929525852203369,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.738442420959473,
+ 12.123546600341797,
+ 17.828126907348633,
+ 35.1645393371582
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.7838316125562415e-05,
+ 1.4615891814173665e-05,
+ 8.594040991738439e-06,
+ 3.6455955978453858e-06,
+ 1.4180122889229096e-06
+ ],
+ "bp_grad_F": [
+ 0.25709325075149536,
+ 0.21062038838863373,
+ 0.12145251780748367,
+ 0.05062393099069595,
+ 0.019757961854338646
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.9955189228057861,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.736928939819336,
+ 12.120393753051758,
+ 17.832061767578125,
+ 35.21808624267578
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.690394310571719e-05,
+ 1.4294129869085737e-05,
+ 8.27510575618362e-06,
+ 3.6071653539693216e-06,
+ 1.3830640455125831e-06
+ ],
+ "bp_grad_F": [
+ 0.25789716839790344,
+ 0.21137811243534088,
+ 0.12185957282781601,
+ 0.050752829760313034,
+ 0.019786853343248367
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7975000143051147,
+ "loss_eval": 0.9983878135681152,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.7359619140625,
+ 12.122570991516113,
+ 17.835556030273438,
+ 35.264137268066406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.6666754163452424e-05,
+ 1.4025285963725764e-05,
+ 8.179616088455077e-06,
+ 3.4237471027154243e-06,
+ 1.3576167248174897e-06
+ ],
+ "bp_grad_F": [
+ 0.25863000750541687,
+ 0.21208500862121582,
+ 0.12223963439464569,
+ 0.050873447209596634,
+ 0.0198147501796484
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0010322332382202,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.73526668548584,
+ 12.120652198791504,
+ 17.842275619506836,
+ 35.31349182128906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.6808457075967453e-05,
+ 1.3759586181549821e-05,
+ 8.023761438380461e-06,
+ 3.3788217024266487e-06,
+ 1.3503363334166352e-06
+ ],
+ "bp_grad_F": [
+ 0.2594156563282013,
+ 0.2128157913684845,
+ 0.12262928485870361,
+ 0.050996698439121246,
+ 0.01984303817152977
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7990000247955322,
+ "loss_eval": 1.0038610696792603,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.735087394714355,
+ 12.11837387084961,
+ 17.846410751342773,
+ 35.347412109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.662989416217897e-05,
+ 1.3822269465890713e-05,
+ 7.92401988292113e-06,
+ 3.472342541499529e-06,
+ 1.327858285549155e-06
+ ],
+ "bp_grad_F": [
+ 0.26001590490341187,
+ 0.21339008212089539,
+ 0.12293757498264313,
+ 0.05109258368611336,
+ 0.01986365020275116
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796500027179718,
+ "loss_eval": 1.0062025785446167,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.734339714050293,
+ 12.117914199829102,
+ 17.84966468811035,
+ 35.381446838378906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.6489182598888874e-05,
+ 1.3682294593309052e-05,
+ 8.124485248117708e-06,
+ 3.407540134503506e-06,
+ 1.3195593737691524e-06
+ ],
+ "bp_grad_F": [
+ 0.2605873942375183,
+ 0.21394510567188263,
+ 0.1232379749417305,
+ 0.05118485540151596,
+ 0.019882848486304283
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0082966089248657,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.733570098876953,
+ 12.118681907653809,
+ 17.854442596435547,
+ 35.417537689208984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.6188618246815167e-05,
+ 1.3713249245483894e-05,
+ 7.876165909692645e-06,
+ 3.343990783832851e-06,
+ 1.2941204659000505e-06
+ ],
+ "bp_grad_F": [
+ 0.2612352669239044,
+ 0.21454451978206635,
+ 0.12355507910251617,
+ 0.05128618702292442,
+ 0.019906867295503616
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0103161334991455,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.73337459564209,
+ 12.116337776184082,
+ 17.85533332824707,
+ 35.44430160522461
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.6262945791822858e-05,
+ 1.3456610759021714e-05,
+ 7.976923370733857e-06,
+ 3.304621941424557e-06,
+ 1.2957953003933653e-06
+ ],
+ "bp_grad_F": [
+ 0.2618514895439148,
+ 0.21511761844158173,
+ 0.12386228144168854,
+ 0.05138511210680008,
+ 0.019930575042963028
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0126534700393677,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.732640266418457,
+ 12.11673641204834,
+ 17.85984992980957,
+ 35.47673797607422
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5915471522021107e-05,
+ 1.3434865650197025e-05,
+ 7.765964255668223e-06,
+ 3.272770300100092e-06,
+ 1.2807531675207429e-06
+ ],
+ "bp_grad_F": [
+ 0.26224803924560547,
+ 0.2155023217201233,
+ 0.124069944024086,
+ 0.051448848098516464,
+ 0.019943425431847572
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0140384435653687,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.732240676879883,
+ 12.115690231323242,
+ 17.86297035217285,
+ 35.500823974609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.557435462018475e-05,
+ 1.2797115232388023e-05,
+ 7.646640369785018e-06,
+ 3.2042576094681863e-06,
+ 1.2790382015737123e-06
+ ],
+ "bp_grad_F": [
+ 0.26270976662635803,
+ 0.2159367799758911,
+ 0.12429951131343842,
+ 0.051519569009542465,
+ 0.01995890960097313
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796500027179718,
+ "loss_eval": 1.0154695510864258,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.731745719909668,
+ 12.114669799804688,
+ 17.86736297607422,
+ 35.528076171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.58700677275192e-05,
+ 1.3018690879107453e-05,
+ 7.55094788473798e-06,
+ 3.2220066259469604e-06,
+ 1.2598871990121552e-06
+ ],
+ "bp_grad_F": [
+ 0.26308032870292664,
+ 0.2162918895483017,
+ 0.12448756396770477,
+ 0.051577214151620865,
+ 0.019970662891864777
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0169501304626465,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.731338500976562,
+ 12.113511085510254,
+ 17.86815643310547,
+ 35.54944610595703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5586350855301134e-05,
+ 1.2824431905755773e-05,
+ 7.649568942724727e-06,
+ 3.1966815186024178e-06,
+ 1.2639170563488733e-06
+ ],
+ "bp_grad_F": [
+ 0.26345473527908325,
+ 0.21664129197597504,
+ 0.12467629462480545,
+ 0.051637567579746246,
+ 0.01998509280383587
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796500027179718,
+ "loss_eval": 1.018563985824585,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.731039047241211,
+ 12.113682746887207,
+ 17.872100830078125,
+ 35.56554412841797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5501789675909095e-05,
+ 1.2836935638915747e-05,
+ 7.47852936910931e-06,
+ 3.1328777367889415e-06,
+ 1.2308250916248653e-06
+ ],
+ "bp_grad_F": [
+ 0.2637687623500824,
+ 0.2169436365365982,
+ 0.124836765229702,
+ 0.0516866035759449,
+ 0.019995568320155144
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0192590951919556,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.730656623840332,
+ 12.114008903503418,
+ 17.87257194519043,
+ 35.58961486816406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5237865227391012e-05,
+ 1.2954994417668786e-05,
+ 7.515009656344773e-06,
+ 3.2117325190483825e-06,
+ 1.2425814475136576e-06
+ ],
+ "bp_grad_F": [
+ 0.2640174925327301,
+ 0.21717986464500427,
+ 0.1249629333615303,
+ 0.051725782454013824,
+ 0.020004095509648323
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0201796293258667,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.730304718017578,
+ 12.112882614135742,
+ 17.87510108947754,
+ 35.60005569458008
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5281846572179347e-05,
+ 1.280397191294469e-05,
+ 7.457324500137474e-06,
+ 3.1238730571203632e-06,
+ 1.2271989362488966e-06
+ ],
+ "bp_grad_F": [
+ 0.26432526111602783,
+ 0.2174660563468933,
+ 0.12511758506298065,
+ 0.05177601799368858,
+ 0.02001647651195526
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0214923620224,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.730023384094238,
+ 12.112593650817871,
+ 17.87718963623047,
+ 35.61077880859375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5160739167185966e-05,
+ 1.2885939213447273e-05,
+ 7.442678906954825e-06,
+ 3.1402662443724694e-06,
+ 1.2329509218034218e-06
+ ],
+ "bp_grad_F": [
+ 0.2645094394683838,
+ 0.21764276921749115,
+ 0.12521088123321533,
+ 0.051804810762405396,
+ 0.020022746175527573
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0221376419067383,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.729791641235352,
+ 12.11282730102539,
+ 17.878896713256836,
+ 35.62131118774414
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4924515198799782e-05,
+ 1.2676942787948065e-05,
+ 7.327739240281517e-06,
+ 3.135102815576829e-06,
+ 1.2368633406367735e-06
+ ],
+ "bp_grad_F": [
+ 0.26469096541404724,
+ 0.2178148329257965,
+ 0.12530171871185303,
+ 0.051832377910614014,
+ 0.02002853713929653
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0227359533309937,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.72957706451416,
+ 12.112420082092285,
+ 17.879562377929688,
+ 35.631195068359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.5078092474141158e-05,
+ 1.2648180018004496e-05,
+ 7.402486517094076e-06,
+ 3.110948682660819e-06,
+ 1.2303731864449219e-06
+ ],
+ "bp_grad_F": [
+ 0.26483553647994995,
+ 0.2179516702890396,
+ 0.12537437677383423,
+ 0.051855091005563736,
+ 0.020033741369843483
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0231714248657227,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.72945499420166,
+ 12.112156867980957,
+ 17.8814754486084,
+ 35.639610290527344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4999122868175618e-05,
+ 1.2563705240609124e-05,
+ 7.3636233537399676e-06,
+ 3.091453436354641e-06,
+ 1.2325838270044187e-06
+ ],
+ "bp_grad_F": [
+ 0.2649652361869812,
+ 0.21807390451431274,
+ 0.12544025480747223,
+ 0.05187588557600975,
+ 0.020038409158587456
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0237369537353516,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.729272842407227,
+ 12.112222671508789,
+ 17.881935119628906,
+ 35.644290924072266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4974531950429082e-05,
+ 1.2648583833652083e-05,
+ 7.3520282057870645e-06,
+ 3.080302576563554e-06,
+ 1.2291716302570421e-06
+ ],
+ "bp_grad_F": [
+ 0.2650584876537323,
+ 0.21816210448741913,
+ 0.12548699975013733,
+ 0.051890380680561066,
+ 0.020041609182953835
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0240200757980347,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.72924518585205,
+ 12.112285614013672,
+ 17.88214683532715,
+ 35.64848709106445
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4959082363930065e-05,
+ 1.2588670870172791e-05,
+ 7.344425739574945e-06,
+ 3.080124088228331e-06,
+ 1.2237677537996206e-06
+ ],
+ "bp_grad_F": [
+ 0.26513636112213135,
+ 0.21823462843894958,
+ 0.12552553415298462,
+ 0.051902592182159424,
+ 0.020044438540935516
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0243031978607178,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.72916030883789,
+ 12.112074851989746,
+ 17.882980346679688,
+ 35.650428771972656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4942641428206116e-05,
+ 1.2567295925691724e-05,
+ 7.336187991313636e-06,
+ 3.0725423130206764e-06,
+ 1.2260832136234967e-06
+ ],
+ "bp_grad_F": [
+ 0.26517778635025024,
+ 0.21827547252178192,
+ 0.12554767727851868,
+ 0.0519094243645668,
+ 0.02004585973918438
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0244944095611572,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.729132652282715,
+ 12.112125396728516,
+ 17.883481979370117,
+ 35.65312576293945
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4903710507496726e-05,
+ 1.2576123481267132e-05,
+ 7.317236850212794e-06,
+ 3.078314875892829e-06,
+ 1.2210558679726091e-06
+ ],
+ "bp_grad_F": [
+ 0.26521575450897217,
+ 0.2183104306459427,
+ 0.1255662441253662,
+ 0.051915280520915985,
+ 0.02004723809659481
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0246349573135376,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.729104995727539,
+ 12.11208724975586,
+ 17.88361167907715,
+ 35.65410614013672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4916706277290359e-05,
+ 1.2563130439957604e-05,
+ 7.323697445826838e-06,
+ 3.0812991553830216e-06,
+ 1.2211262401251588e-06
+ ],
+ "bp_grad_F": [
+ 0.26523175835609436,
+ 0.2183263599872589,
+ 0.12557478249073029,
+ 0.05191792547702789,
+ 0.02004779316484928
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0246796607971191,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.729097366333008,
+ 12.112085342407227,
+ 17.88372230529785,
+ 35.65440368652344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4912001461198088e-05,
+ 1.2556130059238058e-05,
+ 7.32138505554758e-06,
+ 3.077205747104017e-06,
+ 1.2217307130413246e-06
+ ],
+ "bp_grad_F": [
+ 0.2652417719364166,
+ 0.21833550930023193,
+ 0.1255796104669571,
+ 0.05191945284605026,
+ 0.02004816010594368
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.0247222185134888,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 10.729093551635742,
+ 12.112082481384277,
+ 17.88372230529785,
+ 35.65460205078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 1.4914756320649758e-05,
+ 1.2556190995383076e-05,
+ 7.322747933358187e-06,
+ 3.0772835089010186e-06,
+ 1.2216489722050028e-06
+ ],
+ "bp_grad_F": [
+ 0.2652438282966614,
+ 0.21833744645118713,
+ 0.12558062374591827,
+ 0.051919758319854736,
+ 0.020048221573233604
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796000063419342,
+ "loss_eval": 1.024727463722229,
+ "epoch": 80
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.290447235107422,
+ 11.313605308532715,
+ 11.351215362548828,
+ 11.398087501525879
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028353024390526116,
+ 0.0002828188880812377,
+ 0.00028162598027847707,
+ 0.0002799496578518301,
+ 0.0002791006409097463
+ ],
+ "bp_grad_F": [
+ 0.012684082612395287,
+ 0.01264861598610878,
+ 0.012589854188263416,
+ 0.012511610053479671,
+ 0.012471316382288933
+ ],
+ "gamma_dfa": -0.0034942624624818563,
+ "gamma_dfa_per_layer": [
+ -0.029981477186083794,
+ 0.023911481723189354,
+ 0.0022033676505088806,
+ -0.010110422037541866
+ ],
+ "acc_eval": 0.08450000733137131,
+ "loss_eval": 2.4790313243865967,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.505881309509277,
+ 11.757291793823242,
+ 12.0764741897583,
+ 12.435522079467773
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00031470530666410923,
+ 0.0002926285960711539,
+ 0.00027369827148504555,
+ 0.0002595284313429147,
+ 0.0002512428327463567
+ ],
+ "bp_grad_F": [
+ 0.014148155227303505,
+ 0.013173527084290981,
+ 0.01228535920381546,
+ 0.0115915322676301,
+ 0.01116928644478321
+ ],
+ "gamma_dfa": 0.11511426232755184,
+ "gamma_dfa_per_layer": [
+ 0.12020161747932434,
+ 0.12450753152370453,
+ 0.12499555945396423,
+ 0.09075234085321426
+ ],
+ "acc_eval": 0.3775000274181366,
+ "loss_eval": 1.8237801790237427,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.90947437286377,
+ 13.027632713317871,
+ 14.888558387756348,
+ 17.22944450378418
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006904517649672925,
+ 0.000503765360917896,
+ 0.0003708408330567181,
+ 0.00028136910987086594,
+ 0.00023244605108629912
+ ],
+ "bp_grad_F": [
+ 0.03382011875510216,
+ 0.024346396327018738,
+ 0.017825284972786903,
+ 0.013448701240122318,
+ 0.011137359775602818
+ ],
+ "gamma_dfa": 0.219235859811306,
+ "gamma_dfa_per_layer": [
+ 0.2247210592031479,
+ 0.20836304128170013,
+ 0.23224417865276337,
+ 0.2116151601076126
+ ],
+ "acc_eval": 0.6325000524520874,
+ "loss_eval": 1.0442804098129272,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.249103546142578,
+ 14.663236618041992,
+ 19.286497116088867,
+ 24.994598388671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000785678334068507,
+ 0.0004984966944903135,
+ 0.00031956040766090155,
+ 0.00021816199296154082,
+ 0.00017694469715934247
+ ],
+ "bp_grad_F": [
+ 0.049792274832725525,
+ 0.03142387419939041,
+ 0.020070550963282585,
+ 0.01388809084892273,
+ 0.011133435182273388
+ ],
+ "gamma_dfa": 0.20651238784193993,
+ "gamma_dfa_per_layer": [
+ 0.19393788278102875,
+ 0.1939619481563568,
+ 0.23087021708488464,
+ 0.2072795033454895
+ ],
+ "acc_eval": 0.690500020980835,
+ "loss_eval": 0.8105630278587341,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.623353004455566,
+ 17.037206649780273,
+ 26.137210845947266,
+ 36.338985443115234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007407923694700003,
+ 0.0004117340431548655,
+ 0.00024256351753138006,
+ 0.00016813547699712217,
+ 0.00014022440882399678
+ ],
+ "bp_grad_F": [
+ 0.06029670313000679,
+ 0.0337882824242115,
+ 0.0196156557649374,
+ 0.01336250826716423,
+ 0.011071481741964817
+ ],
+ "gamma_dfa": 0.18698954582214355,
+ "gamma_dfa_per_layer": [
+ 0.15680347383022308,
+ 0.17669467628002167,
+ 0.2232135385274887,
+ 0.19124649465084076
+ ],
+ "acc_eval": 0.7130000591278076,
+ "loss_eval": 0.7352707386016846,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.056242942810059,
+ 20.31708526611328,
+ 35.354278564453125,
+ 50.72277069091797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007306670304387808,
+ 0.000362707331078127,
+ 0.00019432755652815104,
+ 0.00014284192002378404,
+ 0.0001259525743080303
+ ],
+ "bp_grad_F": [
+ 0.06756022572517395,
+ 0.03394190967082977,
+ 0.018268020823597908,
+ 0.012735997326672077,
+ 0.011040973477065563
+ ],
+ "gamma_dfa": 0.16737862676382065,
+ "gamma_dfa_per_layer": [
+ 0.12552234530448914,
+ 0.16295458376407623,
+ 0.2097114473581314,
+ 0.17132613062858582
+ ],
+ "acc_eval": 0.7350000143051147,
+ "loss_eval": 0.716023862361908,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.544439315795898,
+ 24.727155685424805,
+ 46.518768310546875,
+ 67.0296859741211
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007029862026683986,
+ 0.0003191934374626726,
+ 0.00016633918858133256,
+ 0.00012432104267645627,
+ 0.00011442468530731276
+ ],
+ "bp_grad_F": [
+ 0.07251796871423721,
+ 0.03311065956950188,
+ 0.016890449449419975,
+ 0.012321571819484234,
+ 0.011077084578573704
+ ],
+ "gamma_dfa": 0.15210051462054253,
+ "gamma_dfa_per_layer": [
+ 0.10109913349151611,
+ 0.15017138421535492,
+ 0.20331066846847534,
+ 0.15382087230682373
+ ],
+ "acc_eval": 0.7305000424385071,
+ "loss_eval": 0.7123240828514099,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.096785545349121,
+ 29.970369338989258,
+ 58.48172378540039,
+ 84.44245910644531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007362618925981224,
+ 0.0003065088822040707,
+ 0.00015729048755019903,
+ 0.00012451721704564989,
+ 0.00011588833149289712
+ ],
+ "bp_grad_F": [
+ 0.07530932128429413,
+ 0.03182085230946541,
+ 0.01569041982293129,
+ 0.012093811295926571,
+ 0.011190102435648441
+ ],
+ "gamma_dfa": 0.14102506078779697,
+ "gamma_dfa_per_layer": [
+ 0.08732745796442032,
+ 0.14003422856330872,
+ 0.19598272442817688,
+ 0.14075583219528198
+ ],
+ "acc_eval": 0.7235000133514404,
+ "loss_eval": 0.727388858795166,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.721030235290527,
+ 35.83012008666992,
+ 70.75320434570312,
+ 101.73139953613281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007345590856857598,
+ 0.00026920062373392284,
+ 0.000134471949422732,
+ 0.00011552426440175623,
+ 0.000110697525087744
+ ],
+ "bp_grad_F": [
+ 0.0819108858704567,
+ 0.03190097585320473,
+ 0.015249059535562992,
+ 0.012194199487566948,
+ 0.011436647735536098
+ ],
+ "gamma_dfa": 0.1306514535099268,
+ "gamma_dfa_per_layer": [
+ 0.07609214633703232,
+ 0.13159415125846863,
+ 0.18644346296787262,
+ 0.12847605347633362
+ ],
+ "acc_eval": 0.7155000567436218,
+ "loss_eval": 0.7610863447189331,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.34220027923584,
+ 42.35697937011719,
+ 83.51715850830078,
+ 120.42235565185547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006878858548589051,
+ 0.0002570476208347827,
+ 0.00012823278666473925,
+ 0.00011104762234026566,
+ 0.00010812593973241746
+ ],
+ "bp_grad_F": [
+ 0.08083735406398773,
+ 0.029663894325494766,
+ 0.014093351550400257,
+ 0.01174441073089838,
+ 0.011170739307999611
+ ],
+ "gamma_dfa": 0.12087789550423622,
+ "gamma_dfa_per_layer": [
+ 0.06335650384426117,
+ 0.12819789350032806,
+ 0.17300739884376526,
+ 0.1189497858285904
+ ],
+ "acc_eval": 0.7225000262260437,
+ "loss_eval": 0.737341046333313,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 16.00116729736328,
+ 49.21657943725586,
+ 96.05623626708984,
+ 138.10394287109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007566744461655617,
+ 0.0002493424981366843,
+ 0.0001229145418619737,
+ 0.00010773885151138529,
+ 0.00010482135257916525
+ ],
+ "bp_grad_F": [
+ 0.08636438101530075,
+ 0.029551593586802483,
+ 0.013877596706151962,
+ 0.011869709938764572,
+ 0.011369508691132069
+ ],
+ "gamma_dfa": 0.11321612633764744,
+ "gamma_dfa_per_layer": [
+ 0.05804715305566788,
+ 0.11809944361448288,
+ 0.16106289625167847,
+ 0.11565501242876053
+ ],
+ "acc_eval": 0.7175000309944153,
+ "loss_eval": 0.7598624229431152,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 16.664016723632812,
+ 56.4381103515625,
+ 109.18519592285156,
+ 157.13400268554688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007165206479839981,
+ 0.00021803597337566316,
+ 0.00010753094829851761,
+ 0.00010056991595774889,
+ 9.790556214284152e-05
+ ],
+ "bp_grad_F": [
+ 0.09135312587022781,
+ 0.029706060886383057,
+ 0.013932082802057266,
+ 0.012196206487715244,
+ 0.011740063317120075
+ ],
+ "gamma_dfa": 0.1071977848187089,
+ "gamma_dfa_per_layer": [
+ 0.04954911395907402,
+ 0.1143685057759285,
+ 0.1548140048980713,
+ 0.11005951464176178
+ ],
+ "acc_eval": 0.7000000476837158,
+ "loss_eval": 0.825758159160614,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 17.334924697875977,
+ 63.52719497680664,
+ 121.75878143310547,
+ 175.05706787109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007098973728716373,
+ 0.0002017641963902861,
+ 0.00010367313370807096,
+ 9.554869029670954e-05,
+ 9.339704411104321e-05
+ ],
+ "bp_grad_F": [
+ 0.0928206816315651,
+ 0.02807745151221752,
+ 0.013300982303917408,
+ 0.011954967863857746,
+ 0.011584528721868992
+ ],
+ "gamma_dfa": 0.10307322815060616,
+ "gamma_dfa_per_layer": [
+ 0.046224936842918396,
+ 0.11165355145931244,
+ 0.14536075294017792,
+ 0.10905367136001587
+ ],
+ "acc_eval": 0.7085000276565552,
+ "loss_eval": 0.8147838711738586,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 18.066408157348633,
+ 71.18386840820312,
+ 135.29449462890625,
+ 194.25502014160156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000749382539652288,
+ 0.00023277483705896884,
+ 0.00012272220919840038,
+ 0.00011419993097661063,
+ 0.00011211293895030394
+ ],
+ "bp_grad_F": [
+ 0.08808046579360962,
+ 0.026459064334630966,
+ 0.01287052407860756,
+ 0.011758155189454556,
+ 0.01143786869943142
+ ],
+ "gamma_dfa": 0.09524188842624426,
+ "gamma_dfa_per_layer": [
+ 0.042861852794885635,
+ 0.09963438659906387,
+ 0.1363406628370285,
+ 0.10213065147399902
+ ],
+ "acc_eval": 0.7090000510215759,
+ "loss_eval": 0.7797307372093201,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 18.722259521484375,
+ 78.48313903808594,
+ 148.08277893066406,
+ 213.12060546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007828621892258525,
+ 0.00022329931380227208,
+ 0.0001217587196151726,
+ 0.00011403425014577806,
+ 0.00011114090739283711
+ ],
+ "bp_grad_F": [
+ 0.09129610657691956,
+ 0.02616111747920513,
+ 0.012879838235676289,
+ 0.011936144903302193,
+ 0.011643719859421253
+ ],
+ "gamma_dfa": 0.0928388200700283,
+ "gamma_dfa_per_layer": [
+ 0.04325374215841293,
+ 0.09723485261201859,
+ 0.13119162619113922,
+ 0.09967505931854248
+ ],
+ "acc_eval": 0.7015000581741333,
+ "loss_eval": 0.810487687587738,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 19.439603805541992,
+ 86.18466186523438,
+ 160.40892028808594,
+ 230.23739624023438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007217489182949066,
+ 0.00018824212020263076,
+ 0.00010298609413439408,
+ 9.960142779164016e-05,
+ 9.748922457220033e-05
+ ],
+ "bp_grad_F": [
+ 0.09306738525629044,
+ 0.02548908442258835,
+ 0.012566950172185898,
+ 0.011724555864930153,
+ 0.011449399404227734
+ ],
+ "gamma_dfa": 0.09134612884372473,
+ "gamma_dfa_per_layer": [
+ 0.040905896574258804,
+ 0.09668857604265213,
+ 0.12694117426872253,
+ 0.10084886848926544
+ ],
+ "acc_eval": 0.7110000252723694,
+ "loss_eval": 0.7941330075263977,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 20.229736328125,
+ 94.05648040771484,
+ 173.3369903564453,
+ 248.50965881347656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007364301127381623,
+ 0.00019103182421531528,
+ 0.00010473190195625648,
+ 0.00010049886623164639,
+ 9.873881208477542e-05
+ ],
+ "bp_grad_F": [
+ 0.09542964398860931,
+ 0.025049429386854172,
+ 0.012468041852116585,
+ 0.011731654405593872,
+ 0.011484012007713318
+ ],
+ "gamma_dfa": 0.08733212016522884,
+ "gamma_dfa_per_layer": [
+ 0.034523673355579376,
+ 0.09200998395681381,
+ 0.12135256081819534,
+ 0.10144226253032684
+ ],
+ "acc_eval": 0.7200000286102295,
+ "loss_eval": 0.806917130947113,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 20.94115447998047,
+ 101.5516128540039,
+ 185.91993713378906,
+ 265.6839294433594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008022052352316678,
+ 0.00020157739345449954,
+ 0.00011702251504175365,
+ 0.00011363227531546727,
+ 0.00011240412277402356
+ ],
+ "bp_grad_F": [
+ 0.09439960867166519,
+ 0.024019507691264153,
+ 0.01232285425066948,
+ 0.011713731102645397,
+ 0.011482013389468193
+ ],
+ "gamma_dfa": 0.08548407163470984,
+ "gamma_dfa_per_layer": [
+ 0.038230378180742264,
+ 0.08889900892972946,
+ 0.11632363498210907,
+ 0.09848326444625854
+ ],
+ "acc_eval": 0.7120000123977661,
+ "loss_eval": 0.8131889700889587,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 21.71381950378418,
+ 109.32372283935547,
+ 199.24642944335938,
+ 285.1650085449219
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00076432921923697,
+ 0.00018322077812626958,
+ 0.00010481786011951044,
+ 0.00010164766717934981,
+ 0.00010087565897265449
+ ],
+ "bp_grad_F": [
+ 0.09489408135414124,
+ 0.023419344797730446,
+ 0.01224115677177906,
+ 0.011706860736012459,
+ 0.011501944623887539
+ ],
+ "gamma_dfa": 0.08550543524324894,
+ "gamma_dfa_per_layer": [
+ 0.04093854874372482,
+ 0.09244771301746368,
+ 0.11161119490861893,
+ 0.09702428430318832
+ ],
+ "acc_eval": 0.7150000333786011,
+ "loss_eval": 0.8401313424110413,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 22.474592208862305,
+ 117.0955810546875,
+ 212.0178680419922,
+ 303.7491455078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008428111323155463,
+ 0.00020001262600999326,
+ 0.00012667309783864766,
+ 0.00012337132648099214,
+ 0.00012319188681431115
+ ],
+ "bp_grad_F": [
+ 0.09607862681150436,
+ 0.023683469742536545,
+ 0.01269453763961792,
+ 0.012188468128442764,
+ 0.011980941519141197
+ ],
+ "gamma_dfa": 0.07937186863273382,
+ "gamma_dfa_per_layer": [
+ 0.036147553473711014,
+ 0.08243555575609207,
+ 0.1066455990076065,
+ 0.0922587662935257
+ ],
+ "acc_eval": 0.6840000152587891,
+ "loss_eval": 0.881807267665863,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 23.23648452758789,
+ 124.45619201660156,
+ 224.60977172851562,
+ 321.2709655761719
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007923559751361609,
+ 0.00018490788352210075,
+ 0.00011116286623291671,
+ 0.00010867219680221751,
+ 0.00010773272515507415
+ ],
+ "bp_grad_F": [
+ 0.09617631882429123,
+ 0.02261228673160076,
+ 0.012236458249390125,
+ 0.011800081469118595,
+ 0.011619490571320057
+ ],
+ "gamma_dfa": 0.07946366257965565,
+ "gamma_dfa_per_layer": [
+ 0.036630548536777496,
+ 0.08521611988544464,
+ 0.10408685356378555,
+ 0.0919211283326149
+ ],
+ "acc_eval": 0.7070000171661377,
+ "loss_eval": 0.8307667374610901,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 23.941816329956055,
+ 131.71353149414062,
+ 236.79910278320312,
+ 338.2337951660156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007988678989931941,
+ 0.00017439998919144273,
+ 0.0001077677879948169,
+ 0.00010501289216335863,
+ 0.00010426317021483555
+ ],
+ "bp_grad_F": [
+ 0.09615935385227203,
+ 0.02214771881699562,
+ 0.012244326062500477,
+ 0.01184793096035719,
+ 0.011676526628434658
+ ],
+ "gamma_dfa": 0.0779404304921627,
+ "gamma_dfa_per_layer": [
+ 0.032858967781066895,
+ 0.0826181098818779,
+ 0.10167358815670013,
+ 0.09461105614900589
+ ],
+ "acc_eval": 0.6955000162124634,
+ "loss_eval": 0.8431603312492371,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 24.736867904663086,
+ 139.1349639892578,
+ 248.7137908935547,
+ 355.0362243652344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008002957911230624,
+ 0.00016955590399447829,
+ 0.00010642779670888558,
+ 0.00010389652743469924,
+ 0.00010333865793654695
+ ],
+ "bp_grad_F": [
+ 0.10074009746313095,
+ 0.022332124412059784,
+ 0.012284242548048496,
+ 0.011890492402017117,
+ 0.011716442182660103
+ ],
+ "gamma_dfa": 0.07599243335425854,
+ "gamma_dfa_per_layer": [
+ 0.03026191145181656,
+ 0.07909790426492691,
+ 0.10020720213651657,
+ 0.09440271556377411
+ ],
+ "acc_eval": 0.6995000243186951,
+ "loss_eval": 0.8646643161773682,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 25.527332305908203,
+ 146.32603454589844,
+ 260.3341064453125,
+ 371.9651184082031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008058008388616145,
+ 0.00016914791194722056,
+ 0.00010861256305361167,
+ 0.00010723753075581044,
+ 0.00010632628982421011
+ ],
+ "bp_grad_F": [
+ 0.10164787620306015,
+ 0.02202906273305416,
+ 0.01239779032766819,
+ 0.012042474001646042,
+ 0.011877987533807755
+ ],
+ "gamma_dfa": 0.07324381358921528,
+ "gamma_dfa_per_layer": [
+ 0.03170452266931534,
+ 0.07619009912014008,
+ 0.09431108087301254,
+ 0.09076955169439316
+ ],
+ "acc_eval": 0.6910000443458557,
+ "loss_eval": 0.9011825919151306,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 26.24439239501953,
+ 153.2904510498047,
+ 271.96038818359375,
+ 388.2030029296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007652259082533419,
+ 0.00016368107753805816,
+ 0.00010516044130781665,
+ 0.0001030244748108089,
+ 0.00010207654122496024
+ ],
+ "bp_grad_F": [
+ 0.09788329899311066,
+ 0.021043717861175537,
+ 0.012156899087131023,
+ 0.011852008290588856,
+ 0.011708464473485947
+ ],
+ "gamma_dfa": 0.07162218820303679,
+ "gamma_dfa_per_layer": [
+ 0.032286133617162704,
+ 0.0729740634560585,
+ 0.09137451648712158,
+ 0.08985403925180435
+ ],
+ "acc_eval": 0.7015000581741333,
+ "loss_eval": 0.8572027683258057,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 26.939895629882812,
+ 160.01840209960938,
+ 282.9203796386719,
+ 404.1251220703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007471513818018138,
+ 0.00015666495892219245,
+ 0.0001027472535497509,
+ 0.00010242985445074737,
+ 0.00010123744141310453
+ ],
+ "bp_grad_F": [
+ 0.09715361893177032,
+ 0.02044457010924816,
+ 0.011886605061590672,
+ 0.011604394763708115,
+ 0.01146735716611147
+ ],
+ "gamma_dfa": 0.07091694697737694,
+ "gamma_dfa_per_layer": [
+ 0.0328441858291626,
+ 0.07304085046052933,
+ 0.08939228951931,
+ 0.08839046210050583
+ ],
+ "acc_eval": 0.7035000324249268,
+ "loss_eval": 0.8259502649307251,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 27.655963897705078,
+ 166.2253875732422,
+ 293.953857421875,
+ 419.2309265136719
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008196054841391742,
+ 0.000168012484209612,
+ 0.00011266919318586588,
+ 0.0001119820517487824,
+ 0.00011136133980471641
+ ],
+ "bp_grad_F": [
+ 0.09666500240564346,
+ 0.020363574847579002,
+ 0.012169744819402695,
+ 0.011900369077920914,
+ 0.011767606250941753
+ ],
+ "gamma_dfa": 0.07011445891112089,
+ "gamma_dfa_per_layer": [
+ 0.03361910209059715,
+ 0.07148489356040955,
+ 0.08753866702318192,
+ 0.08781517297029495
+ ],
+ "acc_eval": 0.6930000185966492,
+ "loss_eval": 0.8744071125984192,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 28.399173736572266,
+ 173.29478454589844,
+ 305.1183776855469,
+ 435.8616027832031
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008379096980206668,
+ 0.00016787118511274457,
+ 0.00011563840962480754,
+ 0.00011382131197024137,
+ 0.00011414202890591696
+ ],
+ "bp_grad_F": [
+ 0.09941841661930084,
+ 0.01996329240500927,
+ 0.012196086347103119,
+ 0.011958655901253223,
+ 0.011834335513412952
+ ],
+ "gamma_dfa": 0.06707034399732947,
+ "gamma_dfa_per_layer": [
+ 0.027506088837981224,
+ 0.07163777202367783,
+ 0.08489245176315308,
+ 0.08424506336450577
+ ],
+ "acc_eval": 0.6860000491142273,
+ "loss_eval": 0.8969190716743469,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 29.067270278930664,
+ 179.52621459960938,
+ 315.666015625,
+ 450.67449951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007646313752047718,
+ 0.00014840309449937195,
+ 9.849335037870333e-05,
+ 9.682594100013375e-05,
+ 9.619411139283329e-05
+ ],
+ "bp_grad_F": [
+ 0.10344142466783524,
+ 0.020078541710972786,
+ 0.012122261337935925,
+ 0.011881489306688309,
+ 0.011760085821151733
+ ],
+ "gamma_dfa": 0.06692653149366379,
+ "gamma_dfa_per_layer": [
+ 0.027295783162117004,
+ 0.06953233480453491,
+ 0.08493673801422119,
+ 0.08594126999378204
+ ],
+ "acc_eval": 0.6980000138282776,
+ "loss_eval": 0.9112558960914612,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 29.80398941040039,
+ 186.03025817871094,
+ 326.7105407714844,
+ 466.4792785644531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008647075155749917,
+ 0.00016527411935385317,
+ 0.00011362476652720943,
+ 0.00011306258238619193,
+ 0.00011151444778079167
+ ],
+ "bp_grad_F": [
+ 0.0982326790690422,
+ 0.0193523820489645,
+ 0.012001772411167622,
+ 0.011787012219429016,
+ 0.011672897264361382
+ ],
+ "gamma_dfa": 0.06665132055059075,
+ "gamma_dfa_per_layer": [
+ 0.028357060626149178,
+ 0.06870155036449432,
+ 0.0840969979763031,
+ 0.08544967323541641
+ ],
+ "acc_eval": 0.6960000395774841,
+ "loss_eval": 0.8792264461517334,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 30.495162963867188,
+ 192.21092224121094,
+ 336.62432861328125,
+ 480.96929931640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007892370922490954,
+ 0.00014862553507555276,
+ 0.00010144516272703186,
+ 0.00010014566942118108,
+ 9.811606287257746e-05
+ ],
+ "bp_grad_F": [
+ 0.10485321283340454,
+ 0.01980445720255375,
+ 0.012311456725001335,
+ 0.01209663413465023,
+ 0.011984387412667274
+ ],
+ "gamma_dfa": 0.0650303359143436,
+ "gamma_dfa_per_layer": [
+ 0.02565421722829342,
+ 0.06553934514522552,
+ 0.08334222435951233,
+ 0.08558555692434311
+ ],
+ "acc_eval": 0.6845000386238098,
+ "loss_eval": 0.9355857968330383,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 31.204212188720703,
+ 198.0793914794922,
+ 346.7908020019531,
+ 494.94366455078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008273097337223589,
+ 0.00016349409997928888,
+ 0.00011394457396818325,
+ 0.00011259203165536746,
+ 0.00011180129513377324
+ ],
+ "bp_grad_F": [
+ 0.10106314718723297,
+ 0.019085418432950974,
+ 0.01192714087665081,
+ 0.011723030358552933,
+ 0.011616164818406105
+ ],
+ "gamma_dfa": 0.06359042041003704,
+ "gamma_dfa_per_layer": [
+ 0.025547169148921967,
+ 0.06356105208396912,
+ 0.08179818838834763,
+ 0.08345527201890945
+ ],
+ "acc_eval": 0.7055000066757202,
+ "loss_eval": 0.8810407519340515,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 31.86461067199707,
+ 203.8866424560547,
+ 357.24273681640625,
+ 509.47283935546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007937258342280984,
+ 0.0001423554786015302,
+ 0.0001006650782073848,
+ 9.906977356877178e-05,
+ 9.873251110548154e-05
+ ],
+ "bp_grad_F": [
+ 0.10255990922451019,
+ 0.018815871328115463,
+ 0.012050059624016285,
+ 0.011867615394294262,
+ 0.011764303781092167
+ ],
+ "gamma_dfa": 0.06225612107664347,
+ "gamma_dfa_per_layer": [
+ 0.026912778615951538,
+ 0.060097675770521164,
+ 0.07986276596784592,
+ 0.08215126395225525
+ ],
+ "acc_eval": 0.6975000500679016,
+ "loss_eval": 0.8993597626686096,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 32.55842590332031,
+ 209.36538696289062,
+ 366.7745056152344,
+ 523.1634521484375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009271818562410772,
+ 0.00017398923228029162,
+ 0.00012348532618489116,
+ 0.00012206545943627134,
+ 0.00011946412996621802
+ ],
+ "bp_grad_F": [
+ 0.10045517235994339,
+ 0.018744034692645073,
+ 0.0122413644567132,
+ 0.012060520239174366,
+ 0.011960742995142937
+ ],
+ "gamma_dfa": 0.06293319165706635,
+ "gamma_dfa_per_layer": [
+ 0.02326873689889908,
+ 0.06609776616096497,
+ 0.07875392585992813,
+ 0.0836123377084732
+ ],
+ "acc_eval": 0.6760000586509705,
+ "loss_eval": 0.9358338713645935,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 33.2861213684082,
+ 214.81686401367188,
+ 376.10357666015625,
+ 536.3932495117188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008684046333655715,
+ 0.0001622825366212055,
+ 0.00011986666504526511,
+ 0.00011786946561187506,
+ 0.00011659466690616682
+ ],
+ "bp_grad_F": [
+ 0.10286933183670044,
+ 0.018639566376805305,
+ 0.012188107706606388,
+ 0.01201487798243761,
+ 0.011918813921511173
+ ],
+ "gamma_dfa": 0.06226353673264384,
+ "gamma_dfa_per_layer": [
+ 0.023258207365870476,
+ 0.06267606467008591,
+ 0.0803714394569397,
+ 0.08274843543767929
+ ],
+ "acc_eval": 0.6810000538825989,
+ "loss_eval": 0.9304502010345459,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 33.87834167480469,
+ 220.428466796875,
+ 384.2508850097656,
+ 548.2610473632812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007953296881169081,
+ 0.00014800684584770352,
+ 0.00011162432201672345,
+ 0.00011058645759476349,
+ 0.00010956013284157962
+ ],
+ "bp_grad_F": [
+ 0.10028568655252457,
+ 0.018069755285978317,
+ 0.011859637685120106,
+ 0.011696909554302692,
+ 0.01160619780421257
+ ],
+ "gamma_dfa": 0.06300693331286311,
+ "gamma_dfa_per_layer": [
+ 0.027522550895810127,
+ 0.06186108663678169,
+ 0.07987839728593826,
+ 0.08276569843292236
+ ],
+ "acc_eval": 0.6955000162124634,
+ "loss_eval": 0.8840450048446655,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 34.509605407714844,
+ 225.59780883789062,
+ 393.6628112792969,
+ 561.568115234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008583659655414522,
+ 0.00015650303976144642,
+ 0.00011532937787706032,
+ 0.00011489073949633166,
+ 0.00011400022049201652
+ ],
+ "bp_grad_F": [
+ 0.09966019541025162,
+ 0.018014561384916306,
+ 0.012010997161269188,
+ 0.011846955865621567,
+ 0.011755259707570076
+ ],
+ "gamma_dfa": 0.06271304981783032,
+ "gamma_dfa_per_layer": [
+ 0.029912440106272697,
+ 0.06141362711787224,
+ 0.0793088749051094,
+ 0.08021725714206696
+ ],
+ "acc_eval": 0.687000036239624,
+ "loss_eval": 0.9074093103408813,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 35.15583801269531,
+ 230.31370544433594,
+ 402.0650634765625,
+ 574.2296752929688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008762985817156732,
+ 0.00015229854034259915,
+ 0.00011411930609028786,
+ 0.0001132417019107379,
+ 0.00011245955829508603
+ ],
+ "bp_grad_F": [
+ 0.09909173101186752,
+ 0.017660830169916153,
+ 0.011859647929668427,
+ 0.011700768023729324,
+ 0.011612875387072563
+ ],
+ "gamma_dfa": 0.059298016130924225,
+ "gamma_dfa_per_layer": [
+ 0.026200097054243088,
+ 0.0549272783100605,
+ 0.0762626901268959,
+ 0.0798019990324974
+ ],
+ "acc_eval": 0.7035000324249268,
+ "loss_eval": 0.8701910376548767,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 35.66206741333008,
+ 234.8238983154297,
+ 409.3634033203125,
+ 584.876953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009031461668200791,
+ 0.00016782402235548943,
+ 0.00012555152352433652,
+ 0.0001250550412805751,
+ 0.000123959660413675
+ ],
+ "bp_grad_F": [
+ 0.09997168928384781,
+ 0.01780031807720661,
+ 0.012050634250044823,
+ 0.011898917146027088,
+ 0.011813494376838207
+ ],
+ "gamma_dfa": 0.06037319032475352,
+ "gamma_dfa_per_layer": [
+ 0.028592003509402275,
+ 0.05390740931034088,
+ 0.07796172052621841,
+ 0.08103162795305252
+ ],
+ "acc_eval": 0.6850000619888306,
+ "loss_eval": 0.9033781886100769,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 36.278228759765625,
+ 239.4936981201172,
+ 417.3722229003906,
+ 596.1981201171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009072510292753577,
+ 0.00015473780513275415,
+ 0.00011584340245462954,
+ 0.00011548803740879521,
+ 0.00011424912372604012
+ ],
+ "bp_grad_F": [
+ 0.10279728472232819,
+ 0.017760641872882843,
+ 0.012076830491423607,
+ 0.01192280650138855,
+ 0.011838974431157112
+ ],
+ "gamma_dfa": 0.05956542398780584,
+ "gamma_dfa_per_layer": [
+ 0.025189489126205444,
+ 0.05668117478489876,
+ 0.07571582496166229,
+ 0.08067520707845688
+ ],
+ "acc_eval": 0.6835000514984131,
+ "loss_eval": 0.9166074395179749,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 36.87733459472656,
+ 244.1138153076172,
+ 425.2259826660156,
+ 607.8081665039062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008976306999102235,
+ 0.00015640830679330975,
+ 0.00012026254989905283,
+ 0.00011915730283362791,
+ 0.00011880237434525043
+ ],
+ "bp_grad_F": [
+ 0.10276701301336288,
+ 0.017705289646983147,
+ 0.012149399146437645,
+ 0.01199993398040533,
+ 0.01191749982535839
+ ],
+ "gamma_dfa": 0.05778269004076719,
+ "gamma_dfa_per_layer": [
+ 0.02565983682870865,
+ 0.051832567900419235,
+ 0.07554878294467926,
+ 0.07808957248926163
+ ],
+ "acc_eval": 0.6880000233650208,
+ "loss_eval": 0.9326384663581848,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 37.373634338378906,
+ 248.1051483154297,
+ 432.9554748535156,
+ 618.172607421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009300907258875668,
+ 0.00016527887783013284,
+ 0.00012494091060943902,
+ 0.00012375703954603523,
+ 0.00012343957496341318
+ ],
+ "bp_grad_F": [
+ 0.10167930275201797,
+ 0.017580606043338776,
+ 0.01197358313947916,
+ 0.01181697752326727,
+ 0.011733012273907661
+ ],
+ "gamma_dfa": 0.059646998066455126,
+ "gamma_dfa_per_layer": [
+ 0.025086766108870506,
+ 0.05520859733223915,
+ 0.0782475471496582,
+ 0.08004508167505264
+ ],
+ "acc_eval": 0.6935000419616699,
+ "loss_eval": 0.9074762463569641,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 37.94633483886719,
+ 252.25924682617188,
+ 439.8863525390625,
+ 628.1370239257812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008688273373991251,
+ 0.00015619541227351874,
+ 0.00011818459461210296,
+ 0.00011805404938058928,
+ 0.00011655993148451671
+ ],
+ "bp_grad_F": [
+ 0.10280012339353561,
+ 0.017362425103783607,
+ 0.012144921347498894,
+ 0.012009261175990105,
+ 0.011929930187761784
+ ],
+ "gamma_dfa": 0.057152220979332924,
+ "gamma_dfa_per_layer": [
+ 0.026838082820177078,
+ 0.05145636573433876,
+ 0.07389623671770096,
+ 0.0764181986451149
+ ],
+ "acc_eval": 0.6780000329017639,
+ "loss_eval": 0.9220576286315918,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 38.43475341796875,
+ 256.3348388671875,
+ 446.7797546386719,
+ 638.6549072265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009689890430308878,
+ 0.0001675912644714117,
+ 0.00013143723481334746,
+ 0.00012922017776872963,
+ 0.00012865127064287663
+ ],
+ "bp_grad_F": [
+ 0.10019267350435257,
+ 0.017157867550849915,
+ 0.012005961500108242,
+ 0.01186591386795044,
+ 0.011786815710365772
+ ],
+ "gamma_dfa": 0.05704171909019351,
+ "gamma_dfa_per_layer": [
+ 0.02657354436814785,
+ 0.04850248247385025,
+ 0.07429356873035431,
+ 0.07879728078842163
+ ],
+ "acc_eval": 0.6815000176429749,
+ "loss_eval": 0.9045827388763428,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 38.949981689453125,
+ 259.91455078125,
+ 453.5318603515625,
+ 649.1691284179688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008703607600182295,
+ 0.0001509855646872893,
+ 0.00011334709415677935,
+ 0.00011273188283666968,
+ 0.00011187820200575516
+ ],
+ "bp_grad_F": [
+ 0.10038246959447861,
+ 0.017015060409903526,
+ 0.011884159408509731,
+ 0.011748326942324638,
+ 0.01167102251201868
+ ],
+ "gamma_dfa": 0.056442280765622854,
+ "gamma_dfa_per_layer": [
+ 0.024923482909798622,
+ 0.04813612625002861,
+ 0.07466092705726624,
+ 0.07804858684539795
+ ],
+ "acc_eval": 0.6880000233650208,
+ "loss_eval": 0.8986373543739319,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 39.40317916870117,
+ 263.8382873535156,
+ 459.8589782714844,
+ 657.81396484375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008396115736104548,
+ 0.00014526791346725076,
+ 0.0001117709616664797,
+ 0.0001101615052903071,
+ 0.00010919143096543849
+ ],
+ "bp_grad_F": [
+ 0.10223646461963654,
+ 0.01701364293694496,
+ 0.011921641416847706,
+ 0.011793220415711403,
+ 0.01171908900141716
+ ],
+ "gamma_dfa": 0.05634786421433091,
+ "gamma_dfa_per_layer": [
+ 0.023860810324549675,
+ 0.05130583420395851,
+ 0.0730678141117096,
+ 0.07715699821710587
+ ],
+ "acc_eval": 0.6845000386238098,
+ "loss_eval": 0.9070615172386169,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 39.78729248046875,
+ 267.06787109375,
+ 465.8781433105469,
+ 665.705078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008805220131762326,
+ 0.0001506610424257815,
+ 0.0001190964540001005,
+ 0.00011831042502308264,
+ 0.0001174084609374404
+ ],
+ "bp_grad_F": [
+ 0.09873763471841812,
+ 0.01661210134625435,
+ 0.011734068393707275,
+ 0.011604530736804008,
+ 0.011532736010849476
+ ],
+ "gamma_dfa": 0.057100610341876745,
+ "gamma_dfa_per_layer": [
+ 0.025687912479043007,
+ 0.05223910138010979,
+ 0.07347920536994934,
+ 0.07699622213840485
+ ],
+ "acc_eval": 0.7010000348091125,
+ "loss_eval": 0.8647292256355286,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 40.20953369140625,
+ 270.48760986328125,
+ 471.71197509765625,
+ 674.6234741210938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008946783491410315,
+ 0.0001546104613225907,
+ 0.00012653943849727511,
+ 0.0001261695142602548,
+ 0.00012597300519701093
+ ],
+ "bp_grad_F": [
+ 0.10005417466163635,
+ 0.016553794965147972,
+ 0.011853700503706932,
+ 0.011732862330973148,
+ 0.01166335679590702
+ ],
+ "gamma_dfa": 0.056281615514308214,
+ "gamma_dfa_per_layer": [
+ 0.02603459171950817,
+ 0.051092494279146194,
+ 0.07222969830036163,
+ 0.07576967775821686
+ ],
+ "acc_eval": 0.6895000338554382,
+ "loss_eval": 0.8898184299468994,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 40.61681365966797,
+ 273.5674743652344,
+ 477.6903381347656,
+ 683.2316284179688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009305709972977638,
+ 0.0001684492890490219,
+ 0.00013056330499239266,
+ 0.00013055883755441755,
+ 0.00012972661352250725
+ ],
+ "bp_grad_F": [
+ 0.10108529776334763,
+ 0.01676928997039795,
+ 0.012042575515806675,
+ 0.011920345947146416,
+ 0.011849730275571346
+ ],
+ "gamma_dfa": 0.05756285693496466,
+ "gamma_dfa_per_layer": [
+ 0.028283007442951202,
+ 0.04865947738289833,
+ 0.0757322907447815,
+ 0.0775766521692276
+ ],
+ "acc_eval": 0.6825000047683716,
+ "loss_eval": 0.9249827861785889,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 40.986331939697266,
+ 276.55340576171875,
+ 482.9735412597656,
+ 690.4827880859375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009371762280352414,
+ 0.00015377832460217178,
+ 0.00011931644257856533,
+ 0.00011877353972522542,
+ 0.00011843052197946236
+ ],
+ "bp_grad_F": [
+ 0.10423478484153748,
+ 0.01686144433915615,
+ 0.012089447118341923,
+ 0.011962956748902798,
+ 0.011895008385181427
+ ],
+ "gamma_dfa": 0.05634950753301382,
+ "gamma_dfa_per_layer": [
+ 0.024047940969467163,
+ 0.05029236152768135,
+ 0.07294473052024841,
+ 0.07811299711465836
+ ],
+ "acc_eval": 0.6770000457763672,
+ "loss_eval": 0.9276119470596313,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 41.36444091796875,
+ 279.21368408203125,
+ 487.9245910644531,
+ 698.8203735351562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009180991910398006,
+ 0.00016040228365454823,
+ 0.00012619509652722627,
+ 0.0001242315920535475,
+ 0.00012414241791702807
+ ],
+ "bp_grad_F": [
+ 0.09876055270433426,
+ 0.016378939151763916,
+ 0.011831536889076233,
+ 0.011710439808666706,
+ 0.011641835793852806
+ ],
+ "gamma_dfa": 0.056217589881271124,
+ "gamma_dfa_per_layer": [
+ 0.026943759992718697,
+ 0.04981214925646782,
+ 0.0719020888209343,
+ 0.07621236145496368
+ ],
+ "acc_eval": 0.6945000290870667,
+ "loss_eval": 0.8922800421714783,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 41.725521087646484,
+ 282.2077331542969,
+ 492.55194091796875,
+ 705.709228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009282235405407846,
+ 0.00015841209096834064,
+ 0.00012215816241223365,
+ 0.0001216854143422097,
+ 0.0001213739305967465
+ ],
+ "bp_grad_F": [
+ 0.10062722116708755,
+ 0.016464965417981148,
+ 0.011968642473220825,
+ 0.011850792914628983,
+ 0.011783461086452007
+ ],
+ "gamma_dfa": 0.05594501877203584,
+ "gamma_dfa_per_layer": [
+ 0.027507653459906578,
+ 0.047868166118860245,
+ 0.07275017350912094,
+ 0.07565408200025558
+ ],
+ "acc_eval": 0.674500048160553,
+ "loss_eval": 0.9168669581413269,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 42.07438659667969,
+ 284.91143798828125,
+ 497.33489990234375,
+ 712.7407836914062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008946438319981098,
+ 0.0001599262177478522,
+ 0.0001243542501470074,
+ 0.00012355486978776753,
+ 0.0001230162160936743
+ ],
+ "bp_grad_F": [
+ 0.09976927936077118,
+ 0.016204386949539185,
+ 0.011793862096965313,
+ 0.011675998568534851,
+ 0.01161060482263565
+ ],
+ "gamma_dfa": 0.057106493040919304,
+ "gamma_dfa_per_layer": [
+ 0.025031987577676773,
+ 0.05149566009640694,
+ 0.07346570491790771,
+ 0.07843261957168579
+ ],
+ "acc_eval": 0.6895000338554382,
+ "loss_eval": 0.8812824487686157,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 42.312625885009766,
+ 287.158447265625,
+ 501.61053466796875,
+ 718.7759399414062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008852323517203331,
+ 0.0001484409294789657,
+ 0.00011503385030664504,
+ 0.00011482135596452281,
+ 0.00011442313552834094
+ ],
+ "bp_grad_F": [
+ 0.10061701387166977,
+ 0.016211561858654022,
+ 0.011752818711102009,
+ 0.011636910028755665,
+ 0.011571302078664303
+ ],
+ "gamma_dfa": 0.055246823001652956,
+ "gamma_dfa_per_layer": [
+ 0.024583658203482628,
+ 0.04850705340504646,
+ 0.07144256681203842,
+ 0.07645401358604431
+ ],
+ "acc_eval": 0.6955000162124634,
+ "loss_eval": 0.888053834438324,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 42.61886978149414,
+ 289.2788391113281,
+ 505.75390625,
+ 724.4559326171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009071374079212546,
+ 0.00015266452101059258,
+ 0.00011854806507471949,
+ 0.00011884445120813325,
+ 0.00011772327707149088
+ ],
+ "bp_grad_F": [
+ 0.10303837805986404,
+ 0.016465138643980026,
+ 0.011987767182290554,
+ 0.011867417953908443,
+ 0.011802136898040771
+ ],
+ "gamma_dfa": 0.05469688028097153,
+ "gamma_dfa_per_layer": [
+ 0.02719976380467415,
+ 0.04610869660973549,
+ 0.07147730141878128,
+ 0.07400175929069519
+ ],
+ "acc_eval": 0.6820000410079956,
+ "loss_eval": 0.9107973575592041,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 42.90008544921875,
+ 291.5098876953125,
+ 509.49200439453125,
+ 730.070068359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009346315637230873,
+ 0.00017380902136210352,
+ 0.00014277170703280717,
+ 0.0001402509369654581,
+ 0.00014013791223987937
+ ],
+ "bp_grad_F": [
+ 0.10035568475723267,
+ 0.016459215432405472,
+ 0.012036965228617191,
+ 0.011920913122594357,
+ 0.01185610517859459
+ ],
+ "gamma_dfa": 0.055851065553724766,
+ "gamma_dfa_per_layer": [
+ 0.026028182357549667,
+ 0.04594290256500244,
+ 0.07459361851215363,
+ 0.07683955878019333
+ ],
+ "acc_eval": 0.6720000505447388,
+ "loss_eval": 0.9282984733581543,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 43.15349197387695,
+ 293.65966796875,
+ 513.3607177734375,
+ 735.3644409179688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009396777604706585,
+ 0.00015277721104212105,
+ 0.00012291918392293155,
+ 0.00012154672003816813,
+ 0.00012096676073269919
+ ],
+ "bp_grad_F": [
+ 0.10190626233816147,
+ 0.016208121553063393,
+ 0.011865625157952309,
+ 0.011748027056455612,
+ 0.011683868244290352
+ ],
+ "gamma_dfa": 0.05457223346456885,
+ "gamma_dfa_per_layer": [
+ 0.02600257657468319,
+ 0.046096257865428925,
+ 0.0713086724281311,
+ 0.0748814269900322
+ ],
+ "acc_eval": 0.6920000314712524,
+ "loss_eval": 0.8892928957939148,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 43.37159729003906,
+ 295.3875732421875,
+ 516.53369140625,
+ 740.1768798828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008509810431860387,
+ 0.000149228420923464,
+ 0.00012114718265365809,
+ 0.00012038950808346272,
+ 0.00011932845518458635
+ ],
+ "bp_grad_F": [
+ 0.09941542148590088,
+ 0.015937170013785362,
+ 0.01166422851383686,
+ 0.011551388539373875,
+ 0.011488799005746841
+ ],
+ "gamma_dfa": 0.053473991341888905,
+ "gamma_dfa_per_layer": [
+ 0.0227724090218544,
+ 0.045084040611982346,
+ 0.07109282910823822,
+ 0.07494668662548065
+ ],
+ "acc_eval": 0.6945000290870667,
+ "loss_eval": 0.8690445423126221,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 43.58628463745117,
+ 297.0165710449219,
+ 519.4993286132812,
+ 744.6467895507812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009939862648025155,
+ 0.0001676510728430003,
+ 0.00013252485950943083,
+ 0.0001307348720729351,
+ 0.0001300926087424159
+ ],
+ "bp_grad_F": [
+ 0.10170887410640717,
+ 0.016186155378818512,
+ 0.011895725503563881,
+ 0.011782051995396614,
+ 0.0117182033136487
+ ],
+ "gamma_dfa": 0.05389358149841428,
+ "gamma_dfa_per_layer": [
+ 0.024122020229697227,
+ 0.04528462514281273,
+ 0.0715978741645813,
+ 0.07456980645656586
+ ],
+ "acc_eval": 0.6840000152587891,
+ "loss_eval": 0.9150904417037964,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 43.756309509277344,
+ 298.4603576660156,
+ 522.1862182617188,
+ 748.0980224609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009121120092459023,
+ 0.00015141229960136116,
+ 0.00012266664998605847,
+ 0.00012074616097379476,
+ 0.00012072239769622684
+ ],
+ "bp_grad_F": [
+ 0.09929168969392776,
+ 0.015882758423686028,
+ 0.011736094020307064,
+ 0.011626454070210457,
+ 0.011565400287508965
+ ],
+ "gamma_dfa": 0.05446606734767556,
+ "gamma_dfa_per_layer": [
+ 0.023944402113556862,
+ 0.04696139693260193,
+ 0.07070320099592209,
+ 0.07625526934862137
+ ],
+ "acc_eval": 0.6895000338554382,
+ "loss_eval": 0.8752753138542175,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 43.956050872802734,
+ 299.8046569824219,
+ 524.5073852539062,
+ 751.9002075195312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009328208980150521,
+ 0.00015578871534671634,
+ 0.00012375388178043067,
+ 0.00012286445416975766,
+ 0.0001222269784193486
+ ],
+ "bp_grad_F": [
+ 0.09782548248767853,
+ 0.015724968165159225,
+ 0.011678245849907398,
+ 0.01156895887106657,
+ 0.01150886993855238
+ ],
+ "gamma_dfa": 0.05415696511045098,
+ "gamma_dfa_per_layer": [
+ 0.025110432878136635,
+ 0.04582852125167847,
+ 0.07056943327188492,
+ 0.07511947304010391
+ ],
+ "acc_eval": 0.6910000443458557,
+ "loss_eval": 0.8689600825309753,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.10476303100586,
+ 301.22088623046875,
+ 527.0880737304688,
+ 755.537109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009187725954689085,
+ 0.0001580083044245839,
+ 0.00012691691517829895,
+ 0.00012647418770939112,
+ 0.00012595193402376026
+ ],
+ "bp_grad_F": [
+ 0.09907824546098709,
+ 0.01592797227203846,
+ 0.011772784404456615,
+ 0.011660448275506496,
+ 0.011597777716815472
+ ],
+ "gamma_dfa": 0.053306530229747295,
+ "gamma_dfa_per_layer": [
+ 0.025752168148756027,
+ 0.04250373691320419,
+ 0.07085125893354416,
+ 0.0741189569234848
+ ],
+ "acc_eval": 0.6785000562667847,
+ "loss_eval": 0.8745812773704529,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.272037506103516,
+ 302.41107177734375,
+ 529.3627319335938,
+ 758.9468383789062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009381037671118975,
+ 0.00015578897728119045,
+ 0.00012793939094990492,
+ 0.00012725923443213105,
+ 0.00012640930071938783
+ ],
+ "bp_grad_F": [
+ 0.09839630872011185,
+ 0.015703976154327393,
+ 0.011679527349770069,
+ 0.01157388836145401,
+ 0.011512565426528454
+ ],
+ "gamma_dfa": 0.053105687256902456,
+ "gamma_dfa_per_layer": [
+ 0.022858327254652977,
+ 0.04474852979183197,
+ 0.06992355734109879,
+ 0.07489233464002609
+ ],
+ "acc_eval": 0.6865000128746033,
+ "loss_eval": 0.8636536002159119,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.36368942260742,
+ 303.7563781738281,
+ 531.5054931640625,
+ 762.388427734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009112239349633455,
+ 0.0001562510442454368,
+ 0.00013036206655669957,
+ 0.00012987821537535638,
+ 0.0001294936373597011
+ ],
+ "bp_grad_F": [
+ 0.09861280024051666,
+ 0.015790371224284172,
+ 0.011699686758220196,
+ 0.01159034576267004,
+ 0.011528948321938515
+ ],
+ "gamma_dfa": 0.05348377674818039,
+ "gamma_dfa_per_layer": [
+ 0.0251171812415123,
+ 0.04412227123975754,
+ 0.07024820148944855,
+ 0.07444745302200317
+ ],
+ "acc_eval": 0.6885000467300415,
+ "loss_eval": 0.8699802160263062,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.498130798339844,
+ 304.7552185058594,
+ 533.51318359375,
+ 765.1610717773438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008680672035552561,
+ 0.00014313006249722093,
+ 0.00011654605623334646,
+ 0.00011439070658525452,
+ 0.00011445816198829561
+ ],
+ "bp_grad_F": [
+ 0.0990181565284729,
+ 0.015660114586353302,
+ 0.011611604131758213,
+ 0.011503342539072037,
+ 0.011442977003753185
+ ],
+ "gamma_dfa": 0.05415269639343023,
+ "gamma_dfa_per_layer": [
+ 0.024549636989831924,
+ 0.0454377755522728,
+ 0.07077726721763611,
+ 0.0758461058139801
+ ],
+ "acc_eval": 0.6960000395774841,
+ "loss_eval": 0.8598873615264893,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.600582122802734,
+ 305.7388610839844,
+ 534.99951171875,
+ 767.8171997070312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008962214924395084,
+ 0.00015309070295188576,
+ 0.00012299958325456828,
+ 0.000121716657304205,
+ 0.0001212474235217087
+ ],
+ "bp_grad_F": [
+ 0.10033439099788666,
+ 0.015828289091587067,
+ 0.011728483252227306,
+ 0.01162028405815363,
+ 0.011559616774320602
+ ],
+ "gamma_dfa": 0.05304920673370361,
+ "gamma_dfa_per_layer": [
+ 0.02494572103023529,
+ 0.043708547949790955,
+ 0.06946250051259995,
+ 0.07408005744218826
+ ],
+ "acc_eval": 0.6895000338554382,
+ "loss_eval": 0.8800998330116272,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.70732879638672,
+ 306.55181884765625,
+ 536.31005859375,
+ 769.971923828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009149253601208329,
+ 0.00015781939146108925,
+ 0.00012933975085616112,
+ 0.00012773934577126056,
+ 0.00012716377386823297
+ ],
+ "bp_grad_F": [
+ 0.09770160913467407,
+ 0.015633704140782356,
+ 0.011657179333269596,
+ 0.011551215313374996,
+ 0.011491267941892147
+ ],
+ "gamma_dfa": 0.05268599092960358,
+ "gamma_dfa_per_layer": [
+ 0.024415917694568634,
+ 0.04385191947221756,
+ 0.06913819909095764,
+ 0.07333792746067047
+ ],
+ "acc_eval": 0.6930000185966492,
+ "loss_eval": 0.8666836023330688,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.78550338745117,
+ 307.4527893066406,
+ 537.914306640625,
+ 771.5177612304688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000909268157556653,
+ 0.0001503752137068659,
+ 0.00012163108476670459,
+ 0.00012035916006425396,
+ 0.00012008652265649289
+ ],
+ "bp_grad_F": [
+ 0.09915008395910263,
+ 0.015667738392949104,
+ 0.011642162688076496,
+ 0.01153358444571495,
+ 0.011473594233393669
+ ],
+ "gamma_dfa": 0.05392309743911028,
+ "gamma_dfa_per_layer": [
+ 0.023599978536367416,
+ 0.04531348496675491,
+ 0.07121817022562027,
+ 0.07556075602769852
+ ],
+ "acc_eval": 0.6955000162124634,
+ "loss_eval": 0.8635799884796143,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.858604431152344,
+ 308.1347961425781,
+ 538.9302368164062,
+ 773.1725463867188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009114991407841444,
+ 0.00015059093129821122,
+ 0.00012239563511684537,
+ 0.00012128813978051767,
+ 0.00012036858242936432
+ ],
+ "bp_grad_F": [
+ 0.0976131409406662,
+ 0.015529998578131199,
+ 0.01157119870185852,
+ 0.011464742012321949,
+ 0.01140571665018797
+ ],
+ "gamma_dfa": 0.05296219326555729,
+ "gamma_dfa_per_layer": [
+ 0.02382323145866394,
+ 0.04349217563867569,
+ 0.0696524977684021,
+ 0.07488086819648743
+ ],
+ "acc_eval": 0.6940000057220459,
+ "loss_eval": 0.8525131344795227,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.92080307006836,
+ 308.6539001464844,
+ 539.7476806640625,
+ 774.7044067382812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009130545658990741,
+ 0.0001561250537633896,
+ 0.00012542278273031116,
+ 0.0001241281715920195,
+ 0.0001238062686752528
+ ],
+ "bp_grad_F": [
+ 0.0973346009850502,
+ 0.015503575094044209,
+ 0.01158667542040348,
+ 0.011482889764010906,
+ 0.01142406091094017
+ ],
+ "gamma_dfa": 0.05284834885969758,
+ "gamma_dfa_per_layer": [
+ 0.023774540051817894,
+ 0.04253865405917168,
+ 0.0699956938624382,
+ 0.07508450746536255
+ ],
+ "acc_eval": 0.6875000596046448,
+ "loss_eval": 0.8490641713142395,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 44.97352600097656,
+ 309.19366455078125,
+ 540.6045532226562,
+ 775.7159423828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008941096602939069,
+ 0.0001490603171987459,
+ 0.00012243444507475942,
+ 0.00012086174683645368,
+ 0.00011930170876439661
+ ],
+ "bp_grad_F": [
+ 0.0978497788310051,
+ 0.015526177361607552,
+ 0.011586111970245838,
+ 0.011480187065899372,
+ 0.011420912109315395
+ ],
+ "gamma_dfa": 0.052993528079241514,
+ "gamma_dfa_per_layer": [
+ 0.02384653501212597,
+ 0.04263130575418472,
+ 0.0702076405286789,
+ 0.07528863102197647
+ ],
+ "acc_eval": 0.6950000524520874,
+ "loss_eval": 0.8494359850883484,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.018131256103516,
+ 309.6293640136719,
+ 541.2432861328125,
+ 776.7703857421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009062750032171607,
+ 0.00015435971727129072,
+ 0.00012295282795093954,
+ 0.00012264182441867888,
+ 0.00012187549873488024
+ ],
+ "bp_grad_F": [
+ 0.0975913405418396,
+ 0.015510785393416882,
+ 0.011592722497880459,
+ 0.011488175950944424,
+ 0.011429551988840103
+ ],
+ "gamma_dfa": 0.05261069582775235,
+ "gamma_dfa_per_layer": [
+ 0.023613562807440758,
+ 0.04278940334916115,
+ 0.06959826499223709,
+ 0.07444155216217041
+ ],
+ "acc_eval": 0.6895000338554382,
+ "loss_eval": 0.8503831624984741,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.05687713623047,
+ 309.88616943359375,
+ 541.6970825195312,
+ 777.6474609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009167437092401087,
+ 0.00015087658539414406,
+ 0.00012154471187386662,
+ 0.00012103841436328366,
+ 0.00012099531886633486
+ ],
+ "bp_grad_F": [
+ 0.09737422317266464,
+ 0.015458790585398674,
+ 0.011581062339246273,
+ 0.011477372609078884,
+ 0.01141849160194397
+ ],
+ "gamma_dfa": 0.05269155744463205,
+ "gamma_dfa_per_layer": [
+ 0.02412768080830574,
+ 0.04288121312856674,
+ 0.06955435872077942,
+ 0.07420297712087631
+ ],
+ "acc_eval": 0.6875000596046448,
+ "loss_eval": 0.8513321280479431,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.083457946777344,
+ 310.21551513671875,
+ 542.2005615234375,
+ 778.2576904296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009331087348982692,
+ 0.00015250151045620441,
+ 0.00012407499889377505,
+ 0.00012352959311101586,
+ 0.0001235192030435428
+ ],
+ "bp_grad_F": [
+ 0.09731114655733109,
+ 0.015489363111555576,
+ 0.011589608155190945,
+ 0.011484977789223194,
+ 0.01142611913383007
+ ],
+ "gamma_dfa": 0.05234858160838485,
+ "gamma_dfa_per_layer": [
+ 0.023583704605698586,
+ 0.04196107015013695,
+ 0.06969348341226578,
+ 0.07415606826543808
+ ],
+ "acc_eval": 0.6885000467300415,
+ "loss_eval": 0.8485224843025208,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.10480499267578,
+ 310.4107360839844,
+ 542.5189819335938,
+ 778.7670288085938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009211195865646005,
+ 0.00015081235324032605,
+ 0.00012383687135297805,
+ 0.00012388851610012352,
+ 0.0001234857481904328
+ ],
+ "bp_grad_F": [
+ 0.097723089158535,
+ 0.015484371222555637,
+ 0.011575440876185894,
+ 0.011470203287899494,
+ 0.011411197483539581
+ ],
+ "gamma_dfa": 0.052400246262550354,
+ "gamma_dfa_per_layer": [
+ 0.023820150643587112,
+ 0.04187368229031563,
+ 0.06974346935749054,
+ 0.07416368275880814
+ ],
+ "acc_eval": 0.690500020980835,
+ "loss_eval": 0.8478801250457764,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.121337890625,
+ 310.5526123046875,
+ 542.789794921875,
+ 779.1331787109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009062032913789153,
+ 0.00014932811609469354,
+ 0.00012137479643570259,
+ 0.00012096992577426136,
+ 0.00012082025205017999
+ ],
+ "bp_grad_F": [
+ 0.09714466333389282,
+ 0.015453615225851536,
+ 0.011561346240341663,
+ 0.011457313783466816,
+ 0.0113987410441041
+ ],
+ "gamma_dfa": 0.05261371610686183,
+ "gamma_dfa_per_layer": [
+ 0.023706024512648582,
+ 0.04261678457260132,
+ 0.06977313756942749,
+ 0.07435891777276993
+ ],
+ "acc_eval": 0.6915000081062317,
+ "loss_eval": 0.846295177936554,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.13352584838867,
+ 310.6623840332031,
+ 542.9544067382812,
+ 779.3726196289062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009290048037655652,
+ 0.0001487880654167384,
+ 0.00012229036656208336,
+ 0.0001213839859701693,
+ 0.00012132866686442867
+ ],
+ "bp_grad_F": [
+ 0.09700886905193329,
+ 0.015427183359861374,
+ 0.011550018563866615,
+ 0.011446088552474976,
+ 0.011387485079467297
+ ],
+ "gamma_dfa": 0.05256890505552292,
+ "gamma_dfa_per_layer": [
+ 0.023696668446063995,
+ 0.04250160604715347,
+ 0.06959902495145798,
+ 0.07447832077741623
+ ],
+ "acc_eval": 0.6925000548362732,
+ "loss_eval": 0.8456347584724426,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.14185333251953,
+ 310.71917724609375,
+ 543.0736694335938,
+ 779.531982421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009128348319791257,
+ 0.00014947194722481072,
+ 0.0001214019866893068,
+ 0.000121481396490708,
+ 0.00012067624629708007
+ ],
+ "bp_grad_F": [
+ 0.09731098264455795,
+ 0.015439406037330627,
+ 0.011552426032721996,
+ 0.01144845224916935,
+ 0.011389924213290215
+ ],
+ "gamma_dfa": 0.0525772743858397,
+ "gamma_dfa_per_layer": [
+ 0.023648327216506004,
+ 0.0424870140850544,
+ 0.06964967399835587,
+ 0.07452408224344254
+ ],
+ "acc_eval": 0.6945000290870667,
+ "loss_eval": 0.8456541895866394,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.14662170410156,
+ 310.7527160644531,
+ 543.1363525390625,
+ 779.6199951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009132170234806836,
+ 0.00014713683049194515,
+ 0.00012075807899236679,
+ 0.00011999421985819936,
+ 0.00011943812569370493
+ ],
+ "bp_grad_F": [
+ 0.09724143892526627,
+ 0.01543473545461893,
+ 0.011546480469405651,
+ 0.0114423343911767,
+ 0.011383815668523312
+ ],
+ "gamma_dfa": 0.0526476064696908,
+ "gamma_dfa_per_layer": [
+ 0.023711953312158585,
+ 0.0426546186208725,
+ 0.06969036906957626,
+ 0.07453348487615585
+ ],
+ "acc_eval": 0.6925000548362732,
+ "loss_eval": 0.8444594740867615,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.14855194091797,
+ 310.77044677734375,
+ 543.1617431640625,
+ 779.6598510742188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009067560313269496,
+ 0.00014785665553063154,
+ 0.00012018840061500669,
+ 0.00011918631935259327,
+ 0.00011903052654815838
+ ],
+ "bp_grad_F": [
+ 0.09721538424491882,
+ 0.015435173176229,
+ 0.01154935173690319,
+ 0.011445209383964539,
+ 0.011386674828827381
+ ],
+ "gamma_dfa": 0.05261166812852025,
+ "gamma_dfa_per_layer": [
+ 0.023721175268292427,
+ 0.042552798986434937,
+ 0.06965683400630951,
+ 0.07451586425304413
+ ],
+ "acc_eval": 0.6930000185966492,
+ "loss_eval": 0.8448338508605957,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 45.149070739746094,
+ 310.77496337890625,
+ 543.169189453125,
+ 779.66943359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009094586130231619,
+ 0.00014742475468665361,
+ 0.00012030002835672349,
+ 0.00011929625179618597,
+ 0.00011879605881404132
+ ],
+ "bp_grad_F": [
+ 0.09719900041818619,
+ 0.015434404835104942,
+ 0.011549265123903751,
+ 0.011445139534771442,
+ 0.011386608704924583
+ ],
+ "gamma_dfa": 0.05260759778320789,
+ "gamma_dfa_per_layer": [
+ 0.023730866611003876,
+ 0.04254307597875595,
+ 0.06965382397174835,
+ 0.0745026245713234
+ ],
+ "acc_eval": 0.6930000185966492,
+ "loss_eval": 0.844819962978363,
+ "epoch": 80
+ }
+ ]
+} \ No newline at end of file