summaryrefslogtreecommitdiff
path: root/results/snapshot_evolution_v2/snapshot_evolution_s123.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_evolution_s123.json')
-rw-r--r--results/snapshot_evolution_v2/snapshot_evolution_s123.json5473
1 files changed, 5473 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s123.json b/results/snapshot_evolution_v2/snapshot_evolution_s123.json
new file mode 100644
index 0000000..4ccefc8
--- /dev/null
+++ b/results/snapshot_evolution_v2/snapshot_evolution_s123.json
@@ -0,0 +1,5473 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_evolution_v2",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 123,
+ "depth": 4,
+ "d_hidden": 256,
+ "log_every": 1
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 8.690464973449707,
+ 8.719978332519531,
+ 8.73093318939209,
+ 8.75937271118164,
+ 8.790542602539062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009977436857298017,
+ 0.000992251792922616,
+ 0.0009848480112850666,
+ 0.0009761073160916567,
+ 0.0009735578205436468
+ ],
+ "bp_grad_norms_F": [
+ 0.035340383648872375,
+ 0.03499162197113037,
+ 0.03454425558447838,
+ 0.034113530069589615,
+ 0.033874060958623886
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.095703125,
+ "loss_eval": 2.486203908920288,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 78.8471908569336,
+ 81.27874755859375,
+ 85.74082946777344,
+ 93.0085678100586,
+ 99.78337860107422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.44870927114971e-05,
+ 5.06363830936607e-05,
+ 4.9749945901567116e-05,
+ 5.010423774365336e-05,
+ 5.131187572260387e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025542855728417635,
+ 0.0021727080456912518,
+ 0.002010831143707037,
+ 0.0019116367911919951,
+ 0.0019338354468345642
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.396484375,
+ "loss_eval": 1.6637382507324219,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 94.79721069335938,
+ 98.6406021118164,
+ 103.38369750976562,
+ 111.4940185546875,
+ 118.88549041748047
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.842087219003588e-05,
+ 4.405825529829599e-05,
+ 4.263824666850269e-05,
+ 4.2027873860206455e-05,
+ 4.283937960281037e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0020658739376813173,
+ 0.001806268934160471,
+ 0.001665781601332128,
+ 0.0015872427029535174,
+ 0.0015909546054899693
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4541015625,
+ "loss_eval": 1.5350896120071411,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 112.59109497070312,
+ 116.00851440429688,
+ 118.50328063964844,
+ 125.58804321289062,
+ 132.86842346191406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.3564141378737986e-05,
+ 4.136884308536537e-05,
+ 4.064830864081159e-05,
+ 3.9523682062281296e-05,
+ 3.8838741602376103e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00200729351490736,
+ 0.001785867614671588,
+ 0.0016562910750508308,
+ 0.0015452943043783307,
+ 0.0015010037459433079
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4814453125,
+ "loss_eval": 1.449176549911499,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 124.81511688232422,
+ 128.57049560546875,
+ 129.71421813964844,
+ 136.4766387939453,
+ 142.1854705810547
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.382780389278196e-05,
+ 4.2459021642571315e-05,
+ 4.143684418522753e-05,
+ 4.0614067984279245e-05,
+ 3.921420648111962e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018197334138676524,
+ 0.0016814853297546506,
+ 0.0015934663824737072,
+ 0.0015063106548041105,
+ 0.0014485444407910109
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4970703125,
+ "loss_eval": 1.4218697547912598,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 138.24440002441406,
+ 140.13018798828125,
+ 141.3839874267578,
+ 147.2488555908203,
+ 155.097412109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.045376044814475e-05,
+ 4.011149940197356e-05,
+ 3.9452468627132475e-05,
+ 3.831404319498688e-05,
+ 3.721412576851435e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017204430187121034,
+ 0.0016258049290627241,
+ 0.001551075023598969,
+ 0.0014644934562966228,
+ 0.0013933938462287188
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5078125,
+ "loss_eval": 1.3836241960525513,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 152.11605834960938,
+ 153.1806182861328,
+ 153.2488555908203,
+ 159.2217559814453,
+ 167.07318115234375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.981084591941908e-05,
+ 3.969454701291397e-05,
+ 3.9165588532341644e-05,
+ 3.808845940511674e-05,
+ 3.58163051714655e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017226944910362363,
+ 0.001611364888958633,
+ 0.0015574879944324493,
+ 0.001471089432016015,
+ 0.001374671934172511
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.525390625,
+ "loss_eval": 1.372281551361084,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 161.75347900390625,
+ 163.58787536621094,
+ 163.35731506347656,
+ 170.1693115234375,
+ 177.47879028320312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.749227471416816e-05,
+ 3.707691575982608e-05,
+ 3.776738958549686e-05,
+ 3.692766040330753e-05,
+ 3.5146917070960626e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016339722787961364,
+ 0.00156014587264508,
+ 0.0015048144850879908,
+ 0.00141648028511554,
+ 0.0013256004313006997
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.515625,
+ "loss_eval": 1.345876693725586,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 171.66441345214844,
+ 171.10499572753906,
+ 169.24270629882812,
+ 175.52674865722656,
+ 182.4739990234375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.675510379252955e-05,
+ 3.6888646718580276e-05,
+ 3.695035775308497e-05,
+ 3.644685784820467e-05,
+ 3.359343099873513e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016642085975036025,
+ 0.0015915494877845049,
+ 0.0015412021894007921,
+ 0.0014428672147914767,
+ 0.0013226643204689026
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.548828125,
+ "loss_eval": 1.323807954788208,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 177.58766174316406,
+ 178.5358123779297,
+ 176.316650390625,
+ 182.18365478515625,
+ 188.81033325195312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.550657493178733e-05,
+ 3.561190533218905e-05,
+ 3.632329753600061e-05,
+ 3.5655833926284686e-05,
+ 3.342977652209811e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016174933407455683,
+ 0.0015753052430227399,
+ 0.0015375673538073897,
+ 0.001461501931771636,
+ 0.0013270385097712278
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.54296875,
+ "loss_eval": 1.323765754699707,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 186.0078125,
+ 185.2810821533203,
+ 182.9329833984375,
+ 188.10736083984375,
+ 195.3680877685547
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5615968954516575e-05,
+ 3.5252433008281514e-05,
+ 3.600740819820203e-05,
+ 3.5232467780588195e-05,
+ 3.2765579817350954e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015362550038844347,
+ 0.001510681351646781,
+ 0.0014847773127257824,
+ 0.0014146054163575172,
+ 0.00128385319840163
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.544921875,
+ "loss_eval": 1.2933119535446167,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 193.46343994140625,
+ 194.1528778076172,
+ 190.9546661376953,
+ 196.03440856933594,
+ 201.5336151123047
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.449141877354123e-05,
+ 3.581260534701869e-05,
+ 3.6061541322851554e-05,
+ 3.5576940717874095e-05,
+ 3.29486902046483e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015161881456151605,
+ 0.0014996343525126576,
+ 0.001473701442591846,
+ 0.0013998147333040833,
+ 0.0012604170478880405
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5556640625,
+ "loss_eval": 1.2653318643569946,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 200.17047119140625,
+ 198.5863037109375,
+ 196.08795166015625,
+ 200.61297607421875,
+ 208.13084411621094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.377814937266521e-05,
+ 3.471539093879983e-05,
+ 3.4731467167148367e-05,
+ 3.4925535146612674e-05,
+ 3.2187374017667025e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014635181287303567,
+ 0.0014519579708576202,
+ 0.001435206620953977,
+ 0.0013784168986603618,
+ 0.0012511539971455932
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.546875,
+ "loss_eval": 1.2704923152923584,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 203.8260955810547,
+ 203.86688232421875,
+ 200.01004028320312,
+ 204.2325439453125,
+ 211.52891540527344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5213015507906675e-05,
+ 3.635779648902826e-05,
+ 3.70470697816927e-05,
+ 3.6254354199627414e-05,
+ 3.324731005704962e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014951277989894152,
+ 0.0014758999459445477,
+ 0.0014606777112931013,
+ 0.0014066072180867195,
+ 0.0012636061292141676
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.533203125,
+ "loss_eval": 1.2718024253845215,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 211.8421630859375,
+ 209.4982147216797,
+ 206.025634765625,
+ 210.11019897460938,
+ 216.48568725585938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.425328395678662e-05,
+ 3.4357526601525024e-05,
+ 3.5312823456479236e-05,
+ 3.490734161459841e-05,
+ 3.1354313250631094e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015326166758313775,
+ 0.0015238082269206643,
+ 0.0015112065011635423,
+ 0.0014346316456794739,
+ 0.0012716582277789712
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5595703125,
+ "loss_eval": 1.2611415386199951,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 220.0836639404297,
+ 218.3101806640625,
+ 212.22019958496094,
+ 216.97576904296875,
+ 224.16114807128906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.320865289424546e-05,
+ 3.393836959730834e-05,
+ 3.4554454032331705e-05,
+ 3.380324415047653e-05,
+ 3.0850649636704475e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015296684578061104,
+ 0.0015227487310767174,
+ 0.0015054721152409911,
+ 0.0014223494799807668,
+ 0.0012559365713968873
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5615234375,
+ "loss_eval": 1.2511423826217651,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 223.3075714111328,
+ 219.4958953857422,
+ 213.75701904296875,
+ 219.41580200195312,
+ 223.92572021484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.406661926419474e-05,
+ 3.485638080746867e-05,
+ 3.5736342397285625e-05,
+ 3.5617544199340045e-05,
+ 3.142367859254591e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001539028249680996,
+ 0.0015256714541465044,
+ 0.0015207449905574322,
+ 0.001449243980459869,
+ 0.0012804584112018347
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5478515625,
+ "loss_eval": 1.2619048357009888,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 229.43417358398438,
+ 224.83290100097656,
+ 218.015869140625,
+ 221.56915283203125,
+ 228.59274291992188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.325551369925961e-05,
+ 3.411810757825151e-05,
+ 3.506721623125486e-05,
+ 3.451627344475128e-05,
+ 3.0976541893323883e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001564670237712562,
+ 0.0015591747360303998,
+ 0.0015565806534141302,
+ 0.001464744214899838,
+ 0.0012746548745781183
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5498046875,
+ "loss_eval": 1.2594949007034302,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 233.65724182128906,
+ 228.65892028808594,
+ 223.14169311523438,
+ 227.2765350341797,
+ 233.75588989257812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4493146813474596e-05,
+ 3.510132592055015e-05,
+ 3.669387297122739e-05,
+ 3.577200186555274e-05,
+ 3.192189251421951e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015125939389690757,
+ 0.0015123466728255153,
+ 0.0015171029372140765,
+ 0.0014489478198811412,
+ 0.001258584321476519
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5595703125,
+ "loss_eval": 1.2556639909744263,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 237.43548583984375,
+ 232.39987182617188,
+ 227.10951232910156,
+ 230.72291564941406,
+ 237.13616943359375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.340727198519744e-05,
+ 3.450348594924435e-05,
+ 3.5213739465689287e-05,
+ 3.445050970185548e-05,
+ 3.137766179861501e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015336342621594667,
+ 0.0015343877021223307,
+ 0.0015299322549253702,
+ 0.0014644783223047853,
+ 0.0012699750950559974
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.560546875,
+ "loss_eval": 1.2415752410888672,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 240.3662109375,
+ 235.49240112304688,
+ 227.54061889648438,
+ 233.16600036621094,
+ 239.60838317871094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.387282777111977e-05,
+ 3.518611265462823e-05,
+ 3.594699956011027e-05,
+ 3.514933632686734e-05,
+ 3.159138941555284e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015161214396357536,
+ 0.0015244479291141033,
+ 0.0015337818767875433,
+ 0.0014538948889821768,
+ 0.0012562318006530404
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.560546875,
+ "loss_eval": 1.2436577081680298,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 246.6840057373047,
+ 239.0929412841797,
+ 228.7230682373047,
+ 233.1182403564453,
+ 237.92440795898438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.365568773006089e-05,
+ 3.4782005968736485e-05,
+ 3.604988887673244e-05,
+ 3.48928188032005e-05,
+ 3.140935586998239e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015826384769752622,
+ 0.0015907500637695193,
+ 0.0016004826175048947,
+ 0.0015078946016728878,
+ 0.0012762312544509768
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.578125,
+ "loss_eval": 1.2292213439941406,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 248.95265197753906,
+ 241.59408569335938,
+ 233.2073211669922,
+ 236.39898681640625,
+ 243.02566528320312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3556283597135916e-05,
+ 3.463738539721817e-05,
+ 3.5712662793230265e-05,
+ 3.4992117434740067e-05,
+ 3.1405961635755375e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015417077811434865,
+ 0.0015624086372554302,
+ 0.00158181122969836,
+ 0.0014982762513682246,
+ 0.001269534695893526
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5712890625,
+ "loss_eval": 1.201985239982605,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 250.6766815185547,
+ 243.67706298828125,
+ 236.90567016601562,
+ 240.1038360595703,
+ 244.89207458496094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3543499739607796e-05,
+ 3.4865890484070405e-05,
+ 3.564134021871723e-05,
+ 3.4787921322276816e-05,
+ 3.112335252808407e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015237597981467843,
+ 0.0015382410492748022,
+ 0.0015483599854633212,
+ 0.0014793339651077986,
+ 0.0012637422187253833
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.55859375,
+ "loss_eval": 1.2245514392852783,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 256.1240539550781,
+ 248.83609008789062,
+ 240.2549285888672,
+ 243.1914825439453,
+ 248.11964416503906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.322990596643649e-05,
+ 3.523347186273895e-05,
+ 3.6828067095484585e-05,
+ 3.5215769457863644e-05,
+ 3.133456266368739e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015543467598035932,
+ 0.0015818241517990828,
+ 0.0015992531552910805,
+ 0.001527936663478613,
+ 0.0012819069670513272
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5732421875,
+ "loss_eval": 1.2261133193969727,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 256.9990234375,
+ 248.78497314453125,
+ 239.55239868164062,
+ 243.13818359375,
+ 249.48153686523438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.39320904458873e-05,
+ 3.600086711230688e-05,
+ 3.7119287298992276e-05,
+ 3.6292254662839696e-05,
+ 3.193991506122984e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015332578914240003,
+ 0.00156042305752635,
+ 0.001574728754349053,
+ 0.0015015782555565238,
+ 0.0012670031283050776
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5771484375,
+ "loss_eval": 1.2080682516098022,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 260.4493103027344,
+ 251.83595275878906,
+ 240.95025634765625,
+ 242.58055114746094,
+ 247.42816162109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4877586585935205e-05,
+ 3.68267938029021e-05,
+ 3.760240360861644e-05,
+ 3.5770553949987516e-05,
+ 3.202233710908331e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016203002305701375,
+ 0.0016500651836395264,
+ 0.0016584799159318209,
+ 0.0015617734752595425,
+ 0.00129653827752918
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5576171875,
+ "loss_eval": 1.2154628038406372,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 263.1241760253906,
+ 253.4596405029297,
+ 243.6095733642578,
+ 245.4304656982422,
+ 250.32362365722656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.480416853562929e-05,
+ 3.640647264546715e-05,
+ 3.738802479347214e-05,
+ 3.5808730899589136e-05,
+ 3.25721557601355e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015986696816980839,
+ 0.0016261462587863207,
+ 0.0016554947942495346,
+ 0.0015633245930075645,
+ 0.0013003128115087748
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5634765625,
+ "loss_eval": 1.2160842418670654,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 266.5273132324219,
+ 256.0182189941406,
+ 245.50253295898438,
+ 246.18280029296875,
+ 251.716064453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.359848051331937e-05,
+ 3.572113564587198e-05,
+ 3.695064515341073e-05,
+ 3.506165376165882e-05,
+ 3.114769424428232e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016088238917291164,
+ 0.0016375494888052344,
+ 0.0016567507991567254,
+ 0.0015764845302328467,
+ 0.001285399659536779
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58203125,
+ "loss_eval": 1.2021496295928955,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 267.4769592285156,
+ 258.21368408203125,
+ 248.0418701171875,
+ 248.66949462890625,
+ 253.77452087402344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.400501736905426e-05,
+ 3.611011925386265e-05,
+ 3.7168374547036365e-05,
+ 3.569516775314696e-05,
+ 3.031879896298051e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015880028950050473,
+ 0.0016197538934648037,
+ 0.001652923645451665,
+ 0.0015723761171102524,
+ 0.00128253607545048
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5771484375,
+ "loss_eval": 1.2029783725738525,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 268.6047668457031,
+ 256.4200744628906,
+ 246.27796936035156,
+ 246.51229858398438,
+ 250.08482360839844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.425245813559741e-05,
+ 3.6405861465027556e-05,
+ 3.752295742742717e-05,
+ 3.6318160709924996e-05,
+ 3.103434937656857e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017358324257656932,
+ 0.0017647893400862813,
+ 0.0017767423996701837,
+ 0.0016745994798839092,
+ 0.0013456137385219336
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.2118260860443115,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 270.9348449707031,
+ 260.40045166015625,
+ 250.72512817382812,
+ 251.9379425048828,
+ 254.6614227294922
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.491883762762882e-05,
+ 3.647417179308832e-05,
+ 3.8068057619966567e-05,
+ 3.653564635897055e-05,
+ 3.172537253703922e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015994011191651225,
+ 0.0016339519061148167,
+ 0.0016624036943539977,
+ 0.0015806201845407486,
+ 0.0013034256407991052
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5849609375,
+ "loss_eval": 1.1830923557281494,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 274.6016845703125,
+ 262.9326477050781,
+ 250.766357421875,
+ 252.1786346435547,
+ 254.2251739501953
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4794014936778694e-05,
+ 3.6746245314134285e-05,
+ 3.771794217755087e-05,
+ 3.6664638173533604e-05,
+ 3.1814517569728196e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016584239201620221,
+ 0.0016917918110266328,
+ 0.001726189162582159,
+ 0.0016276866663247347,
+ 0.0013194811763241887
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.578125,
+ "loss_eval": 1.1851024627685547,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 273.59783935546875,
+ 261.92218017578125,
+ 250.27320861816406,
+ 251.19146728515625,
+ 255.70233154296875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.505383210722357e-05,
+ 3.6710382119053975e-05,
+ 3.839766577584669e-05,
+ 3.708387885126285e-05,
+ 3.1251351174432784e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016781548038125038,
+ 0.0017169808270409703,
+ 0.0017399545758962631,
+ 0.0016386040952056646,
+ 0.0013246783055365086
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5712890625,
+ "loss_eval": 1.1789460182189941,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 274.9112854003906,
+ 262.3539123535156,
+ 251.67474365234375,
+ 253.08824157714844,
+ 255.4647979736328
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4545508242445067e-05,
+ 3.622366421041079e-05,
+ 3.7300182157196105e-05,
+ 3.594972440623678e-05,
+ 3.1557658076053485e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001666227588430047,
+ 0.0016955926548689604,
+ 0.0017251977697014809,
+ 0.0016294753877446055,
+ 0.001327820005826652
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.583984375,
+ "loss_eval": 1.1757192611694336,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 273.9092712402344,
+ 261.26507568359375,
+ 250.60923767089844,
+ 250.5943145751953,
+ 253.19862365722656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.532320988597348e-05,
+ 3.7557252653641626e-05,
+ 3.882365126628429e-05,
+ 3.676790583995171e-05,
+ 3.2376574381487444e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001686039031483233,
+ 0.0017200085567310452,
+ 0.0017563666915521026,
+ 0.0016565105179324746,
+ 0.0013397492002695799
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5986328125,
+ "loss_eval": 1.1719229221343994,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 275.9344177246094,
+ 265.1002502441406,
+ 253.2598114013672,
+ 253.86024475097656,
+ 257.8154296875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.419027416384779e-05,
+ 3.54782423528377e-05,
+ 3.770734474528581e-05,
+ 3.707608630065806e-05,
+ 3.1706651498097926e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016564616234973073,
+ 0.001694328966550529,
+ 0.001729298266582191,
+ 0.0016409243689849973,
+ 0.0013242866843938828
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.59375,
+ "loss_eval": 1.169456958770752,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 277.0843200683594,
+ 263.2900390625,
+ 250.48553466796875,
+ 251.51341247558594,
+ 253.14413452148438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5850312997354195e-05,
+ 3.7839381548110396e-05,
+ 3.925598502974026e-05,
+ 3.7184508983045816e-05,
+ 3.174091762048192e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017717990558594465,
+ 0.0018099851440638304,
+ 0.0018417692044749856,
+ 0.0017209915677085519,
+ 0.0013732420047745109
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5869140625,
+ "loss_eval": 1.1764099597930908,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 280.2084655761719,
+ 265.3043518066406,
+ 254.26673889160156,
+ 253.3932342529297,
+ 255.91488647460938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4716471418505535e-05,
+ 3.675218249554746e-05,
+ 3.84828781534452e-05,
+ 3.653839303296991e-05,
+ 3.1539821065962315e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00171388138551265,
+ 0.0017648075008764863,
+ 0.00180675252340734,
+ 0.0016973463352769613,
+ 0.0013539392966777086
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.1670037508010864,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 278.0702209472656,
+ 264.4510498046875,
+ 250.75350952148438,
+ 248.73284912109375,
+ 253.1072540283203
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.694290717248805e-05,
+ 3.843691956717521e-05,
+ 3.982238922617398e-05,
+ 3.8299614971037954e-05,
+ 3.253731847507879e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017997974064201117,
+ 0.0018521619495004416,
+ 0.0018853276269510388,
+ 0.001754313474521041,
+ 0.0013789198128506541
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.576171875,
+ "loss_eval": 1.168372631072998,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 279.5745849609375,
+ 265.3549499511719,
+ 252.89109802246094,
+ 250.0029296875,
+ 251.57737731933594
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5274497349746525e-05,
+ 3.741122054634616e-05,
+ 3.8946731365285814e-05,
+ 3.7627731217071414e-05,
+ 3.1920495530357584e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017959685064852238,
+ 0.0018515808042138815,
+ 0.001886399113573134,
+ 0.0017732164124026895,
+ 0.001389715587720275
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5966796875,
+ "loss_eval": 1.1735193729400635,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 280.56402587890625,
+ 265.1068115234375,
+ 251.912353515625,
+ 248.08627319335938,
+ 250.21177673339844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.672741513582878e-05,
+ 3.8823065551696345e-05,
+ 4.041267675347626e-05,
+ 3.835778989014216e-05,
+ 3.2424144592368975e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018404219299554825,
+ 0.0018969813827425241,
+ 0.0019448500825092196,
+ 0.0018052044324576855,
+ 0.0014045372372493148
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5966796875,
+ "loss_eval": 1.163725733757019,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 281.2812194824219,
+ 266.5726623535156,
+ 253.18124389648438,
+ 252.3292694091797,
+ 254.1314697265625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.6245146475266665e-05,
+ 3.849809218081646e-05,
+ 4.034954326925799e-05,
+ 3.857027695630677e-05,
+ 3.267046849941835e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018043599557131529,
+ 0.0018654613522812724,
+ 0.0018976799910888076,
+ 0.0017763315699994564,
+ 0.0013986497651785612
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5830078125,
+ "loss_eval": 1.172363519668579,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 278.3638916015625,
+ 264.4734802246094,
+ 250.60198974609375,
+ 248.59568786621094,
+ 249.39353942871094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.7236037314869463e-05,
+ 3.946686410927214e-05,
+ 4.103714309167117e-05,
+ 3.970286707044579e-05,
+ 3.281752287875861e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018646781099960208,
+ 0.0019272645004093647,
+ 0.0019672266207635403,
+ 0.001839098404161632,
+ 0.0014395405305549502
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5830078125,
+ "loss_eval": 1.1776624917984009,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 280.8514099121094,
+ 269.1718444824219,
+ 253.03790283203125,
+ 251.60220336914062,
+ 251.88168334960938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.689880759338848e-05,
+ 3.937961082556285e-05,
+ 4.092283779755235e-05,
+ 3.866894985549152e-05,
+ 3.262344398535788e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018725661793723702,
+ 0.0019201217219233513,
+ 0.0019532060250639915,
+ 0.0018317755311727524,
+ 0.001439971849322319
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.595703125,
+ "loss_eval": 1.1693906784057617,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 280.3335266113281,
+ 263.89471435546875,
+ 253.01638793945312,
+ 250.5576171875,
+ 251.4005889892578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.6666475352831185e-05,
+ 3.875952461385168e-05,
+ 4.0531358536100015e-05,
+ 3.9068203477654606e-05,
+ 3.450641088420525e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018578553572297096,
+ 0.0019184533739462495,
+ 0.001965942559763789,
+ 0.0018550093518570065,
+ 0.0014542803401127458
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5732421875,
+ "loss_eval": 1.1839377880096436,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 280.3553771972656,
+ 263.3617248535156,
+ 248.94859313964844,
+ 246.9832000732422,
+ 246.24644470214844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.8412734284065664e-05,
+ 4.001844354206696e-05,
+ 4.220755727146752e-05,
+ 4.0393635572399944e-05,
+ 3.391467180335894e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001917686895467341,
+ 0.0019766101613640785,
+ 0.0020170181524008512,
+ 0.0018900329014286399,
+ 0.001476101577281952
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6005859375,
+ "loss_eval": 1.1689397096633911,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 278.8861389160156,
+ 263.3866882324219,
+ 249.24301147460938,
+ 246.43963623046875,
+ 246.34503173828125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.77853139070794e-05,
+ 4.044857996632345e-05,
+ 4.182702468824573e-05,
+ 4.050548523082398e-05,
+ 3.3606509532546625e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019284948939457536,
+ 0.001992136472836137,
+ 0.0020461773965507746,
+ 0.001900508883409202,
+ 0.001466717105358839
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.1585946083068848,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 279.963623046875,
+ 263.52496337890625,
+ 249.6890869140625,
+ 245.60646057128906,
+ 245.52540588378906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.724947964656167e-05,
+ 3.964625648222864e-05,
+ 4.1545175918145105e-05,
+ 3.953047780669294e-05,
+ 3.275729977758601e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019616533536463976,
+ 0.002027863636612892,
+ 0.0020759752951562405,
+ 0.0019283785950392485,
+ 0.001484199776314199
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.157920002937317,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 279.7983093261719,
+ 263.42352294921875,
+ 247.6257781982422,
+ 244.5139923095703,
+ 242.93429565429688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.738125451491214e-05,
+ 4.007351162726991e-05,
+ 4.2600284359650686e-05,
+ 4.0704209823161364e-05,
+ 3.302833283669315e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001973477192223072,
+ 0.002032764023169875,
+ 0.0020790304988622665,
+ 0.0019371822709217668,
+ 0.0014914683997631073
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6005859375,
+ "loss_eval": 1.1545627117156982,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 278.16461181640625,
+ 259.95208740234375,
+ 246.212890625,
+ 243.02810668945312,
+ 242.42227172851562
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.896220732713118e-05,
+ 4.0713552152737975e-05,
+ 4.242185241309926e-05,
+ 4.1096616769209504e-05,
+ 3.4584638342494145e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0020273446571081877,
+ 0.0020888603758066893,
+ 0.0021337512880563736,
+ 0.0019914479926228523,
+ 0.0015125740319490433
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.1588966846466064,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 278.74609375,
+ 259.810302734375,
+ 244.75640869140625,
+ 241.40191650390625,
+ 241.2429962158203
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.005424489150755e-05,
+ 4.289989738026634e-05,
+ 4.383309351396747e-05,
+ 4.207885649520904e-05,
+ 3.527112494339235e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002059010788798332,
+ 0.002119551645591855,
+ 0.002172222128137946,
+ 0.0020189452916383743,
+ 0.0015335450880229473
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1555505990982056,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 277.6565246582031,
+ 262.0436096191406,
+ 246.2357635498047,
+ 241.67991638183594,
+ 240.23500061035156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.1031005821423605e-05,
+ 4.313238605391234e-05,
+ 4.465782694751397e-05,
+ 4.2896612285403535e-05,
+ 3.4334370866417885e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002025892725214362,
+ 0.0020990471821278334,
+ 0.0021509609650820494,
+ 0.002011507283896208,
+ 0.0015318752266466618
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1416809558868408,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 277.4100646972656,
+ 260.2519836425781,
+ 245.48947143554688,
+ 242.5662384033203,
+ 241.2648162841797
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.732202821993269e-05,
+ 3.9125570765463635e-05,
+ 4.136607458349317e-05,
+ 3.977569213020615e-05,
+ 3.3676675229799e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002009452786296606,
+ 0.002076543401926756,
+ 0.002131648361682892,
+ 0.00199576816521585,
+ 0.0015338497469201684
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.143639087677002,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 277.3269348144531,
+ 259.49072265625,
+ 243.7945098876953,
+ 240.342041015625,
+ 238.76239013671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.978172389906831e-05,
+ 4.20100441260729e-05,
+ 4.455841553863138e-05,
+ 4.2333795136073604e-05,
+ 3.435015969444066e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0020786102395504713,
+ 0.0021364488638937473,
+ 0.0021890606731176376,
+ 0.0020492339972406626,
+ 0.0015625122468918562
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1515132188796997,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 276.1414489746094,
+ 257.6651306152344,
+ 242.12867736816406,
+ 238.3046875,
+ 235.9711151123047
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.158447700319812e-05,
+ 4.40051153418608e-05,
+ 4.566523784887977e-05,
+ 4.3018761061830446e-05,
+ 3.456107515376061e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021895321551710367,
+ 0.0022726275492459536,
+ 0.00232017133384943,
+ 0.002137792995199561,
+ 0.0015979791060090065
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.148828148841858,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 276.29547119140625,
+ 257.9006652832031,
+ 242.25363159179688,
+ 237.8865966796875,
+ 235.57620239257812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.9041460695443675e-05,
+ 4.0436327253701165e-05,
+ 4.2260016925865784e-05,
+ 4.071593502885662e-05,
+ 3.461613232502714e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021726686973124743,
+ 0.002256714040413499,
+ 0.0023172625806182623,
+ 0.0021478317212313414,
+ 0.0016112272860482335
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6015625,
+ "loss_eval": 1.165194034576416,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 274.73480224609375,
+ 257.3844909667969,
+ 239.9276580810547,
+ 236.4628448486328,
+ 232.49490356445312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.182914926786907e-05,
+ 4.482160511543043e-05,
+ 4.732825618702918e-05,
+ 4.5475029764929786e-05,
+ 3.673886021715589e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002222857205197215,
+ 0.0022976247128099203,
+ 0.002366685541346669,
+ 0.002194431144744158,
+ 0.0016426561633124948
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6015625,
+ "loss_eval": 1.150635004043579,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 273.9837341308594,
+ 255.2301025390625,
+ 239.6470184326172,
+ 235.07806396484375,
+ 232.15016174316406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.28417552029714e-05,
+ 4.5315191528061405e-05,
+ 4.770928717334755e-05,
+ 4.653819996747188e-05,
+ 3.727963485289365e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002205377910286188,
+ 0.00228099524974823,
+ 0.002334901597350836,
+ 0.0021908036433160305,
+ 0.001635397202335298
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6064453125,
+ "loss_eval": 1.150489330291748,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 273.4665222167969,
+ 255.21783447265625,
+ 238.12306213378906,
+ 232.99537658691406,
+ 229.35629272460938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.174295099801384e-05,
+ 4.412833004607819e-05,
+ 4.589854142977856e-05,
+ 4.366271969047375e-05,
+ 3.4910473914351314e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0022425123024731874,
+ 0.002337042009457946,
+ 0.0024111224338412285,
+ 0.002237174427136779,
+ 0.0016597777139395475
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1445674896240234,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 272.8526306152344,
+ 254.31373596191406,
+ 238.0008087158203,
+ 233.6641082763672,
+ 229.88113403320312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.274978709872812e-05,
+ 4.589447416947223e-05,
+ 4.8100573621923104e-05,
+ 4.519677167991176e-05,
+ 3.628300692071207e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0022435274440795183,
+ 0.0023362115025520325,
+ 0.0024012199137359858,
+ 0.00223422609269619,
+ 0.0016617706278339028
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1417796611785889,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 272.5745849609375,
+ 253.39877319335938,
+ 236.8953094482422,
+ 231.5461883544922,
+ 227.8491668701172
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.257826367393136e-05,
+ 4.485245153773576e-05,
+ 4.667421308113262e-05,
+ 4.5228414819575846e-05,
+ 3.560770346666686e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0022986247204244137,
+ 0.002396916039288044,
+ 0.0024696297477930784,
+ 0.0022973858285695314,
+ 0.0016907128738239408
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1428865194320679,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 269.6819763183594,
+ 250.9730682373047,
+ 234.21188354492188,
+ 228.83775329589844,
+ 224.82958984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.29281426477246e-05,
+ 4.5681605115532875e-05,
+ 4.7611269110348076e-05,
+ 4.553339022095315e-05,
+ 3.683664544951171e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023400019854307175,
+ 0.002444769022986293,
+ 0.0025141045916825533,
+ 0.002344615990296006,
+ 0.0017126062884926796
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.625,
+ "loss_eval": 1.1239444017410278,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 269.7929992675781,
+ 250.5220947265625,
+ 233.3997802734375,
+ 228.2130584716797,
+ 224.5063018798828
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4715372496284544e-05,
+ 4.6482971811201423e-05,
+ 4.9765483709052205e-05,
+ 4.759176226798445e-05,
+ 3.8208585465326905e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023639060091227293,
+ 0.002476333873346448,
+ 0.0025423571933060884,
+ 0.00236364989541471,
+ 0.0017294714925810695
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1502506732940674,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 269.24493408203125,
+ 251.6195831298828,
+ 234.21717834472656,
+ 228.9242401123047,
+ 224.33628845214844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4276617700234056e-05,
+ 4.620026084012352e-05,
+ 4.972432361682877e-05,
+ 4.657481986214407e-05,
+ 3.729217132786289e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023896305356174707,
+ 0.002498477231711149,
+ 0.0025652945041656494,
+ 0.002390124835073948,
+ 0.0017562232678756118
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.146531581878662,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 268.0794982910156,
+ 250.7041778564453,
+ 233.16966247558594,
+ 227.9508056640625,
+ 223.48045349121094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.518003697739914e-05,
+ 4.807085497304797e-05,
+ 5.077984678791836e-05,
+ 4.9026388296624646e-05,
+ 3.8487425626954064e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023859951179474592,
+ 0.002494273241609335,
+ 0.0025624327827244997,
+ 0.0023940331302583218,
+ 0.0017616016557440162
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1454447507858276,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 267.8343811035156,
+ 247.6757049560547,
+ 231.40367126464844,
+ 225.93670654296875,
+ 220.4804229736328
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.405072468216531e-05,
+ 4.688911576522514e-05,
+ 4.961229205946438e-05,
+ 4.743603858514689e-05,
+ 3.724359339685179e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002465154742822051,
+ 0.0025785581674426794,
+ 0.002648484194651246,
+ 0.0024633395951241255,
+ 0.0017954027280211449
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.165484070777893,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 267.8901062011719,
+ 248.67857360839844,
+ 231.63746643066406,
+ 225.49383544921875,
+ 220.6399383544922
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.755932604894042e-05,
+ 4.9960097385337576e-05,
+ 5.191187665332109e-05,
+ 4.949339563609101e-05,
+ 3.946756987716071e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0024303828831762075,
+ 0.0025356977712363005,
+ 0.002610789379104972,
+ 0.00243638688698411,
+ 0.0017875435296446085
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1472151279449463,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 267.3486022949219,
+ 247.69305419921875,
+ 229.9873504638672,
+ 223.6610870361328,
+ 218.91578674316406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.743155659525655e-05,
+ 5.06583419337403e-05,
+ 5.422766844276339e-05,
+ 5.0596820074133575e-05,
+ 3.959470632253215e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025001303292810917,
+ 0.0026160534471273422,
+ 0.002682509133592248,
+ 0.002501503797248006,
+ 0.0018251334549859166
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.157745599746704,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 266.2055969238281,
+ 246.88201904296875,
+ 229.0934295654297,
+ 223.09255981445312,
+ 217.90614318847656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.6090037358226255e-05,
+ 4.8821068048710003e-05,
+ 5.145218892721459e-05,
+ 4.892798824585043e-05,
+ 3.874724279739894e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002517222659662366,
+ 0.00262960116378963,
+ 0.002704967511817813,
+ 0.002524228999391198,
+ 0.0018283555982634425
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1513168811798096,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 263.8387451171875,
+ 244.32431030273438,
+ 227.78903198242188,
+ 222.13900756835938,
+ 216.27389526367188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.680602069129236e-05,
+ 5.040669202571735e-05,
+ 5.318928378983401e-05,
+ 4.9446778575656936e-05,
+ 3.913935870514251e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025120435748249292,
+ 0.0026304670609533787,
+ 0.0027123456820845604,
+ 0.002537800231948495,
+ 0.001847997889854014
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6240234375,
+ "loss_eval": 1.1497204303741455,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 263.52716064453125,
+ 243.21226501464844,
+ 226.427001953125,
+ 220.67845153808594,
+ 214.70176696777344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.6976576413726434e-05,
+ 5.0085352995665744e-05,
+ 5.2343326387926936e-05,
+ 4.9784572183853015e-05,
+ 4.0186921978602186e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026124012656509876,
+ 0.0027241536881774664,
+ 0.002797869499772787,
+ 0.002603790955618024,
+ 0.0018792233895510435
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.153285026550293,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 264.0121765136719,
+ 243.2773895263672,
+ 226.7365264892578,
+ 220.29107666015625,
+ 214.1591339111328
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.6254041080828756e-05,
+ 4.949727008352056e-05,
+ 5.206605055718683e-05,
+ 5.012763722334057e-05,
+ 3.8815273001091555e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026143237482756376,
+ 0.0027275518514215946,
+ 0.0028062777128070593,
+ 0.002607470378279686,
+ 0.0018867084290832281
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1514866352081299,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 263.4013671875,
+ 243.0095672607422,
+ 225.4296112060547,
+ 219.55067443847656,
+ 213.40794372558594
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8506815801374614e-05,
+ 5.151949153514579e-05,
+ 5.5085791245801374e-05,
+ 5.175785190658644e-05,
+ 4.0316641388926655e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002606831956654787,
+ 0.002728143008425832,
+ 0.0028109808918088675,
+ 0.0026184367015957832,
+ 0.0018970600795000792
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1346663236618042,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 262.27703857421875,
+ 242.7241668701172,
+ 224.5229949951172,
+ 218.4025115966797,
+ 212.19247436523438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.704251477960497e-05,
+ 5.0965834816452116e-05,
+ 5.3327348723541945e-05,
+ 5.0449500122340396e-05,
+ 4.0479797462467104e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026277368888258934,
+ 0.0027542279567569494,
+ 0.00283243996091187,
+ 0.00264621595852077,
+ 0.0019058829639106989
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6240234375,
+ "loss_eval": 1.137591004371643,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 262.1747131347656,
+ 241.88607788085938,
+ 224.1046142578125,
+ 217.9982147216797,
+ 211.7519989013672
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.847371383220889e-05,
+ 5.121564754517749e-05,
+ 5.3943567763781175e-05,
+ 5.087414683657698e-05,
+ 4.037184771732427e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026811074931174517,
+ 0.002809705911204219,
+ 0.002887698821723461,
+ 0.002692745067179203,
+ 0.0019356919219717383
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1538643836975098,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 261.7838439941406,
+ 239.75706481933594,
+ 222.1133575439453,
+ 216.12124633789062,
+ 210.44593811035156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8369467549491674e-05,
+ 5.07068180013448e-05,
+ 5.281560879666358e-05,
+ 5.086012970423326e-05,
+ 4.062180232722312e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027064597234129906,
+ 0.0028339733835309744,
+ 0.0029109998140484095,
+ 0.002717787167057395,
+ 0.0019469966646283865
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1476709842681885,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 260.708251953125,
+ 239.65792846679688,
+ 222.502197265625,
+ 216.31419372558594,
+ 210.15716552734375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.919906132272445e-05,
+ 5.164166941540316e-05,
+ 5.366719051380642e-05,
+ 5.108323966851458e-05,
+ 4.000464832643047e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002715736860409379,
+ 0.0028464714996516705,
+ 0.0029330456163734198,
+ 0.0027443754952400923,
+ 0.001961463363841176
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.1511735916137695,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 260.4088439941406,
+ 239.9808349609375,
+ 222.2389373779297,
+ 215.33692932128906,
+ 208.58534240722656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8405916459159926e-05,
+ 5.163977766642347e-05,
+ 5.34093014721293e-05,
+ 5.167788185644895e-05,
+ 4.020798587589525e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027501434087753296,
+ 0.0028795108664780855,
+ 0.0029617082327604294,
+ 0.002769613405689597,
+ 0.001984042814001441
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1523363590240479,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 259.8567199707031,
+ 238.8525848388672,
+ 221.2687225341797,
+ 213.9132537841797,
+ 207.3290557861328
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8219208110822365e-05,
+ 5.1672555855475366e-05,
+ 5.364803655538708e-05,
+ 5.1243885536678135e-05,
+ 4.079756035935134e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028046013321727514,
+ 0.002939376747235656,
+ 0.0030214993748813868,
+ 0.002813557395711541,
+ 0.0019953204318881035
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1514203548431396,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 259.52423095703125,
+ 238.27757263183594,
+ 219.9165802001953,
+ 213.4214324951172,
+ 206.20606994628906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8479021643288434e-05,
+ 5.219021113589406e-05,
+ 5.5094871640903875e-05,
+ 5.1899030950153247e-05,
+ 4.124108454561792e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028202880639582872,
+ 0.002952422248199582,
+ 0.0030410154722630978,
+ 0.002832787809893489,
+ 0.0020088190212845802
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.625,
+ "loss_eval": 1.1545820236206055,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 258.1958923339844,
+ 237.08778381347656,
+ 219.2870635986328,
+ 212.87725830078125,
+ 205.84408569335938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.005837374483235e-05,
+ 5.344217424863018e-05,
+ 5.582463927567005e-05,
+ 5.345495083020069e-05,
+ 4.113194518140517e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028330644126981497,
+ 0.002965509658679366,
+ 0.0030466399621218443,
+ 0.00284536718390882,
+ 0.0020232615061104298
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6220703125,
+ "loss_eval": 1.1552448272705078,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 258.44268798828125,
+ 236.90562438964844,
+ 218.65948486328125,
+ 212.63186645507812,
+ 204.90692138671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.896440077573061e-05,
+ 5.1820486987708136e-05,
+ 5.4638629080727696e-05,
+ 5.3578904044115916e-05,
+ 4.117973367101513e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002839416265487671,
+ 0.0029778846073895693,
+ 0.003062452422454953,
+ 0.002849552081897855,
+ 0.0020236214622855186
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1515182256698608,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 258.24615478515625,
+ 236.87181091308594,
+ 219.06484985351562,
+ 213.2528076171875,
+ 205.03671264648438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8622885515214875e-05,
+ 5.181535379961133e-05,
+ 5.509376205736771e-05,
+ 5.2298331866040826e-05,
+ 4.074195385328494e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002838765038177371,
+ 0.00297414674423635,
+ 0.003058358561247587,
+ 0.0028491863049566746,
+ 0.0020313323475420475
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1609394550323486,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 257.9989929199219,
+ 236.4859161376953,
+ 218.73072814941406,
+ 212.0786895751953,
+ 204.2919464111328
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0208276661578566e-05,
+ 5.2276191127020866e-05,
+ 5.509322727448307e-05,
+ 5.315374437486753e-05,
+ 4.122377504245378e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028634185437113047,
+ 0.0029970910400152206,
+ 0.0030890253838151693,
+ 0.002881886437535286,
+ 0.0020408176351338625
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.1592046022415161,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 257.24053955078125,
+ 235.7548065185547,
+ 217.84329223632812,
+ 211.033935546875,
+ 203.8216094970703
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0660164561122656e-05,
+ 5.414208135334775e-05,
+ 5.5454143875977024e-05,
+ 5.3000938351033255e-05,
+ 4.292939411243424e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028948886319994926,
+ 0.003031315514817834,
+ 0.0031204961705952883,
+ 0.002907233312726021,
+ 0.0020496752113103867
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.619140625,
+ "loss_eval": 1.1583250761032104,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 256.78289794921875,
+ 235.2476348876953,
+ 217.21603393554688,
+ 210.80035400390625,
+ 203.15478515625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9510348617332056e-05,
+ 5.1982155127916485e-05,
+ 5.440499808173627e-05,
+ 5.1704166253330186e-05,
+ 4.0308059396920726e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028964560478925705,
+ 0.0030334230978041887,
+ 0.0031210912857204676,
+ 0.002908239373937249,
+ 0.0020543786231428385
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.1597179174423218,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 256.531982421875,
+ 235.45941162109375,
+ 217.1429443359375,
+ 210.1690673828125,
+ 202.77899169921875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.943124076817185e-05,
+ 5.149367279955186e-05,
+ 5.385246913647279e-05,
+ 5.262702325126156e-05,
+ 4.104706385987811e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029305708594620228,
+ 0.0030687344260513783,
+ 0.003160761669278145,
+ 0.002940374892205,
+ 0.0020649591460824013
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6220703125,
+ "loss_eval": 1.161116600036621,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 256.3059387207031,
+ 235.24874877929688,
+ 217.37142944335938,
+ 210.53717041015625,
+ 203.14259338378906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.934536627843045e-05,
+ 5.2089759265072644e-05,
+ 5.424721530289389e-05,
+ 5.292960850056261e-05,
+ 4.041651845909655e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002913407515734434,
+ 0.0030489542987197638,
+ 0.003135726321488619,
+ 0.002922008978202939,
+ 0.002062067622318864
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.155902624130249,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 256.7462463378906,
+ 235.3153839111328,
+ 216.87977600097656,
+ 210.572509765625,
+ 202.77845764160156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.990033630747348e-05,
+ 5.337029870133847e-05,
+ 5.522817809833214e-05,
+ 5.3465773817151785e-05,
+ 4.164372876402922e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029192205984145403,
+ 0.0030557813588529825,
+ 0.003147577866911888,
+ 0.0029307191725820303,
+ 0.0020654413383454084
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.1561503410339355,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 256.68145751953125,
+ 234.77310180664062,
+ 216.7720947265625,
+ 209.664794921875,
+ 202.22833251953125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9965801736107096e-05,
+ 5.341583164408803e-05,
+ 5.593279274762608e-05,
+ 5.420796514954418e-05,
+ 4.210533734294586e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002943370258435607,
+ 0.00308181531727314,
+ 0.003169203409925103,
+ 0.002951863221824169,
+ 0.0020759364124387503
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1583542823791504,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 256.4252014160156,
+ 234.56448364257812,
+ 216.34176635742188,
+ 209.5242156982422,
+ 201.7559356689453
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9815931561170146e-05,
+ 5.2233976020943373e-05,
+ 5.5747830629115924e-05,
+ 5.41718618478626e-05,
+ 4.169955354882404e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029554881621152163,
+ 0.0030950764194130898,
+ 0.0031847492791712284,
+ 0.0029650654178112745,
+ 0.002081435639411211
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.619140625,
+ "loss_eval": 1.159005045890808,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 256.15167236328125,
+ 234.47537231445312,
+ 216.2799072265625,
+ 209.95578002929688,
+ 201.94126892089844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.007637446396984e-05,
+ 5.260824036668055e-05,
+ 5.540058555197902e-05,
+ 5.322153810993768e-05,
+ 4.1122035327134654e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002944375155493617,
+ 0.00308293872512877,
+ 0.003174267942085862,
+ 0.0029555640649050474,
+ 0.0020777545869350433
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1595215797424316,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 256.1369934082031,
+ 234.51614379882812,
+ 216.30044555664062,
+ 209.4623565673828,
+ 201.70799255371094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.048588718636893e-05,
+ 5.3128016588743776e-05,
+ 5.624579353025183e-05,
+ 5.411298116086982e-05,
+ 4.109516885364428e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029427227564156055,
+ 0.0030841128900647163,
+ 0.003178349928930402,
+ 0.0029583934228867292,
+ 0.002080487785860896
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1565905809402466,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 255.9738311767578,
+ 234.28948974609375,
+ 216.3280029296875,
+ 209.589111328125,
+ 201.76205444335938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.070818224339746e-05,
+ 5.330924614099786e-05,
+ 5.596653136308305e-05,
+ 5.407314529293217e-05,
+ 4.100686783203855e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029472638852894306,
+ 0.003088710131123662,
+ 0.0031828396022319794,
+ 0.0029631764627993107,
+ 0.0020829145796597004
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.619140625,
+ "loss_eval": 1.1584088802337646,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 255.89332580566406,
+ 234.19253540039062,
+ 216.33103942871094,
+ 209.45057678222656,
+ 201.54258728027344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.041498661739752e-05,
+ 5.279783727019094e-05,
+ 5.5226330005098134e-05,
+ 5.407658318290487e-05,
+ 4.1154507925966755e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002949801040813327,
+ 0.00309200631454587,
+ 0.0031869453378021717,
+ 0.0029658437706530094,
+ 0.002085147425532341
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.158942699432373,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 255.63841247558594,
+ 234.11630249023438,
+ 216.2378692626953,
+ 209.49703979492188,
+ 201.46917724609375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.020374737796374e-05,
+ 5.243354826234281e-05,
+ 5.587147097685374e-05,
+ 5.334949673851952e-05,
+ 4.121083111385815e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002950438065454364,
+ 0.003093136241659522,
+ 0.0031878354493528605,
+ 0.0029664800968021154,
+ 0.0020843464881181717
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.1582318544387817,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 255.8027801513672,
+ 234.07070922851562,
+ 216.1463623046875,
+ 209.4476318359375,
+ 201.27279663085938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0307549827266484e-05,
+ 5.278814569464885e-05,
+ 5.604944453807548e-05,
+ 5.306081584421918e-05,
+ 4.1182753193425015e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002952505135908723,
+ 0.003095670836046338,
+ 0.0031897351145744324,
+ 0.00296790711581707,
+ 0.002085329731926322
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.619140625,
+ "loss_eval": 1.15840482711792,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 255.60986328125,
+ 234.11065673828125,
+ 216.12860107421875,
+ 209.42921447753906,
+ 201.28346252441406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0218295655213296e-05,
+ 5.269264511298388e-05,
+ 5.5988577514654025e-05,
+ 5.322946162777953e-05,
+ 4.136392453801818e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002954497467726469,
+ 0.003097717184573412,
+ 0.0031918887980282307,
+ 0.002969518303871155,
+ 0.00208606431260705
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.1585593223571777,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 255.57244873046875,
+ 234.11569213867188,
+ 216.13626098632812,
+ 209.40383911132812,
+ 201.28627014160156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.005559796700254e-05,
+ 5.2759678510483354e-05,
+ 5.5868193157948554e-05,
+ 5.3356721764430404e-05,
+ 4.125368650420569e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029547216836363077,
+ 0.00309770368039608,
+ 0.003191797062754631,
+ 0.0029695071280002594,
+ 0.0020862380042672157
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.1585021018981934,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 255.5677947998047,
+ 234.11875915527344,
+ 216.1315460205078,
+ 209.4070281982422,
+ 201.2687530517578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.006368883186951e-05,
+ 5.279530887492001e-05,
+ 5.585233884630725e-05,
+ 5.334027810022235e-05,
+ 4.123226608498953e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002954971743747592,
+ 0.0030978918075561523,
+ 0.003191987983882427,
+ 0.002969692926853895,
+ 0.002086336025968194
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.1584858894348145,
+ "epoch": 100
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.690464973449707,
+ 8.719978332519531,
+ 8.73093318939209,
+ 8.75937271118164,
+ 8.790542602539062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009977436857298017,
+ 0.000992251792922616,
+ 0.0009848480112850666,
+ 0.0009761073160916567,
+ 0.0009735578205436468
+ ],
+ "bp_grad_norms_F": [
+ 0.035340383648872375,
+ 0.03499162197113037,
+ 0.03454425558447838,
+ 0.034113530069589615,
+ 0.033874060958623886
+ ],
+ "gamma_dfa": 0.006830460682976991,
+ "acc_eval": 0.095703125,
+ "loss_eval": 2.486203908920288,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 861.2440185546875,
+ 2373.370849609375,
+ 4675.99951171875,
+ 6090.40869140625,
+ 6962.984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.380779051236459e-06,
+ 1.3197138741816161e-06,
+ 1.3154849511920474e-06,
+ 1.3285966815601569e-06,
+ 1.3258621720524388e-06
+ ],
+ "bp_grad_norms_F": [
+ 0.0001391920231981203,
+ 6.988063250901178e-05,
+ 6.874280370539054e-05,
+ 6.720778765156865e-05,
+ 6.707101420033723e-05
+ ],
+ "gamma_dfa": 0.10659917898010463,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.9665180444717407,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 1679.144775390625,
+ 8850.173828125,
+ 31676.23046875,
+ 40712.2109375,
+ 45375.55859375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1123192962259054e-06,
+ 2.7329409135745664e-07,
+ 2.7436919936008053e-07,
+ 2.75225175982996e-07,
+ 2.744452558545163e-07
+ ],
+ "bp_grad_norms_F": [
+ 7.363831537077203e-05,
+ 2.2035641450202093e-05,
+ 1.9731569409486838e-05,
+ 1.9022963897441514e-05,
+ 1.7921549442689866e-05
+ ],
+ "gamma_dfa": 0.10788296448299661,
+ "acc_eval": 0.29296875,
+ "loss_eval": 1.972828984260559,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 2530.16015625,
+ 21436.486328125,
+ 88828.296875,
+ 114079.484375,
+ 124374.78125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.110604312605574e-07,
+ 1.1556701196013819e-07,
+ 1.1451407289087001e-07,
+ 1.1523399479074214e-07,
+ 1.1543902900257308e-07
+ ],
+ "bp_grad_norms_F": [
+ 0.00011594755778787658,
+ 1.8132053810404614e-05,
+ 1.1369732419552747e-05,
+ 8.215727575588971e-06,
+ 7.219489361887099e-06
+ ],
+ "gamma_dfa": 0.1084698709892109,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9430747032165527,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 3363.359375,
+ 41233.19921875,
+ 182355.03125,
+ 240225.46875,
+ 257539.390625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.176944111757621e-07,
+ 6.474806468759198e-08,
+ 6.307719502274267e-08,
+ 6.379124783961743e-08,
+ 6.374663996666641e-08
+ ],
+ "bp_grad_norms_F": [
+ 3.5978406231151894e-05,
+ 4.323610028222902e-06,
+ 3.5177260997443227e-06,
+ 3.4877305097325006e-06,
+ 3.479522774796351e-06
+ ],
+ "gamma_dfa": 0.10987455540453084,
+ "acc_eval": 0.3173828125,
+ "loss_eval": 1.959622859954834,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 4170.119140625,
+ 70935.8515625,
+ 335571.09375,
+ 441693.5625,
+ 469995.8125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.856212285631045e-07,
+ 4.0158354863706336e-08,
+ 3.8916198263905244e-08,
+ 3.9119736783277403e-08,
+ 3.916203894505088e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.611691706988495e-05,
+ 2.208936621173052e-06,
+ 1.6750394706832594e-06,
+ 1.6634863868603134e-06,
+ 1.659758027017233e-06
+ ],
+ "gamma_dfa": 0.1083616423420608,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.932759165763855,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 5013.92236328125,
+ 106898.6171875,
+ 530492.6875,
+ 719779.5,
+ 763058.3125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.242272950705228e-07,
+ 2.814423716301917e-08,
+ 2.683668043346188e-08,
+ 2.6872848835068908e-08,
+ 2.6873932412740942e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.2560918296221644e-05,
+ 1.2798993793694535e-06,
+ 1.0339434766137856e-06,
+ 1.0326252777304035e-06,
+ 1.030524344969308e-06
+ ],
+ "gamma_dfa": 0.11125951120629907,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9531997442245483,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 5811.36279296875,
+ 156264.234375,
+ 809496.6875,
+ 1104418.875,
+ 1163013.625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5694648659045924e-07,
+ 2.0201103012595922e-08,
+ 1.89678583950581e-08,
+ 1.8967025283700423e-08,
+ 1.8932304612917505e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.9050115952268243e-05,
+ 9.341621307612513e-07,
+ 6.890153372296481e-07,
+ 6.891143584653037e-07,
+ 6.886222649882257e-07
+ ],
+ "gamma_dfa": 0.11049338441807777,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9362893104553223,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 6660.841796875,
+ 217521.65625,
+ 1158874.5,
+ 1615614.625,
+ 1694436.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.212987280676316e-07,
+ 1.5324568281016582e-08,
+ 1.4045938634410504e-08,
+ 1.4053354924215e-08,
+ 1.4027999206689401e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.7352898794342764e-05,
+ 6.539408445860317e-07,
+ 5.044145154897706e-07,
+ 5.047700142313261e-07,
+ 5.048477760283276e-07
+ ],
+ "gamma_dfa": 0.11245601065456867,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9441646337509155,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 7480.24169921875,
+ 295557.40625,
+ 1585967.0,
+ 2246827.75,
+ 2356427.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.889860297727864e-07,
+ 1.193609300287335e-08,
+ 1.1067995409064224e-08,
+ 1.103960478587851e-08,
+ 1.1055576010221557e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.5521236491622403e-05,
+ 4.5597263920171827e-07,
+ 3.8742672359148855e-07,
+ 3.8764648024880444e-07,
+ 3.877208314406744e-07
+ ],
+ "gamma_dfa": 0.11317481694277376,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9356626272201538,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 8273.8408203125,
+ 388312.4375,
+ 2104540.5,
+ 3043837.75,
+ 3180222.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.619119925384439e-07,
+ 9.19370091168048e-09,
+ 8.51864179196582e-09,
+ 8.482276214749618e-09,
+ 8.476813917468462e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.4210399967851117e-05,
+ 3.5443522961031704e-07,
+ 3.0404962103602884e-07,
+ 3.0431687036980293e-07,
+ 3.0445681886703824e-07
+ ],
+ "gamma_dfa": 0.11495429277420044,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.936495304107666,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 9086.7265625,
+ 501434.3125,
+ 2767834.0,
+ 4046107.75,
+ 4214970.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.471596189934644e-07,
+ 7.524303846651037e-09,
+ 7.025830139895106e-09,
+ 7.019247405537499e-09,
+ 7.011437208603866e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3406845027930103e-05,
+ 4.39807990915142e-07,
+ 2.471441860052437e-07,
+ 2.474318421263888e-07,
+ 2.475488827258232e-07
+ ],
+ "gamma_dfa": 0.11651878873817623,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9542189836502075,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 9854.2626953125,
+ 612623.625,
+ 3485830.25,
+ 5139234.5,
+ 5346583.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.3279393701614026e-07,
+ 6.378383154981293e-09,
+ 5.839252636974379e-09,
+ 5.8299334249056756e-09,
+ 5.825462778830115e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2396733836794738e-05,
+ 2.516441668376501e-07,
+ 2.0780194631697668e-07,
+ 2.0795941679807584e-07,
+ 2.080748373600727e-07
+ ],
+ "gamma_dfa": 0.11470737145282328,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9374217987060547,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 10653.666015625,
+ 745430.125,
+ 4325399.0,
+ 6434218.5,
+ 6688000.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.1187355514484807e-07,
+ 5.294193083926757e-09,
+ 4.98529528769609e-09,
+ 4.991081326011226e-09,
+ 4.989251234377434e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1210328011657111e-05,
+ 2.000140426616781e-07,
+ 1.7647043648594263e-07,
+ 1.7654315342952032e-07,
+ 1.7665543339262513e-07
+ ],
+ "gamma_dfa": 0.11383607180323452,
+ "acc_eval": 0.291015625,
+ "loss_eval": 1.9233126640319824,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11404.5263671875,
+ 893037.0625,
+ 5298411.0,
+ 7870617.0,
+ 8170729.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.9957101926593168e-07,
+ 4.642851436642559e-09,
+ 4.288450483613815e-09,
+ 4.285100718703916e-09,
+ 4.289933297485504e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0866175216506235e-05,
+ 1.758858729772328e-07,
+ 1.538420519864303e-07,
+ 1.5386244456294662e-07,
+ 1.5397839092656795e-07
+ ],
+ "gamma_dfa": 0.1139617893495597,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.932279109954834,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 12171.2412109375,
+ 1062066.875,
+ 6388639.0,
+ 9528923.0,
+ 9891447.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.9334000000981177e-07,
+ 4.044033108385747e-09,
+ 3.810601167941741e-09,
+ 3.801854830953744e-09,
+ 3.8046659156520946e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0322088201064616e-05,
+ 1.529211743900305e-07,
+ 1.350435638869385e-07,
+ 1.3504063645086717e-07,
+ 1.3514510044387862e-07
+ ],
+ "gamma_dfa": 0.11320225725648925,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.921454906463623,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 12924.974609375,
+ 1273988.625,
+ 7574387.5,
+ 11500420.0,
+ 11920183.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.8497563303299103e-07,
+ 3.6160896499382034e-09,
+ 3.388503477808058e-09,
+ 3.385580482628825e-09,
+ 3.3854716807724117e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.76746559899766e-06,
+ 1.3485876593222201e-07,
+ 1.1896084117779537e-07,
+ 1.1894425000491538e-07,
+ 1.1903343022368063e-07
+ ],
+ "gamma_dfa": 0.11276883230311796,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9356281757354736,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 13632.109375,
+ 1465148.75,
+ 8873670.0,
+ 13535396.0,
+ 14019399.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7523743167657813e-07,
+ 3.18161341716916e-09,
+ 3.0166942277531916e-09,
+ 3.0173783471809656e-09,
+ 3.0215525637089513e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.427177246834617e-06,
+ 1.1933295240851294e-07,
+ 1.0663712401992598e-07,
+ 1.0661205607220836e-07,
+ 1.0669979388922002e-07
+ ],
+ "gamma_dfa": 0.11264261469477788,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.926081657409668,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 14394.1845703125,
+ 1699121.5,
+ 10379340.0,
+ 15814831.0,
+ 16377349.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6784264289526618e-07,
+ 2.8936604223872564e-09,
+ 2.7336535257660444e-09,
+ 2.7314879247342105e-09,
+ 2.733708148738856e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.04797616385622e-06,
+ 1.087723191517398e-07,
+ 9.662341682314946e-08,
+ 9.658959498892727e-08,
+ 9.665905764677518e-08
+ ],
+ "gamma_dfa": 0.11253939801827073,
+ "acc_eval": 0.3154296875,
+ "loss_eval": 1.922888994216919,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 15138.509765625,
+ 1969752.0,
+ 12071423.0,
+ 18393228.0,
+ 19044056.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5837277089758572e-07,
+ 2.609559235366987e-09,
+ 2.4664128517315476e-09,
+ 2.4639881246457662e-09,
+ 2.4657431652030937e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.502225682605058e-06,
+ 9.664965716638108e-08,
+ 8.704243725787819e-08,
+ 8.700892806245974e-08,
+ 8.707356613513184e-08
+ ],
+ "gamma_dfa": 0.11155363742727786,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9243314266204834,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 15811.982421875,
+ 2268261.5,
+ 13867645.0,
+ 21375086.0,
+ 22149420.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5073908343765652e-07,
+ 2.376487229227564e-09,
+ 2.2317030445861974e-09,
+ 2.2317414583028494e-09,
+ 2.2311954506193388e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.195236659958027e-06,
+ 8.728681422098816e-08,
+ 7.846901439734211e-08,
+ 7.84395552955175e-08,
+ 7.849664029890846e-08
+ ],
+ "gamma_dfa": 0.11315422086045146,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.924652338027954,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 16487.935546875,
+ 2556303.5,
+ 15702076.0,
+ 24321856.0,
+ 25185988.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.443007136003871e-07,
+ 2.174122659681643e-09,
+ 2.0514809850880056e-09,
+ 2.052057856971601e-09,
+ 2.05182382195801e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.002187314559706e-06,
+ 8.025331510452816e-08,
+ 7.266314838716426e-08,
+ 7.2638087544874e-08,
+ 7.268938162496852e-08
+ ],
+ "gamma_dfa": 0.11267373809823766,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9348869323730469,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 17153.216796875,
+ 2908610.25,
+ 17831918.0,
+ 27718528.0,
+ 28682196.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.43127067531168e-07,
+ 2.0134633960111614e-09,
+ 1.908325941712974e-09,
+ 1.9070569567958273e-09,
+ 1.9050578892176873e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.550354439445073e-06,
+ 7.309487415341209e-08,
+ 6.660556550741603e-08,
+ 6.657593587533484e-08,
+ 6.66217090383725e-08
+ ],
+ "gamma_dfa": 0.11266892295680009,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9210036993026733,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 17796.001953125,
+ 3236156.25,
+ 20246900.0,
+ 31494576.0,
+ 32571052.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.3518946673229948e-07,
+ 1.8474217711172969e-09,
+ 1.7507182370479768e-09,
+ 1.7496273319039801e-09,
+ 1.7511733174657707e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.284599632839672e-06,
+ 6.709063882226474e-08,
+ 6.151606157800416e-08,
+ 6.149030440383285e-08,
+ 6.153235432293513e-08
+ ],
+ "gamma_dfa": 0.11186322406865656,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9283114671707153,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 18460.63671875,
+ 3604280.25,
+ 22626418.0,
+ 35429216.0,
+ 36622356.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.3137012899733236e-07,
+ 1.7567419741126855e-09,
+ 1.6593408869169934e-09,
+ 1.6595901319860218e-09,
+ 1.6608053821087765e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.130098310881294e-06,
+ 6.264485108431472e-08,
+ 5.731577701340029e-08,
+ 5.729528851361465e-08,
+ 5.733248187311801e-08
+ ],
+ "gamma_dfa": 0.11299802124267444,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.942992925643921,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 19115.904296875,
+ 4038094.25,
+ 25405536.0,
+ 39835936.0,
+ 41154148.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2640579427625198e-07,
+ 1.5953075527264104e-09,
+ 1.5003157605164574e-09,
+ 1.4991035079958692e-09,
+ 1.4979777418488993e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.799941729696002e-06,
+ 5.7522207441706996e-08,
+ 5.297441418861126e-08,
+ 5.2952817242157835e-08,
+ 5.298943506204523e-08
+ ],
+ "gamma_dfa": 0.11197824770351872,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.9319748878479004,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 19780.572265625,
+ 4490110.5,
+ 28153634.0,
+ 44291160.0,
+ 45731404.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2269519800156559e-07,
+ 1.4798114955638653e-09,
+ 1.4102843337582271e-09,
+ 1.4097069067631196e-09,
+ 1.4109671209183716e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.577545264008222e-06,
+ 5.327013141709358e-08,
+ 4.94958669605694e-08,
+ 4.9476955865657146e-08,
+ 4.950964083150211e-08
+ ],
+ "gamma_dfa": 0.11252723945653997,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9247620105743408,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 20381.6796875,
+ 4929967.0,
+ 30880866.0,
+ 48905308.0,
+ 50483824.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1911821928833888e-07,
+ 1.377626124288156e-09,
+ 1.3317531522005766e-09,
+ 1.3313244950907688e-09,
+ 1.3306112878197496e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.326347829599399e-06,
+ 4.955709798082353e-08,
+ 4.649340468176888e-08,
+ 4.6477893533847237e-08,
+ 4.650862805988254e-08
+ ],
+ "gamma_dfa": 0.11152978462632746,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9170689582824707,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 21001.544921875,
+ 5444194.5,
+ 33907076.0,
+ 53832084.0,
+ 55554724.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1559290413742929e-07,
+ 1.3061883796794405e-09,
+ 1.2378150726632953e-09,
+ 1.2379912650573033e-09,
+ 1.2384089309591673e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.23212235950632e-06,
+ 4.7021419646853246e-08,
+ 4.3998962695468435e-08,
+ 4.3984215380987735e-08,
+ 4.4011432720481025e-08
+ ],
+ "gamma_dfa": 0.11285935762862209,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.9198743104934692,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 21623.64453125,
+ 5895143.0,
+ 37025488.0,
+ 58791348.0,
+ 60687928.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1377478870144841e-07,
+ 1.2547849426169932e-09,
+ 1.1888731110687445e-09,
+ 1.1877619998656996e-09,
+ 1.1896320595283782e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.024939921189798e-06,
+ 4.443810297516393e-08,
+ 4.161294953064498e-08,
+ 4.159920763413538e-08,
+ 4.162497546644772e-08
+ ],
+ "gamma_dfa": 0.11188641694025137,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.917163372039795,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 22195.29296875,
+ 6369258.5,
+ 40117404.0,
+ 64235468.0,
+ 66270544.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1021134582733794e-07,
+ 1.153794726427293e-09,
+ 1.1123471033158694e-09,
+ 1.1119479781385166e-09,
+ 1.1122585075185043e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.96408472119947e-06,
+ 4.2022573865097e-08,
+ 3.954471239353552e-08,
+ 3.953241289877951e-08,
+ 3.955623029128219e-08
+ ],
+ "gamma_dfa": 0.11316103948047385,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9332935810089111,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 22786.513671875,
+ 6899202.5,
+ 43496572.0,
+ 69758712.0,
+ 71960648.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0609301170916297e-07,
+ 1.1096534802135238e-09,
+ 1.05872854927469e-09,
+ 1.0590027743617725e-09,
+ 1.0579482845329835e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.711301128030755e-06,
+ 3.962547268088201e-08,
+ 3.742779952631281e-08,
+ 3.741677900848117e-08,
+ 3.743992138538488e-08
+ ],
+ "gamma_dfa": 0.11225346029095817,
+ "acc_eval": 0.31640625,
+ "loss_eval": 1.9247596263885498,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 23367.078125,
+ 7480530.0,
+ 47061616.0,
+ 75610000.0,
+ 77981320.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.054115728038596e-07,
+ 1.0618838031106748e-09,
+ 1.0191184562913236e-09,
+ 1.01949926278877e-09,
+ 1.0192180432966325e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.768360097135883e-06,
+ 3.826109207238915e-08,
+ 3.593911657162607e-08,
+ 3.592855790657268e-08,
+ 3.594948694285449e-08
+ ],
+ "gamma_dfa": 0.11492819089471595,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.939026117324829,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 23912.85546875,
+ 8053234.0,
+ 51027352.0,
+ 81931568.0,
+ 84515616.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0266481353937706e-07,
+ 9.919576271499864e-10,
+ 9.572211912001194e-10,
+ 9.572932446744176e-10,
+ 9.577664217275128e-10
+ ],
+ "bp_grad_norms_F": [
+ 5.472421435115393e-06,
+ 3.587240016145188e-08,
+ 3.39712649122248e-08,
+ 3.396091940999213e-08,
+ 3.398050552050336e-08
+ ],
+ "gamma_dfa": 0.11253271601162851,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9187253713607788,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 24486.8359375,
+ 8682399.0,
+ 55030492.0,
+ 88236184.0,
+ 91025880.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0101911129822838e-07,
+ 9.702203485062455e-10,
+ 9.30652499508966e-10,
+ 9.30728105696943e-10,
+ 9.303261494508774e-10
+ ],
+ "bp_grad_norms_F": [
+ 5.286908617563313e-06,
+ 3.4072087373715476e-08,
+ 3.2386065385026086e-08,
+ 3.2376764380614986e-08,
+ 3.2396076932172946e-08
+ ],
+ "gamma_dfa": 0.11125053715659305,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9214520454406738,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 25051.91796875,
+ 9255517.0,
+ 58776788.0,
+ 94748472.0,
+ 97725744.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.793318156425812e-08,
+ 9.150468716079274e-10,
+ 8.747003676923271e-10,
+ 8.746902091516517e-10,
+ 8.743750723461119e-10
+ ],
+ "bp_grad_norms_F": [
+ 5.294927632348845e-06,
+ 3.279593840943562e-08,
+ 3.115108881956985e-08,
+ 3.114205782139834e-08,
+ 3.115993862934374e-08
+ ],
+ "gamma_dfa": 0.11356210591475246,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9334189891815186,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 25539.400390625,
+ 9852175.0,
+ 62733436.0,
+ 101270040.0,
+ 104412528.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.590952032567657e-08,
+ 8.831190223546059e-10,
+ 8.506708115696426e-10,
+ 8.503630022360653e-10,
+ 8.506205184666271e-10
+ ],
+ "bp_grad_norms_F": [
+ 5.156022325536469e-06,
+ 3.1347209272780674e-08,
+ 2.992178593785866e-08,
+ 2.9913682197957314e-08,
+ 2.9930919964726854e-08
+ ],
+ "gamma_dfa": 0.11300312746607233,
+ "acc_eval": 0.3291015625,
+ "loss_eval": 1.9240946769714355,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 26058.23046875,
+ 10503947.0,
+ 66954420.0,
+ 108182184.0,
+ 111535672.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.312070403666439e-08,
+ 8.298656206662258e-10,
+ 8.076765367626138e-10,
+ 8.076487811869981e-10,
+ 8.083505531608637e-10
+ ],
+ "bp_grad_norms_F": [
+ 5.084062195237493e-06,
+ 3.008365112577849e-08,
+ 2.8773875726528786e-08,
+ 2.8766294235538226e-08,
+ 2.878227967073599e-08
+ ],
+ "gamma_dfa": 0.11286510003083094,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9284429550170898,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 26547.951171875,
+ 11128081.0,
+ 71119440.0,
+ 115305784.0,
+ 118851064.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.278523549482998e-08,
+ 8.024952369289906e-10,
+ 7.701798643289237e-10,
+ 7.699446635811569e-10,
+ 7.706733029522184e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.915013960271608e-06,
+ 2.8781727223758935e-08,
+ 2.7522533585511155e-08,
+ 2.751522920618754e-08,
+ 2.7530596469205193e-08
+ ],
+ "gamma_dfa": 0.11193350053144968,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9189305305480957,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 27052.158203125,
+ 11815623.0,
+ 75267568.0,
+ 122747224.0,
+ 126538816.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.042137349979384e-08,
+ 7.699976212194315e-10,
+ 7.406790181185841e-10,
+ 7.406811275423308e-10,
+ 7.407266466863405e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.783120857609902e-06,
+ 2.7648876965713498e-08,
+ 2.6492134708178128e-08,
+ 2.6485189152936073e-08,
+ 2.6500073246893407e-08
+ ],
+ "gamma_dfa": 0.1119252087228233,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9200191497802734,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 27573.439453125,
+ 12446571.0,
+ 79631776.0,
+ 129906592.0,
+ 133912576.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.999781897500725e-08,
+ 7.431448234562765e-10,
+ 7.212022645752825e-10,
+ 7.211930497241781e-10,
+ 7.215293917894883e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.7411135710717645e-06,
+ 2.6746526771148638e-08,
+ 2.567137080689008e-08,
+ 2.566465262532347e-08,
+ 2.5678824400188205e-08
+ ],
+ "gamma_dfa": 0.1126710368462227,
+ "acc_eval": 0.3291015625,
+ "loss_eval": 1.9156131744384766,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 28020.1953125,
+ 13139046.0,
+ 84357848.0,
+ 137652880.0,
+ 141892912.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.93968845616655e-08,
+ 7.234106647047156e-10,
+ 7.015109604324721e-10,
+ 7.013014613477253e-10,
+ 7.019884118442121e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.706852905655978e-06,
+ 2.5948086346261334e-08,
+ 2.480862271170281e-08,
+ 2.4802661258149783e-08,
+ 2.4816182886411298e-08
+ ],
+ "gamma_dfa": 0.11299434299689892,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.917637825012207,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 28489.8828125,
+ 13728548.0,
+ 88388480.0,
+ 144432224.0,
+ 148906448.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.832166287220389e-08,
+ 7.007013858029154e-10,
+ 6.849794620400473e-10,
+ 6.849559253119253e-10,
+ 6.857461820608535e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.678155619330937e-06,
+ 2.5201579489930737e-08,
+ 2.418770428391781e-08,
+ 2.4181909807907687e-08,
+ 2.419472266979028e-08
+ ],
+ "gamma_dfa": 0.11410953500489995,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9333336353302002,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 28918.5546875,
+ 14414132.0,
+ 92681240.0,
+ 151898304.0,
+ 156571040.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.454645694655483e-08,
+ 6.792187368098723e-10,
+ 6.553820264265653e-10,
+ 6.554308207284976e-10,
+ 6.556304388283252e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.511462066147942e-06,
+ 2.4275013998931172e-08,
+ 2.338800797474505e-08,
+ 2.338238225263467e-08,
+ 2.3394919779207157e-08
+ ],
+ "gamma_dfa": 0.11213390928969602,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.9155462980270386,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 29332.80078125,
+ 15055747.0,
+ 96975336.0,
+ 159279984.0,
+ 164189344.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.274933804841567e-08,
+ 6.447524736330479e-10,
+ 6.278008113369538e-10,
+ 6.277455777414787e-10,
+ 6.275664987676066e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.426053692441201e-06,
+ 2.3487833900048827e-08,
+ 2.272233956546188e-08,
+ 2.2717028258512073e-08,
+ 2.272915367029782e-08
+ ],
+ "gamma_dfa": 0.11223121372131573,
+ "acc_eval": 0.3173828125,
+ "loss_eval": 1.9162096977233887,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 29736.349609375,
+ 15823423.0,
+ 101458080.0,
+ 166481584.0,
+ 171638352.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.434898290943238e-08,
+ 6.55440757224568e-10,
+ 6.384029416217629e-10,
+ 6.384751061183636e-10,
+ 6.382625539202991e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.4675143726635724e-06,
+ 2.308258295613541e-08,
+ 2.2235047580920764e-08,
+ 2.2229942331364327e-08,
+ 2.2241332331418562e-08
+ ],
+ "gamma_dfa": 0.11349940555010107,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.935542106628418,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 30168.33984375,
+ 16512403.0,
+ 106240736.0,
+ 174293312.0,
+ 179686352.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.255891259523196e-08,
+ 6.180955192114368e-10,
+ 6.070984825967685e-10,
+ 6.070359770404821e-10,
+ 6.068190394614703e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.380563041195273e-06,
+ 2.227099038520919e-08,
+ 2.156298606337259e-08,
+ 2.1558207663474604e-08,
+ 2.1569489305761635e-08
+ ],
+ "gamma_dfa": 0.11322060551538016,
+ "acc_eval": 0.3212890625,
+ "loss_eval": 1.9260894060134888,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 30560.10546875,
+ 17240642.0,
+ 111300408.0,
+ 182109792.0,
+ 187762288.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.14508851476603e-08,
+ 6.030238530740917e-10,
+ 5.890909982042558e-10,
+ 5.890405385677866e-10,
+ 5.88881721164114e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.2523201955191325e-06,
+ 2.1578937747790405e-08,
+ 2.0878760054188206e-08,
+ 2.0874194817110947e-08,
+ 2.08853556671329e-08
+ ],
+ "gamma_dfa": 0.11227845895700739,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.9136857986450195,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 30927.453125,
+ 17981622.0,
+ 115698520.0,
+ 189446720.0,
+ 195329056.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.999796736157805e-08,
+ 5.827110460820961e-10,
+ 5.688347570753649e-10,
+ 5.688115534141502e-10,
+ 5.69402469619007e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.254153282090556e-06,
+ 2.1111715042820833e-08,
+ 2.044158087244341e-08,
+ 2.043698899001356e-08,
+ 2.0447874504725405e-08
+ ],
+ "gamma_dfa": 0.11285097184736514,
+ "acc_eval": 0.3251953125,
+ "loss_eval": 1.9130818843841553,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 31297.09765625,
+ 18680606.0,
+ 120312440.0,
+ 197032272.0,
+ 203114064.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.911415877970285e-08,
+ 5.74776504169705e-10,
+ 5.532440061628563e-10,
+ 5.531197722064007e-10,
+ 5.533422053893844e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.17833052779315e-06,
+ 2.0621358842731752e-08,
+ 1.9960678443453617e-08,
+ 1.9956562624656726e-08,
+ 1.9966993392017685e-08
+ ],
+ "gamma_dfa": 0.11243592749451636,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9191365242004395,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 31637.244140625,
+ 19360764.0,
+ 124754384.0,
+ 204064768.0,
+ 210382992.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.003268447964729e-08,
+ 5.749308251701279e-10,
+ 5.599746222273438e-10,
+ 5.599968821989876e-10,
+ 5.599694041791281e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.128593900531996e-06,
+ 2.0178502424528233e-08,
+ 1.9575201903876405e-08,
+ 1.9571228193626666e-08,
+ 1.9581117172151608e-08
+ ],
+ "gamma_dfa": 0.11233749791426817,
+ "acc_eval": 0.330078125,
+ "loss_eval": 1.9152377843856812,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 31964.60546875,
+ 20067444.0,
+ 128969536.0,
+ 211772368.0,
+ 218247696.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.774531951554309e-08,
+ 5.427598370744136e-10,
+ 5.298457228519737e-10,
+ 5.297982053065198e-10,
+ 5.30141264221129e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.058078957314137e-06,
+ 1.9621586133666824e-08,
+ 1.90722975190738e-08,
+ 1.9068517431719556e-08,
+ 1.907839575210346e-08
+ ],
+ "gamma_dfa": 0.11183859535958618,
+ "acc_eval": 0.328125,
+ "loss_eval": 1.9089019298553467,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 32292.658203125,
+ 20829408.0,
+ 133566216.0,
+ 219264704.0,
+ 225938912.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.692310788343093e-08,
+ 5.312774109533791e-10,
+ 5.173871886476888e-10,
+ 5.171740258269608e-10,
+ 5.173406147918058e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.047169568366371e-06,
+ 1.926170511978853e-08,
+ 1.867934962263007e-08,
+ 1.8675748947316606e-08,
+ 1.868521692927061e-08
+ ],
+ "gamma_dfa": 0.11216733865148854,
+ "acc_eval": 0.330078125,
+ "loss_eval": 1.917893886566162,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 32582.02734375,
+ 21555154.0,
+ 138235216.0,
+ 226622112.0,
+ 233550816.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.588336359276582e-08,
+ 5.294207294781472e-10,
+ 5.160025184913763e-10,
+ 5.156744475875996e-10,
+ 5.168100947194887e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.991732683061855e-06,
+ 1.8877956975416055e-08,
+ 1.8321758332717764e-08,
+ 1.831830331866513e-08,
+ 1.832757234865312e-08
+ ],
+ "gamma_dfa": 0.11230919507215731,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.913461685180664,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 32871.28125,
+ 22246662.0,
+ 142493184.0,
+ 233885040.0,
+ 241005264.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.552973357860537e-08,
+ 5.124695112712629e-10,
+ 4.966513311721599e-10,
+ 4.966223543512172e-10,
+ 4.969377687125132e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.012842964584706e-06,
+ 1.8570215587487837e-08,
+ 1.8001765411668202e-08,
+ 1.799840099181438e-08,
+ 1.800739823920594e-08
+ ],
+ "gamma_dfa": 0.11296637258055853,
+ "acc_eval": 0.33203125,
+ "loss_eval": 1.9206554889678955,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 33169.98828125,
+ 22902584.0,
+ 146822496.0,
+ 241191920.0,
+ 248487904.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.486269026912851e-08,
+ 4.992010138593628e-10,
+ 4.874242676145002e-10,
+ 4.874663450671335e-10,
+ 4.884102011715186e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.938752797694178e-06,
+ 1.8166964821375586e-08,
+ 1.767327617585579e-08,
+ 1.7670013008341812e-08,
+ 1.7678777552987412e-08
+ ],
+ "gamma_dfa": 0.11258088904469332,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.913904070854187,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 33456.9140625,
+ 23628216.0,
+ 151346624.0,
+ 248325424.0,
+ 255824304.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.482947239623172e-08,
+ 5.02439700955648e-10,
+ 4.890933769097217e-10,
+ 4.891700933207233e-10,
+ 4.892242166931737e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.895439022016944e-06,
+ 1.781435265968412e-08,
+ 1.7326955870089478e-08,
+ 1.7324007117736073e-08,
+ 1.7332443036366385e-08
+ ],
+ "gamma_dfa": 0.11223017568408977,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9154590368270874,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 33716.85546875,
+ 24280678.0,
+ 155270816.0,
+ 255050304.0,
+ 262737184.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.482827157900829e-08,
+ 4.958616850458952e-10,
+ 4.826584132366918e-10,
+ 4.826221089437865e-10,
+ 4.828137889489881e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.898983777617104e-06,
+ 1.7600514823357116e-08,
+ 1.7106302152569697e-08,
+ 1.7103344518432095e-08,
+ 1.7111482009113388e-08
+ ],
+ "gamma_dfa": 0.11287979638109391,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9285999536514282,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 33981.390625,
+ 24925848.0,
+ 159148752.0,
+ 261662432.0,
+ 269540768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.396101153744894e-08,
+ 4.846232304345222e-10,
+ 4.728849534174628e-10,
+ 4.72891226177552e-10,
+ 4.725210223099907e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.847520019917283e-06,
+ 1.7274359720431676e-08,
+ 1.6806101399424733e-08,
+ 1.6803195279635474e-08,
+ 1.681126526875687e-08
+ ],
+ "gamma_dfa": 0.11251267153238587,
+ "acc_eval": 0.330078125,
+ "loss_eval": 1.913767695426941,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 34242.87890625,
+ 25494510.0,
+ 162965072.0,
+ 268190960.0,
+ 276245600.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.276207725226413e-08,
+ 4.64974586611433e-10,
+ 4.573621481540613e-10,
+ 4.5720988106623395e-10,
+ 4.578690204759539e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.846054823952727e-06,
+ 1.7068730429059542e-08,
+ 1.6637597965996065e-08,
+ 1.663470783341836e-08,
+ 1.6642776046182917e-08
+ ],
+ "gamma_dfa": 0.11268835317605408,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9175846576690674,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 34498.37890625,
+ 26013872.0,
+ 166717360.0,
+ 274736192.0,
+ 282985952.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.275441760157264e-08,
+ 4.638447681504232e-10,
+ 4.554343846496778e-10,
+ 4.5541673210358624e-10,
+ 4.558452226799403e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.7814804727531737e-06,
+ 1.6729790885960938e-08,
+ 1.629800472358056e-08,
+ 1.629528156854576e-08,
+ 1.630315793477166e-08
+ ],
+ "gamma_dfa": 0.11192971542368468,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9148613214492798,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 34741.75390625,
+ 26574266.0,
+ 170266464.0,
+ 280835296.0,
+ 289264896.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.206668328763044e-08,
+ 4.543688481017938e-10,
+ 4.4642781138470866e-10,
+ 4.464762171085823e-10,
+ 4.4638817642272954e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.800365902861813e-06,
+ 1.6550599113429598e-08,
+ 1.6135599523181554e-08,
+ 1.6132924329781417e-08,
+ 1.6140655034746487e-08
+ ],
+ "gamma_dfa": 0.11263992198291817,
+ "acc_eval": 0.328125,
+ "loss_eval": 1.9202332496643066,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 34981.7578125,
+ 27132752.0,
+ 173824032.0,
+ 286969856.0,
+ 295549056.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.146741154429037e-08,
+ 4.5107212409689623e-10,
+ 4.4140177624107935e-10,
+ 4.4141457156143815e-10,
+ 4.4168110835407504e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.7655997857655166e-06,
+ 1.6349241960256222e-08,
+ 1.5922701379622595e-08,
+ 1.5920058160645567e-08,
+ 1.592757570278991e-08
+ ],
+ "gamma_dfa": 0.11310465578208095,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9224812984466553,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 35201.25,
+ 27683016.0,
+ 177040880.0,
+ 292723872.0,
+ 301473504.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.122528700165276e-08,
+ 4.486005733550513e-10,
+ 4.4048292791032395e-10,
+ 4.4043477198663084e-10,
+ 4.4109013663806707e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.748537892533932e-06,
+ 1.6115603074240425e-08,
+ 1.5725172275438126e-08,
+ 1.572264451965566e-08,
+ 1.5729948898979274e-08
+ ],
+ "gamma_dfa": 0.11326105792613816,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9233062267303467,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 35399.75390625,
+ 28156860.0,
+ 180111792.0,
+ 298457728.0,
+ 307298976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.082014974457707e-08,
+ 4.4495629403229486e-10,
+ 4.324987312731565e-10,
+ 4.3260212079232474e-10,
+ 4.3259393289751813e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.685790488816565e-06,
+ 1.5895359695150546e-08,
+ 1.5473323955461638e-08,
+ 1.547100403342938e-08,
+ 1.5478214265840506e-08
+ ],
+ "gamma_dfa": 0.11222807004196511,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9198863506317139,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 35584.6640625,
+ 28666806.0,
+ 183522992.0,
+ 303940064.0,
+ 312955008.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.149574088316513e-08,
+ 4.4883607941414994e-10,
+ 4.353337967888393e-10,
+ 4.3539158389727106e-10,
+ 4.35594643688475e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.6930814530933276e-06,
+ 1.5769751726679715e-08,
+ 1.5353194271483517e-08,
+ 1.535078197889561e-08,
+ 1.5357914051605803e-08
+ ],
+ "gamma_dfa": 0.11321029500413715,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9162211418151855,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 35768.86328125,
+ 29145662.0,
+ 186551392.0,
+ 308909184.0,
+ 318089856.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.985555245364594e-08,
+ 4.355726057614362e-10,
+ 4.2523776166980554e-10,
+ 4.251851093428627e-10,
+ 4.2568140679044575e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.7230390717013506e-06,
+ 1.5615523096812467e-08,
+ 1.523139303571952e-08,
+ 1.522908021911462e-08,
+ 1.5236116368555486e-08
+ ],
+ "gamma_dfa": 0.11393742701784504,
+ "acc_eval": 0.31640625,
+ "loss_eval": 1.9276196956634521,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 35944.30859375,
+ 29545796.0,
+ 189503824.0,
+ 313822880.0,
+ 323180096.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.027381343505112e-08,
+ 4.2508935260698877e-10,
+ 4.156285593470699e-10,
+ 4.156731903126598e-10,
+ 4.1562600583411324e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.67820075553027e-06,
+ 1.5450812185235918e-08,
+ 1.5081118576176777e-08,
+ 1.5078812864999236e-08,
+ 1.5085870330722173e-08
+ ],
+ "gamma_dfa": 0.11295431066082529,
+ "acc_eval": 0.3251953125,
+ "loss_eval": 1.9145984649658203,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 36107.91015625,
+ 29963964.0,
+ 192509232.0,
+ 318614048.0,
+ 328116416.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.995779955332182e-08,
+ 4.257695862541766e-10,
+ 4.1527120631101866e-10,
+ 4.1522696392348735e-10,
+ 4.1541275974665837e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.6363949220685754e-06,
+ 1.5271682585193957e-08,
+ 1.4899570466297973e-08,
+ 1.4897324263074552e-08,
+ 1.4904214751254585e-08
+ ],
+ "gamma_dfa": 0.11261070579712396,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9148796796798706,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 36263.38671875,
+ 30397186.0,
+ 195132224.0,
+ 323205344.0,
+ 332809856.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.94296602432587e-08,
+ 4.221426264106043e-10,
+ 4.1666703420872864e-10,
+ 4.166992584320184e-10,
+ 4.166444134146019e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.677051836348255e-06,
+ 1.5217779036902357e-08,
+ 1.486149248108859e-08,
+ 1.4859250718757266e-08,
+ 1.4866162523219373e-08
+ ],
+ "gamma_dfa": 0.11349719034842565,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.9238262176513672,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 36417.9921875,
+ 30770712.0,
+ 197719328.0,
+ 327539232.0,
+ 337245152.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.906716976118332e-08,
+ 4.1953429619212557e-10,
+ 4.080901727654407e-10,
+ 4.080701054842706e-10,
+ 4.0843109450072745e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.6080327845411375e-06,
+ 1.500828084033401e-08,
+ 1.4656276192681617e-08,
+ 1.465407439837918e-08,
+ 1.466091692492455e-08
+ ],
+ "gamma_dfa": 0.11264980123269197,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9172749519348145,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 36554.734375,
+ 31127202.0,
+ 200166992.0,
+ 331766240.0,
+ 341638624.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.895474768953136e-08,
+ 4.153002663986882e-10,
+ 4.053070101761591e-10,
+ 4.0528172484677327e-10,
+ 4.0563402636806245e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5790299079963006e-06,
+ 1.4871366360580396e-08,
+ 1.4521869928785236e-08,
+ 1.4519704549798007e-08,
+ 1.4526481351140319e-08
+ ],
+ "gamma_dfa": 0.1125820265888251,
+ "acc_eval": 0.3291015625,
+ "loss_eval": 1.90960693359375,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 36685.06640625,
+ 31478428.0,
+ 202703456.0,
+ 335890528.0,
+ 345860736.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.840604527269534e-08,
+ 4.11831152513642e-10,
+ 4.0155134772845713e-10,
+ 4.014005239305618e-10,
+ 4.018080868029017e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5732464311877266e-06,
+ 1.4777253198872131e-08,
+ 1.4430981742918902e-08,
+ 1.4428859884674239e-08,
+ 1.443555053270984e-08
+ ],
+ "gamma_dfa": 0.11229235199152754,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.912062644958496,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 36808.640625,
+ 31756406.0,
+ 205006400.0,
+ 339625888.0,
+ 349722048.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.845510824859957e-08,
+ 4.056126268192628e-10,
+ 3.9775802096464474e-10,
+ 3.9773195847914167e-10,
+ 3.978435358931165e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.601402113417862e-06,
+ 1.4699119255112691e-08,
+ 1.434870711136682e-08,
+ 1.4346603904868971e-08,
+ 1.4353199517813664e-08
+ ],
+ "gamma_dfa": 0.11323098125649267,
+ "acc_eval": 0.3271484375,
+ "loss_eval": 1.9194645881652832,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 36922.67578125,
+ 32105574.0,
+ 207090144.0,
+ 343260640.0,
+ 353436544.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.8447327805643e-08,
+ 4.050982882475296e-10,
+ 3.977037865698918e-10,
+ 3.9765896131527256e-10,
+ 3.979234441953139e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.603466893764562e-06,
+ 1.4652233204515142e-08,
+ 1.4306199780378392e-08,
+ 1.4304094797523703e-08,
+ 1.4310627349800598e-08
+ ],
+ "gamma_dfa": 0.11329636031587142,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.922640323638916,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 37024.05859375,
+ 32409028.0,
+ 208845456.0,
+ 346325312.0,
+ 356587104.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.819700359983472e-08,
+ 4.0326031403026263e-10,
+ 3.9583156197231517e-10,
+ 3.9586384170675615e-10,
+ 3.9581374289276994e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5432237837085268e-06,
+ 1.4486117194678627e-08,
+ 1.4156262828635136e-08,
+ 1.4154186267489877e-08,
+ 1.4160684180808403e-08
+ ],
+ "gamma_dfa": 0.11267639175457589,
+ "acc_eval": 0.31640625,
+ "loss_eval": 1.9154051542282104,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 37125.02734375,
+ 32663892.0,
+ 210781344.0,
+ 349533728.0,
+ 359873568.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.772787486397647e-08,
+ 3.9591485645473767e-10,
+ 3.875866017022389e-10,
+ 3.8754283115949306e-10,
+ 3.8766378995802597e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5503553590388037e-06,
+ 1.4420066918319208e-08,
+ 1.40893732236691e-08,
+ 1.4087291333453322e-08,
+ 1.4093810563053921e-08
+ ],
+ "gamma_dfa": 0.11297615164312447,
+ "acc_eval": 0.32421875,
+ "loss_eval": 1.913941502571106,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 37216.296875,
+ 32930840.0,
+ 212456432.0,
+ 352475008.0,
+ 362884992.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.74248425980295e-08,
+ 3.9426073517034865e-10,
+ 3.872507869928654e-10,
+ 3.8720734951702696e-10,
+ 3.8765768373139053e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.55011752617429e-06,
+ 1.4357588895563822e-08,
+ 1.402936344874206e-08,
+ 1.402732330291201e-08,
+ 1.4033815887160017e-08
+ ],
+ "gamma_dfa": 0.11311322844358074,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.914380431175232,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 37298.37890625,
+ 33147848.0,
+ 214118832.0,
+ 355022880.0,
+ 365529568.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.774458682912154e-08,
+ 3.987353780487979e-10,
+ 3.904769285689724e-10,
+ 3.904657153164237e-10,
+ 3.907260348601227e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.509487669361988e-06,
+ 1.4249152968659473e-08,
+ 1.3931584774695693e-08,
+ 1.3929625453101835e-08,
+ 1.3936028331329453e-08
+ ],
+ "gamma_dfa": 0.11238172389857937,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9106721878051758,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 37372.10546875,
+ 33388374.0,
+ 215761392.0,
+ 357596800.0,
+ 368190304.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.751073300392818e-08,
+ 3.9374201121766816e-10,
+ 3.8655822987010424e-10,
+ 3.866116038420131e-10,
+ 3.8653891198947576e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.537302973199985e-06,
+ 1.4222394817409167e-08,
+ 1.3910858243093571e-08,
+ 1.3908881157931319e-08,
+ 1.3915280483445258e-08
+ ],
+ "gamma_dfa": 0.11306001050525083,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9138463735580444,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 37442.84375,
+ 33566284.0,
+ 216908128.0,
+ 359755968.0,
+ 370379136.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.704155453007843e-08,
+ 3.923593672183756e-10,
+ 3.850708640840139e-10,
+ 3.8509884170423447e-10,
+ 3.849042473635933e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.509628641040763e-06,
+ 1.4144676541150147e-08,
+ 1.3834353218555862e-08,
+ 1.3832397449675682e-08,
+ 1.3838723056380786e-08
+ ],
+ "gamma_dfa": 0.11266809623703011,
+ "acc_eval": 0.3251953125,
+ "loss_eval": 1.9121947288513184,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 37512.11328125,
+ 33717608.0,
+ 218115872.0,
+ 361736960.0,
+ 372400416.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.701832688804643e-08,
+ 3.917752788851203e-10,
+ 3.835655681960759e-10,
+ 3.835243511662867e-10,
+ 3.835320394607322e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5144942103215726e-06,
+ 1.4111047441645042e-08,
+ 1.3798888254257236e-08,
+ 1.3796943143518092e-08,
+ 1.3803241216692186e-08
+ ],
+ "gamma_dfa": 0.11281233225781762,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.9152591228485107,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 37568.84375,
+ 33899664.0,
+ 219258560.0,
+ 363709504.0,
+ 374424128.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.695909604559347e-08,
+ 3.8868031015937277e-10,
+ 3.823757421805851e-10,
+ 3.8241659838789133e-10,
+ 3.8222841558521736e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.516150854920852e-06,
+ 1.40706539752955e-08,
+ 1.3756586092483758e-08,
+ 1.375462410635464e-08,
+ 1.3760891093284044e-08
+ ],
+ "gamma_dfa": 0.11307295318874822,
+ "acc_eval": 0.326171875,
+ "loss_eval": 1.9149377346038818,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 37613.421875,
+ 34060644.0,
+ 220322080.0,
+ 365325472.0,
+ 376109056.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.71154296583154e-08,
+ 3.8974332094987574e-10,
+ 3.834943751446218e-10,
+ 3.8340422503502225e-10,
+ 3.8375369548759863e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4982940633199178e-06,
+ 1.4013506799415154e-08,
+ 1.370163893454901e-08,
+ 1.3699707146486162e-08,
+ 1.3705942158992457e-08
+ ],
+ "gamma_dfa": 0.1128659905607492,
+ "acc_eval": 0.3212890625,
+ "loss_eval": 1.912517786026001,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 37660.46875,
+ 34177292.0,
+ 221168784.0,
+ 366778016.0,
+ 377600544.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.68943869186478e-08,
+ 3.894674860394076e-10,
+ 3.8076572450584933e-10,
+ 3.8073258434856427e-10,
+ 3.8100084198688933e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4944750950671732e-06,
+ 1.397998961039093e-08,
+ 1.3671985321650482e-08,
+ 1.3670069520799188e-08,
+ 1.3676272558882374e-08
+ ],
+ "gamma_dfa": 0.11273636969053769,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9171113967895508,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 37701.8671875,
+ 34327872.0,
+ 222020640.0,
+ 368143552.0,
+ 379001216.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.639802307972786e-08,
+ 3.87883669628053e-10,
+ 3.8044753458699176e-10,
+ 3.804264403495239e-10,
+ 3.8037359373355173e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4919537483801832e-06,
+ 1.3943878052202763e-08,
+ 1.3639727569625393e-08,
+ 1.3637805551525162e-08,
+ 1.364400148418099e-08
+ ],
+ "gamma_dfa": 0.11286781356830033,
+ "acc_eval": 0.328125,
+ "loss_eval": 1.9123945236206055,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 37739.8125,
+ 34429904.0,
+ 222737072.0,
+ 369295712.0,
+ 380185984.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.741821323430486e-08,
+ 3.8846115213431176e-10,
+ 3.8069486452130263e-10,
+ 3.8060576912357647e-10,
+ 3.809500215279371e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.500515958876349e-06,
+ 1.3945418153582523e-08,
+ 1.364027113481825e-08,
+ 1.3638369544821671e-08,
+ 1.364453350305439e-08
+ ],
+ "gamma_dfa": 0.11293645015939546,
+ "acc_eval": 0.3154296875,
+ "loss_eval": 1.917877197265625,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 37773.1484375,
+ 34523684.0,
+ 223309680.0,
+ 370332384.0,
+ 381249280.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.685363729275196e-08,
+ 3.8528755186284513e-10,
+ 3.7927344598287505e-10,
+ 3.7934516639026583e-10,
+ 3.7926364826468273e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4931999834952876e-06,
+ 1.3911479967987361e-08,
+ 1.360801249461474e-08,
+ 1.3606110904618163e-08,
+ 1.3612289961884017e-08
+ ],
+ "gamma_dfa": 0.11282484548610228,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9136494398117065,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 37800.29296875,
+ 34600436.0,
+ 223845264.0,
+ 371228288.0,
+ 382171744.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.65767956320451e-08,
+ 3.853606878045923e-10,
+ 3.7911099259879677e-10,
+ 3.789283054000947e-10,
+ 3.791919833684432e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4772997423715424e-06,
+ 1.3876966242776234e-08,
+ 1.3575736979021258e-08,
+ 1.3573847823522556e-08,
+ 1.3580010893576855e-08
+ ],
+ "gamma_dfa": 0.11266115616490424,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.912358045578003,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 37822.953125,
+ 34659448.0,
+ 224278352.0,
+ 371994688.0,
+ 382956800.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.695878340678973e-08,
+ 3.8400196911148043e-10,
+ 3.7754030457470833e-10,
+ 3.775957047036371e-10,
+ 3.7752789783240814e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.488719130473328e-06,
+ 1.387363113281026e-08,
+ 1.3571511026100325e-08,
+ 1.3569623646958462e-08,
+ 1.3575775170693305e-08
+ ],
+ "gamma_dfa": 0.11286654848299804,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9152348041534424,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 37843.71484375,
+ 34715836.0,
+ 224633712.0,
+ 372602496.0,
+ 383583840.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.682009967562408e-08,
+ 3.831650552399424e-10,
+ 3.7603772873318064e-10,
+ 3.7600736413345714e-10,
+ 3.763372669052245e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4864976896642474e-06,
+ 1.3852580416084948e-08,
+ 1.355203504971314e-08,
+ 1.3550148558749697e-08,
+ 1.3556297417949281e-08
+ ],
+ "gamma_dfa": 0.11291119743145828,
+ "acc_eval": 0.326171875,
+ "loss_eval": 1.914948582649231,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 37859.484375,
+ 34761876.0,
+ 224938096.0,
+ 373110784.0,
+ 384106720.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.677319674963655e-08,
+ 3.8410433167435087e-10,
+ 3.768680645332978e-10,
+ 3.768474976517666e-10,
+ 3.767945122579164e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.480063014649204e-06,
+ 1.3833711953736838e-08,
+ 1.3534608989118624e-08,
+ 1.3532734044474637e-08,
+ 1.3538858922856889e-08
+ ],
+ "gamma_dfa": 0.1127637956833496,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9153952598571777,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 37872.0625,
+ 34797108.0,
+ 225202544.0,
+ 373570400.0,
+ 384579200.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.67909034746117e-08,
+ 3.821318816932262e-10,
+ 3.753052590926842e-10,
+ 3.7535435870594824e-10,
+ 3.7532754681990355e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4843556022678968e-06,
+ 1.3827068379157481e-08,
+ 1.352985190550271e-08,
+ 1.3527971631788205e-08,
+ 1.3534107168311493e-08
+ ],
+ "gamma_dfa": 0.1129197701375233,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9156945943832397,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 37881.54296875,
+ 34826116.0,
+ 225403072.0,
+ 373889952.0,
+ 384906848.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.663099583192889e-08,
+ 3.844494445015556e-10,
+ 3.765425748980533e-10,
+ 3.7651176620911997e-10,
+ 3.7661743168548867e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.480702616798226e-06,
+ 1.382177039488397e-08,
+ 1.3523890451949683e-08,
+ 1.3522016395484115e-08,
+ 1.3528141273866368e-08
+ ],
+ "gamma_dfa": 0.11285195982236473,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9148646593093872,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 37889.18359375,
+ 34847784.0,
+ 225551344.0,
+ 374143840.0,
+ 385168448.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.623226767032975e-08,
+ 3.819731198007048e-10,
+ 3.7512581929632915e-10,
+ 3.752123889366743e-10,
+ 3.7511962980296687e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4782924558385275e-06,
+ 1.3813751031932497e-08,
+ 1.3516644692401769e-08,
+ 1.3514763530508844e-08,
+ 1.3520896402496874e-08
+ ],
+ "gamma_dfa": 0.11281965267244232,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9142093658447266,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 37895.046875,
+ 34865808.0,
+ 225670928.0,
+ 374345440.0,
+ 385375392.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.64825137164371e-08,
+ 3.829765116147854e-10,
+ 3.7528671836817296e-10,
+ 3.7535685670775365e-10,
+ 3.752768373832538e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4792733458743896e-06,
+ 1.3809607679604596e-08,
+ 1.3512363672418815e-08,
+ 1.3510485175061149e-08,
+ 1.351661271797866e-08
+ ],
+ "gamma_dfa": 0.11288163481003721,
+ "acc_eval": 0.32421875,
+ "loss_eval": 1.9146695137023926,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 37898.87109375,
+ 34878456.0,
+ 225750400.0,
+ 374473248.0,
+ 385506496.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.652722817079848e-08,
+ 3.8302755411834255e-10,
+ 3.759152988891401e-10,
+ 3.7595143664859165e-10,
+ 3.7588568368995823e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.480078930806485e-06,
+ 1.3808159060602065e-08,
+ 1.3511034957502943e-08,
+ 1.3509157348323697e-08,
+ 1.351528045034911e-08
+ ],
+ "gamma_dfa": 0.1128929610213163,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.9147298336029053,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 37900.7109375,
+ 34885860.0,
+ 225787696.0,
+ 374537472.0,
+ 385572896.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.630104820715133e-08,
+ 3.8308795025088216e-10,
+ 3.7579228617801164e-10,
+ 3.7582850720419003e-10,
+ 3.7576297629016153e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4770955608109944e-06,
+ 1.3803015619373582e-08,
+ 1.3505847995531894e-08,
+ 1.3503973050887907e-08,
+ 1.3510093488378061e-08
+ ],
+ "gamma_dfa": 0.11285188281362935,
+ "acc_eval": 0.3212890625,
+ "loss_eval": 1.9143996238708496,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 37902.46875,
+ 34890740.0,
+ 225820192.0,
+ 374593792.0,
+ 385630976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.624973991620209e-08,
+ 3.8267702895389277e-10,
+ 3.7545791475857015e-10,
+ 3.7555664134103495e-10,
+ 3.75430270205257e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.476953224890167e-06,
+ 1.3801756182374447e-08,
+ 1.350452816240022e-08,
+ 1.3502653217756233e-08,
+ 1.3508774543424806e-08
+ ],
+ "gamma_dfa": 0.11284657929081732,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.9143402576446533,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 37903.22265625,
+ 34893256.0,
+ 225836736.0,
+ 374620576.0,
+ 385658624.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.627380599866228e-08,
+ 3.8272779390169376e-10,
+ 3.7550038078926207e-10,
+ 3.7559910737172686e-10,
+ 3.7547268072479767e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.477006657703896e-06,
+ 1.3801344067587706e-08,
+ 1.3504034335198867e-08,
+ 1.350215939055488e-08,
+ 1.3508279828045033e-08
+ ],
+ "gamma_dfa": 0.11284785682073561,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.9143691062927246,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 37903.25,
+ 34893376.0,
+ 225837280.0,
+ 374621408.0,
+ 385659456.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.626758874972438e-08,
+ 3.826984007471168e-10,
+ 3.755481758904722e-10,
+ 3.756469302285126e-10,
+ 3.755204758260078e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.476960500847781e-06,
+ 1.3801311204986177e-08,
+ 1.3503997919883659e-08,
+ 1.3502122975239672e-08,
+ 1.3508243412729826e-08
+ ],
+ "gamma_dfa": 0.11284651984533411,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.9143500328063965,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file