diff options
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_evolution_s123.json')
| -rw-r--r-- | results/snapshot_evolution_v2/snapshot_evolution_s123.json | 5473 |
1 files changed, 5473 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s123.json b/results/snapshot_evolution_v2/snapshot_evolution_s123.json new file mode 100644 index 0000000..4ccefc8 --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_evolution_s123.json @@ -0,0 +1,5473 @@ +{ + "config": { + "output_dir": "results/snapshot_evolution_v2", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256, + "log_every": 1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009977436857298017, + 0.000992251792922616, + 0.0009848480112850666, + 0.0009761073160916567, + 0.0009735578205436468 + ], + "bp_grad_norms_F": [ + 0.035340383648872375, + 0.03499162197113037, + 0.03454425558447838, + 0.034113530069589615, + 0.033874060958623886 + ], + "gamma_dfa": NaN, + "acc_eval": 0.095703125, + "loss_eval": 2.486203908920288, + "epoch": 0 + }, + { + "hidden_norms": [ + 78.8471908569336, + 81.27874755859375, + 85.74082946777344, + 93.0085678100586, + 99.78337860107422 + ], + "bp_grad_norms_per_sample_med": [ + 5.44870927114971e-05, + 5.06363830936607e-05, + 4.9749945901567116e-05, + 5.010423774365336e-05, + 5.131187572260387e-05 + ], + "bp_grad_norms_F": [ + 0.0025542855728417635, + 0.0021727080456912518, + 0.002010831143707037, + 0.0019116367911919951, + 0.0019338354468345642 + ], + "gamma_dfa": NaN, + "acc_eval": 0.396484375, + "loss_eval": 1.6637382507324219, + "epoch": 1 + }, + { + "hidden_norms": [ + 94.79721069335938, + 98.6406021118164, + 103.38369750976562, + 111.4940185546875, + 118.88549041748047 + ], + "bp_grad_norms_per_sample_med": [ + 4.842087219003588e-05, + 4.405825529829599e-05, + 4.263824666850269e-05, + 4.2027873860206455e-05, + 4.283937960281037e-05 + ], + "bp_grad_norms_F": [ + 0.0020658739376813173, + 0.001806268934160471, + 0.001665781601332128, + 0.0015872427029535174, + 0.0015909546054899693 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4541015625, + "loss_eval": 1.5350896120071411, + "epoch": 2 + }, + { + "hidden_norms": [ + 112.59109497070312, + 116.00851440429688, + 118.50328063964844, + 125.58804321289062, + 132.86842346191406 + ], + "bp_grad_norms_per_sample_med": [ + 4.3564141378737986e-05, + 4.136884308536537e-05, + 4.064830864081159e-05, + 3.9523682062281296e-05, + 3.8838741602376103e-05 + ], + "bp_grad_norms_F": [ + 0.00200729351490736, + 0.001785867614671588, + 0.0016562910750508308, + 0.0015452943043783307, + 0.0015010037459433079 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4814453125, + "loss_eval": 1.449176549911499, + "epoch": 3 + }, + { + "hidden_norms": [ + 124.81511688232422, + 128.57049560546875, + 129.71421813964844, + 136.4766387939453, + 142.1854705810547 + ], + "bp_grad_norms_per_sample_med": [ + 4.382780389278196e-05, + 4.2459021642571315e-05, + 4.143684418522753e-05, + 4.0614067984279245e-05, + 3.921420648111962e-05 + ], + "bp_grad_norms_F": [ + 0.0018197334138676524, + 0.0016814853297546506, + 0.0015934663824737072, + 0.0015063106548041105, + 0.0014485444407910109 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4970703125, + "loss_eval": 1.4218697547912598, + "epoch": 4 + }, + { + "hidden_norms": [ + 138.24440002441406, + 140.13018798828125, + 141.3839874267578, + 147.2488555908203, + 155.097412109375 + ], + "bp_grad_norms_per_sample_med": [ + 4.045376044814475e-05, + 4.011149940197356e-05, + 3.9452468627132475e-05, + 3.831404319498688e-05, + 3.721412576851435e-05 + ], + "bp_grad_norms_F": [ + 0.0017204430187121034, + 0.0016258049290627241, + 0.001551075023598969, + 0.0014644934562966228, + 0.0013933938462287188 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5078125, + "loss_eval": 1.3836241960525513, + "epoch": 5 + }, + { + "hidden_norms": [ + 152.11605834960938, + 153.1806182861328, + 153.2488555908203, + 159.2217559814453, + 167.07318115234375 + ], + "bp_grad_norms_per_sample_med": [ + 3.981084591941908e-05, + 3.969454701291397e-05, + 3.9165588532341644e-05, + 3.808845940511674e-05, + 3.58163051714655e-05 + ], + "bp_grad_norms_F": [ + 0.0017226944910362363, + 0.001611364888958633, + 0.0015574879944324493, + 0.001471089432016015, + 0.001374671934172511 + ], + "gamma_dfa": NaN, + "acc_eval": 0.525390625, + "loss_eval": 1.372281551361084, + "epoch": 6 + }, + { + "hidden_norms": [ + 161.75347900390625, + 163.58787536621094, + 163.35731506347656, + 170.1693115234375, + 177.47879028320312 + ], + "bp_grad_norms_per_sample_med": [ + 3.749227471416816e-05, + 3.707691575982608e-05, + 3.776738958549686e-05, + 3.692766040330753e-05, + 3.5146917070960626e-05 + ], + "bp_grad_norms_F": [ + 0.0016339722787961364, + 0.00156014587264508, + 0.0015048144850879908, + 0.00141648028511554, + 0.0013256004313006997 + ], + "gamma_dfa": NaN, + "acc_eval": 0.515625, + "loss_eval": 1.345876693725586, + "epoch": 7 + }, + { + "hidden_norms": [ + 171.66441345214844, + 171.10499572753906, + 169.24270629882812, + 175.52674865722656, + 182.4739990234375 + ], + "bp_grad_norms_per_sample_med": [ + 3.675510379252955e-05, + 3.6888646718580276e-05, + 3.695035775308497e-05, + 3.644685784820467e-05, + 3.359343099873513e-05 + ], + "bp_grad_norms_F": [ + 0.0016642085975036025, + 0.0015915494877845049, + 0.0015412021894007921, + 0.0014428672147914767, + 0.0013226643204689026 + ], + "gamma_dfa": NaN, + "acc_eval": 0.548828125, + "loss_eval": 1.323807954788208, + "epoch": 8 + }, + { + "hidden_norms": [ + 177.58766174316406, + 178.5358123779297, + 176.316650390625, + 182.18365478515625, + 188.81033325195312 + ], + "bp_grad_norms_per_sample_med": [ + 3.550657493178733e-05, + 3.561190533218905e-05, + 3.632329753600061e-05, + 3.5655833926284686e-05, + 3.342977652209811e-05 + ], + "bp_grad_norms_F": [ + 0.0016174933407455683, + 0.0015753052430227399, + 0.0015375673538073897, + 0.001461501931771636, + 0.0013270385097712278 + ], + "gamma_dfa": NaN, + "acc_eval": 0.54296875, + "loss_eval": 1.323765754699707, + "epoch": 9 + }, + { + "hidden_norms": [ + 186.0078125, + 185.2810821533203, + 182.9329833984375, + 188.10736083984375, + 195.3680877685547 + ], + "bp_grad_norms_per_sample_med": [ + 3.5615968954516575e-05, + 3.5252433008281514e-05, + 3.600740819820203e-05, + 3.5232467780588195e-05, + 3.2765579817350954e-05 + ], + "bp_grad_norms_F": [ + 0.0015362550038844347, + 0.001510681351646781, + 0.0014847773127257824, + 0.0014146054163575172, + 0.00128385319840163 + ], + "gamma_dfa": NaN, + "acc_eval": 0.544921875, + "loss_eval": 1.2933119535446167, + "epoch": 10 + }, + { + "hidden_norms": [ + 193.46343994140625, + 194.1528778076172, + 190.9546661376953, + 196.03440856933594, + 201.5336151123047 + ], + "bp_grad_norms_per_sample_med": [ + 3.449141877354123e-05, + 3.581260534701869e-05, + 3.6061541322851554e-05, + 3.5576940717874095e-05, + 3.29486902046483e-05 + ], + "bp_grad_norms_F": [ + 0.0015161881456151605, + 0.0014996343525126576, + 0.001473701442591846, + 0.0013998147333040833, + 0.0012604170478880405 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5556640625, + "loss_eval": 1.2653318643569946, + "epoch": 11 + }, + { + "hidden_norms": [ + 200.17047119140625, + 198.5863037109375, + 196.08795166015625, + 200.61297607421875, + 208.13084411621094 + ], + "bp_grad_norms_per_sample_med": [ + 3.377814937266521e-05, + 3.471539093879983e-05, + 3.4731467167148367e-05, + 3.4925535146612674e-05, + 3.2187374017667025e-05 + ], + "bp_grad_norms_F": [ + 0.0014635181287303567, + 0.0014519579708576202, + 0.001435206620953977, + 0.0013784168986603618, + 0.0012511539971455932 + ], + "gamma_dfa": NaN, + "acc_eval": 0.546875, + "loss_eval": 1.2704923152923584, + "epoch": 12 + }, + { + "hidden_norms": [ + 203.8260955810547, + 203.86688232421875, + 200.01004028320312, + 204.2325439453125, + 211.52891540527344 + ], + "bp_grad_norms_per_sample_med": [ + 3.5213015507906675e-05, + 3.635779648902826e-05, + 3.70470697816927e-05, + 3.6254354199627414e-05, + 3.324731005704962e-05 + ], + "bp_grad_norms_F": [ + 0.0014951277989894152, + 0.0014758999459445477, + 0.0014606777112931013, + 0.0014066072180867195, + 0.0012636061292141676 + ], + "gamma_dfa": NaN, + "acc_eval": 0.533203125, + "loss_eval": 1.2718024253845215, + "epoch": 13 + }, + { + "hidden_norms": [ + 211.8421630859375, + 209.4982147216797, + 206.025634765625, + 210.11019897460938, + 216.48568725585938 + ], + "bp_grad_norms_per_sample_med": [ + 3.425328395678662e-05, + 3.4357526601525024e-05, + 3.5312823456479236e-05, + 3.490734161459841e-05, + 3.1354313250631094e-05 + ], + "bp_grad_norms_F": [ + 0.0015326166758313775, + 0.0015238082269206643, + 0.0015112065011635423, + 0.0014346316456794739, + 0.0012716582277789712 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5595703125, + "loss_eval": 1.2611415386199951, + "epoch": 14 + }, + { + "hidden_norms": [ + 220.0836639404297, + 218.3101806640625, + 212.22019958496094, + 216.97576904296875, + 224.16114807128906 + ], + "bp_grad_norms_per_sample_med": [ + 3.320865289424546e-05, + 3.393836959730834e-05, + 3.4554454032331705e-05, + 3.380324415047653e-05, + 3.0850649636704475e-05 + ], + "bp_grad_norms_F": [ + 0.0015296684578061104, + 0.0015227487310767174, + 0.0015054721152409911, + 0.0014223494799807668, + 0.0012559365713968873 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5615234375, + "loss_eval": 1.2511423826217651, + "epoch": 15 + }, + { + "hidden_norms": [ + 223.3075714111328, + 219.4958953857422, + 213.75701904296875, + 219.41580200195312, + 223.92572021484375 + ], + "bp_grad_norms_per_sample_med": [ + 3.406661926419474e-05, + 3.485638080746867e-05, + 3.5736342397285625e-05, + 3.5617544199340045e-05, + 3.142367859254591e-05 + ], + "bp_grad_norms_F": [ + 0.001539028249680996, + 0.0015256714541465044, + 0.0015207449905574322, + 0.001449243980459869, + 0.0012804584112018347 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5478515625, + "loss_eval": 1.2619048357009888, + "epoch": 16 + }, + { + "hidden_norms": [ + 229.43417358398438, + 224.83290100097656, + 218.015869140625, + 221.56915283203125, + 228.59274291992188 + ], + "bp_grad_norms_per_sample_med": [ + 3.325551369925961e-05, + 3.411810757825151e-05, + 3.506721623125486e-05, + 3.451627344475128e-05, + 3.0976541893323883e-05 + ], + "bp_grad_norms_F": [ + 0.001564670237712562, + 0.0015591747360303998, + 0.0015565806534141302, + 0.001464744214899838, + 0.0012746548745781183 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5498046875, + "loss_eval": 1.2594949007034302, + "epoch": 17 + }, + { + "hidden_norms": [ + 233.65724182128906, + 228.65892028808594, + 223.14169311523438, + 227.2765350341797, + 233.75588989257812 + ], + "bp_grad_norms_per_sample_med": [ + 3.4493146813474596e-05, + 3.510132592055015e-05, + 3.669387297122739e-05, + 3.577200186555274e-05, + 3.192189251421951e-05 + ], + "bp_grad_norms_F": [ + 0.0015125939389690757, + 0.0015123466728255153, + 0.0015171029372140765, + 0.0014489478198811412, + 0.001258584321476519 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5595703125, + "loss_eval": 1.2556639909744263, + "epoch": 18 + }, + { + "hidden_norms": [ + 237.43548583984375, + 232.39987182617188, + 227.10951232910156, + 230.72291564941406, + 237.13616943359375 + ], + "bp_grad_norms_per_sample_med": [ + 3.340727198519744e-05, + 3.450348594924435e-05, + 3.5213739465689287e-05, + 3.445050970185548e-05, + 3.137766179861501e-05 + ], + "bp_grad_norms_F": [ + 0.0015336342621594667, + 0.0015343877021223307, + 0.0015299322549253702, + 0.0014644783223047853, + 0.0012699750950559974 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.2415752410888672, + "epoch": 19 + }, + { + "hidden_norms": [ + 240.3662109375, + 235.49240112304688, + 227.54061889648438, + 233.16600036621094, + 239.60838317871094 + ], + "bp_grad_norms_per_sample_med": [ + 3.387282777111977e-05, + 3.518611265462823e-05, + 3.594699956011027e-05, + 3.514933632686734e-05, + 3.159138941555284e-05 + ], + "bp_grad_norms_F": [ + 0.0015161214396357536, + 0.0015244479291141033, + 0.0015337818767875433, + 0.0014538948889821768, + 0.0012562318006530404 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.2436577081680298, + "epoch": 20 + }, + { + "hidden_norms": [ + 246.6840057373047, + 239.0929412841797, + 228.7230682373047, + 233.1182403564453, + 237.92440795898438 + ], + "bp_grad_norms_per_sample_med": [ + 3.365568773006089e-05, + 3.4782005968736485e-05, + 3.604988887673244e-05, + 3.48928188032005e-05, + 3.140935586998239e-05 + ], + "bp_grad_norms_F": [ + 0.0015826384769752622, + 0.0015907500637695193, + 0.0016004826175048947, + 0.0015078946016728878, + 0.0012762312544509768 + ], + "gamma_dfa": NaN, + "acc_eval": 0.578125, + "loss_eval": 1.2292213439941406, + "epoch": 21 + }, + { + "hidden_norms": [ + 248.95265197753906, + 241.59408569335938, + 233.2073211669922, + 236.39898681640625, + 243.02566528320312 + ], + "bp_grad_norms_per_sample_med": [ + 3.3556283597135916e-05, + 3.463738539721817e-05, + 3.5712662793230265e-05, + 3.4992117434740067e-05, + 3.1405961635755375e-05 + ], + "bp_grad_norms_F": [ + 0.0015417077811434865, + 0.0015624086372554302, + 0.00158181122969836, + 0.0014982762513682246, + 0.001269534695893526 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5712890625, + "loss_eval": 1.201985239982605, + "epoch": 22 + }, + { + "hidden_norms": [ + 250.6766815185547, + 243.67706298828125, + 236.90567016601562, + 240.1038360595703, + 244.89207458496094 + ], + "bp_grad_norms_per_sample_med": [ + 3.3543499739607796e-05, + 3.4865890484070405e-05, + 3.564134021871723e-05, + 3.4787921322276816e-05, + 3.112335252808407e-05 + ], + "bp_grad_norms_F": [ + 0.0015237597981467843, + 0.0015382410492748022, + 0.0015483599854633212, + 0.0014793339651077986, + 0.0012637422187253833 + ], + "gamma_dfa": NaN, + "acc_eval": 0.55859375, + "loss_eval": 1.2245514392852783, + "epoch": 23 + }, + { + "hidden_norms": [ + 256.1240539550781, + 248.83609008789062, + 240.2549285888672, + 243.1914825439453, + 248.11964416503906 + ], + "bp_grad_norms_per_sample_med": [ + 3.322990596643649e-05, + 3.523347186273895e-05, + 3.6828067095484585e-05, + 3.5215769457863644e-05, + 3.133456266368739e-05 + ], + "bp_grad_norms_F": [ + 0.0015543467598035932, + 0.0015818241517990828, + 0.0015992531552910805, + 0.001527936663478613, + 0.0012819069670513272 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5732421875, + "loss_eval": 1.2261133193969727, + "epoch": 24 + }, + { + "hidden_norms": [ + 256.9990234375, + 248.78497314453125, + 239.55239868164062, + 243.13818359375, + 249.48153686523438 + ], + "bp_grad_norms_per_sample_med": [ + 3.39320904458873e-05, + 3.600086711230688e-05, + 3.7119287298992276e-05, + 3.6292254662839696e-05, + 3.193991506122984e-05 + ], + "bp_grad_norms_F": [ + 0.0015332578914240003, + 0.00156042305752635, + 0.001574728754349053, + 0.0015015782555565238, + 0.0012670031283050776 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5771484375, + "loss_eval": 1.2080682516098022, + "epoch": 25 + }, + { + "hidden_norms": [ + 260.4493103027344, + 251.83595275878906, + 240.95025634765625, + 242.58055114746094, + 247.42816162109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.4877586585935205e-05, + 3.68267938029021e-05, + 3.760240360861644e-05, + 3.5770553949987516e-05, + 3.202233710908331e-05 + ], + "bp_grad_norms_F": [ + 0.0016203002305701375, + 0.0016500651836395264, + 0.0016584799159318209, + 0.0015617734752595425, + 0.00129653827752918 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5576171875, + "loss_eval": 1.2154628038406372, + "epoch": 26 + }, + { + "hidden_norms": [ + 263.1241760253906, + 253.4596405029297, + 243.6095733642578, + 245.4304656982422, + 250.32362365722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.480416853562929e-05, + 3.640647264546715e-05, + 3.738802479347214e-05, + 3.5808730899589136e-05, + 3.25721557601355e-05 + ], + "bp_grad_norms_F": [ + 0.0015986696816980839, + 0.0016261462587863207, + 0.0016554947942495346, + 0.0015633245930075645, + 0.0013003128115087748 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5634765625, + "loss_eval": 1.2160842418670654, + "epoch": 27 + }, + { + "hidden_norms": [ + 266.5273132324219, + 256.0182189941406, + 245.50253295898438, + 246.18280029296875, + 251.716064453125 + ], + "bp_grad_norms_per_sample_med": [ + 3.359848051331937e-05, + 3.572113564587198e-05, + 3.695064515341073e-05, + 3.506165376165882e-05, + 3.114769424428232e-05 + ], + "bp_grad_norms_F": [ + 0.0016088238917291164, + 0.0016375494888052344, + 0.0016567507991567254, + 0.0015764845302328467, + 0.001285399659536779 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58203125, + "loss_eval": 1.2021496295928955, + "epoch": 28 + }, + { + "hidden_norms": [ + 267.4769592285156, + 258.21368408203125, + 248.0418701171875, + 248.66949462890625, + 253.77452087402344 + ], + "bp_grad_norms_per_sample_med": [ + 3.400501736905426e-05, + 3.611011925386265e-05, + 3.7168374547036365e-05, + 3.569516775314696e-05, + 3.031879896298051e-05 + ], + "bp_grad_norms_F": [ + 0.0015880028950050473, + 0.0016197538934648037, + 0.001652923645451665, + 0.0015723761171102524, + 0.00128253607545048 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5771484375, + "loss_eval": 1.2029783725738525, + "epoch": 29 + }, + { + "hidden_norms": [ + 268.6047668457031, + 256.4200744628906, + 246.27796936035156, + 246.51229858398438, + 250.08482360839844 + ], + "bp_grad_norms_per_sample_med": [ + 3.425245813559741e-05, + 3.6405861465027556e-05, + 3.752295742742717e-05, + 3.6318160709924996e-05, + 3.103434937656857e-05 + ], + "bp_grad_norms_F": [ + 0.0017358324257656932, + 0.0017647893400862813, + 0.0017767423996701837, + 0.0016745994798839092, + 0.0013456137385219336 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5859375, + "loss_eval": 1.2118260860443115, + "epoch": 30 + }, + { + "hidden_norms": [ + 270.9348449707031, + 260.40045166015625, + 250.72512817382812, + 251.9379425048828, + 254.6614227294922 + ], + "bp_grad_norms_per_sample_med": [ + 3.491883762762882e-05, + 3.647417179308832e-05, + 3.8068057619966567e-05, + 3.653564635897055e-05, + 3.172537253703922e-05 + ], + "bp_grad_norms_F": [ + 0.0015994011191651225, + 0.0016339519061148167, + 0.0016624036943539977, + 0.0015806201845407486, + 0.0013034256407991052 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5849609375, + "loss_eval": 1.1830923557281494, + "epoch": 31 + }, + { + "hidden_norms": [ + 274.6016845703125, + 262.9326477050781, + 250.766357421875, + 252.1786346435547, + 254.2251739501953 + ], + "bp_grad_norms_per_sample_med": [ + 3.4794014936778694e-05, + 3.6746245314134285e-05, + 3.771794217755087e-05, + 3.6664638173533604e-05, + 3.1814517569728196e-05 + ], + "bp_grad_norms_F": [ + 0.0016584239201620221, + 0.0016917918110266328, + 0.001726189162582159, + 0.0016276866663247347, + 0.0013194811763241887 + ], + "gamma_dfa": NaN, + "acc_eval": 0.578125, + "loss_eval": 1.1851024627685547, + "epoch": 32 + }, + { + "hidden_norms": [ + 273.59783935546875, + 261.92218017578125, + 250.27320861816406, + 251.19146728515625, + 255.70233154296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.505383210722357e-05, + 3.6710382119053975e-05, + 3.839766577584669e-05, + 3.708387885126285e-05, + 3.1251351174432784e-05 + ], + "bp_grad_norms_F": [ + 0.0016781548038125038, + 0.0017169808270409703, + 0.0017399545758962631, + 0.0016386040952056646, + 0.0013246783055365086 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5712890625, + "loss_eval": 1.1789460182189941, + "epoch": 33 + }, + { + "hidden_norms": [ + 274.9112854003906, + 262.3539123535156, + 251.67474365234375, + 253.08824157714844, + 255.4647979736328 + ], + "bp_grad_norms_per_sample_med": [ + 3.4545508242445067e-05, + 3.622366421041079e-05, + 3.7300182157196105e-05, + 3.594972440623678e-05, + 3.1557658076053485e-05 + ], + "bp_grad_norms_F": [ + 0.001666227588430047, + 0.0016955926548689604, + 0.0017251977697014809, + 0.0016294753877446055, + 0.001327820005826652 + ], + "gamma_dfa": NaN, + "acc_eval": 0.583984375, + "loss_eval": 1.1757192611694336, + "epoch": 34 + }, + { + "hidden_norms": [ + 273.9092712402344, + 261.26507568359375, + 250.60923767089844, + 250.5943145751953, + 253.19862365722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.532320988597348e-05, + 3.7557252653641626e-05, + 3.882365126628429e-05, + 3.676790583995171e-05, + 3.2376574381487444e-05 + ], + "bp_grad_norms_F": [ + 0.001686039031483233, + 0.0017200085567310452, + 0.0017563666915521026, + 0.0016565105179324746, + 0.0013397492002695799 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1719229221343994, + "epoch": 35 + }, + { + "hidden_norms": [ + 275.9344177246094, + 265.1002502441406, + 253.2598114013672, + 253.86024475097656, + 257.8154296875 + ], + "bp_grad_norms_per_sample_med": [ + 3.419027416384779e-05, + 3.54782423528377e-05, + 3.770734474528581e-05, + 3.707608630065806e-05, + 3.1706651498097926e-05 + ], + "bp_grad_norms_F": [ + 0.0016564616234973073, + 0.001694328966550529, + 0.001729298266582191, + 0.0016409243689849973, + 0.0013242866843938828 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.169456958770752, + "epoch": 36 + }, + { + "hidden_norms": [ + 277.0843200683594, + 263.2900390625, + 250.48553466796875, + 251.51341247558594, + 253.14413452148438 + ], + "bp_grad_norms_per_sample_med": [ + 3.5850312997354195e-05, + 3.7839381548110396e-05, + 3.925598502974026e-05, + 3.7184508983045816e-05, + 3.174091762048192e-05 + ], + "bp_grad_norms_F": [ + 0.0017717990558594465, + 0.0018099851440638304, + 0.0018417692044749856, + 0.0017209915677085519, + 0.0013732420047745109 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5869140625, + "loss_eval": 1.1764099597930908, + "epoch": 37 + }, + { + "hidden_norms": [ + 280.2084655761719, + 265.3043518066406, + 254.26673889160156, + 253.3932342529297, + 255.91488647460938 + ], + "bp_grad_norms_per_sample_med": [ + 3.4716471418505535e-05, + 3.675218249554746e-05, + 3.84828781534452e-05, + 3.653839303296991e-05, + 3.1539821065962315e-05 + ], + "bp_grad_norms_F": [ + 0.00171388138551265, + 0.0017648075008764863, + 0.00180675252340734, + 0.0016973463352769613, + 0.0013539392966777086 + ], + "gamma_dfa": NaN, + "acc_eval": 0.591796875, + "loss_eval": 1.1670037508010864, + "epoch": 38 + }, + { + "hidden_norms": [ + 278.0702209472656, + 264.4510498046875, + 250.75350952148438, + 248.73284912109375, + 253.1072540283203 + ], + "bp_grad_norms_per_sample_med": [ + 3.694290717248805e-05, + 3.843691956717521e-05, + 3.982238922617398e-05, + 3.8299614971037954e-05, + 3.253731847507879e-05 + ], + "bp_grad_norms_F": [ + 0.0017997974064201117, + 0.0018521619495004416, + 0.0018853276269510388, + 0.001754313474521041, + 0.0013789198128506541 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.168372631072998, + "epoch": 39 + }, + { + "hidden_norms": [ + 279.5745849609375, + 265.3549499511719, + 252.89109802246094, + 250.0029296875, + 251.57737731933594 + ], + "bp_grad_norms_per_sample_med": [ + 3.5274497349746525e-05, + 3.741122054634616e-05, + 3.8946731365285814e-05, + 3.7627731217071414e-05, + 3.1920495530357584e-05 + ], + "bp_grad_norms_F": [ + 0.0017959685064852238, + 0.0018515808042138815, + 0.001886399113573134, + 0.0017732164124026895, + 0.001389715587720275 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5966796875, + "loss_eval": 1.1735193729400635, + "epoch": 40 + }, + { + "hidden_norms": [ + 280.56402587890625, + 265.1068115234375, + 251.912353515625, + 248.08627319335938, + 250.21177673339844 + ], + "bp_grad_norms_per_sample_med": [ + 3.672741513582878e-05, + 3.8823065551696345e-05, + 4.041267675347626e-05, + 3.835778989014216e-05, + 3.2424144592368975e-05 + ], + "bp_grad_norms_F": [ + 0.0018404219299554825, + 0.0018969813827425241, + 0.0019448500825092196, + 0.0018052044324576855, + 0.0014045372372493148 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5966796875, + "loss_eval": 1.163725733757019, + "epoch": 41 + }, + { + "hidden_norms": [ + 281.2812194824219, + 266.5726623535156, + 253.18124389648438, + 252.3292694091797, + 254.1314697265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.6245146475266665e-05, + 3.849809218081646e-05, + 4.034954326925799e-05, + 3.857027695630677e-05, + 3.267046849941835e-05 + ], + "bp_grad_norms_F": [ + 0.0018043599557131529, + 0.0018654613522812724, + 0.0018976799910888076, + 0.0017763315699994564, + 0.0013986497651785612 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5830078125, + "loss_eval": 1.172363519668579, + "epoch": 42 + }, + { + "hidden_norms": [ + 278.3638916015625, + 264.4734802246094, + 250.60198974609375, + 248.59568786621094, + 249.39353942871094 + ], + "bp_grad_norms_per_sample_med": [ + 3.7236037314869463e-05, + 3.946686410927214e-05, + 4.103714309167117e-05, + 3.970286707044579e-05, + 3.281752287875861e-05 + ], + "bp_grad_norms_F": [ + 0.0018646781099960208, + 0.0019272645004093647, + 0.0019672266207635403, + 0.001839098404161632, + 0.0014395405305549502 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5830078125, + "loss_eval": 1.1776624917984009, + "epoch": 43 + }, + { + "hidden_norms": [ + 280.8514099121094, + 269.1718444824219, + 253.03790283203125, + 251.60220336914062, + 251.88168334960938 + ], + "bp_grad_norms_per_sample_med": [ + 3.689880759338848e-05, + 3.937961082556285e-05, + 4.092283779755235e-05, + 3.866894985549152e-05, + 3.262344398535788e-05 + ], + "bp_grad_norms_F": [ + 0.0018725661793723702, + 0.0019201217219233513, + 0.0019532060250639915, + 0.0018317755311727524, + 0.001439971849322319 + ], + "gamma_dfa": NaN, + "acc_eval": 0.595703125, + "loss_eval": 1.1693906784057617, + "epoch": 44 + }, + { + "hidden_norms": [ + 280.3335266113281, + 263.89471435546875, + 253.01638793945312, + 250.5576171875, + 251.4005889892578 + ], + "bp_grad_norms_per_sample_med": [ + 3.6666475352831185e-05, + 3.875952461385168e-05, + 4.0531358536100015e-05, + 3.9068203477654606e-05, + 3.450641088420525e-05 + ], + "bp_grad_norms_F": [ + 0.0018578553572297096, + 0.0019184533739462495, + 0.001965942559763789, + 0.0018550093518570065, + 0.0014542803401127458 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5732421875, + "loss_eval": 1.1839377880096436, + "epoch": 45 + }, + { + "hidden_norms": [ + 280.3553771972656, + 263.3617248535156, + 248.94859313964844, + 246.9832000732422, + 246.24644470214844 + ], + "bp_grad_norms_per_sample_med": [ + 3.8412734284065664e-05, + 4.001844354206696e-05, + 4.220755727146752e-05, + 4.0393635572399944e-05, + 3.391467180335894e-05 + ], + "bp_grad_norms_F": [ + 0.001917686895467341, + 0.0019766101613640785, + 0.0020170181524008512, + 0.0018900329014286399, + 0.001476101577281952 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6005859375, + "loss_eval": 1.1689397096633911, + "epoch": 46 + }, + { + "hidden_norms": [ + 278.8861389160156, + 263.3866882324219, + 249.24301147460938, + 246.43963623046875, + 246.34503173828125 + ], + "bp_grad_norms_per_sample_med": [ + 3.77853139070794e-05, + 4.044857996632345e-05, + 4.182702468824573e-05, + 4.050548523082398e-05, + 3.3606509532546625e-05 + ], + "bp_grad_norms_F": [ + 0.0019284948939457536, + 0.001992136472836137, + 0.0020461773965507746, + 0.001900508883409202, + 0.001466717105358839 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.1585946083068848, + "epoch": 47 + }, + { + "hidden_norms": [ + 279.963623046875, + 263.52496337890625, + 249.6890869140625, + 245.60646057128906, + 245.52540588378906 + ], + "bp_grad_norms_per_sample_med": [ + 3.724947964656167e-05, + 3.964625648222864e-05, + 4.1545175918145105e-05, + 3.953047780669294e-05, + 3.275729977758601e-05 + ], + "bp_grad_norms_F": [ + 0.0019616533536463976, + 0.002027863636612892, + 0.0020759752951562405, + 0.0019283785950392485, + 0.001484199776314199 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6123046875, + "loss_eval": 1.157920002937317, + "epoch": 48 + }, + { + "hidden_norms": [ + 279.7983093261719, + 263.42352294921875, + 247.6257781982422, + 244.5139923095703, + 242.93429565429688 + ], + "bp_grad_norms_per_sample_med": [ + 3.738125451491214e-05, + 4.007351162726991e-05, + 4.2600284359650686e-05, + 4.0704209823161364e-05, + 3.302833283669315e-05 + ], + "bp_grad_norms_F": [ + 0.001973477192223072, + 0.002032764023169875, + 0.0020790304988622665, + 0.0019371822709217668, + 0.0014914683997631073 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6005859375, + "loss_eval": 1.1545627117156982, + "epoch": 49 + }, + { + "hidden_norms": [ + 278.16461181640625, + 259.95208740234375, + 246.212890625, + 243.02810668945312, + 242.42227172851562 + ], + "bp_grad_norms_per_sample_med": [ + 3.896220732713118e-05, + 4.0713552152737975e-05, + 4.242185241309926e-05, + 4.1096616769209504e-05, + 3.4584638342494145e-05 + ], + "bp_grad_norms_F": [ + 0.0020273446571081877, + 0.0020888603758066893, + 0.0021337512880563736, + 0.0019914479926228523, + 0.0015125740319490433 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.1588966846466064, + "epoch": 50 + }, + { + "hidden_norms": [ + 278.74609375, + 259.810302734375, + 244.75640869140625, + 241.40191650390625, + 241.2429962158203 + ], + "bp_grad_norms_per_sample_med": [ + 4.005424489150755e-05, + 4.289989738026634e-05, + 4.383309351396747e-05, + 4.207885649520904e-05, + 3.527112494339235e-05 + ], + "bp_grad_norms_F": [ + 0.002059010788798332, + 0.002119551645591855, + 0.002172222128137946, + 0.0020189452916383743, + 0.0015335450880229473 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1555505990982056, + "epoch": 51 + }, + { + "hidden_norms": [ + 277.6565246582031, + 262.0436096191406, + 246.2357635498047, + 241.67991638183594, + 240.23500061035156 + ], + "bp_grad_norms_per_sample_med": [ + 4.1031005821423605e-05, + 4.313238605391234e-05, + 4.465782694751397e-05, + 4.2896612285403535e-05, + 3.4334370866417885e-05 + ], + "bp_grad_norms_F": [ + 0.002025892725214362, + 0.0020990471821278334, + 0.0021509609650820494, + 0.002011507283896208, + 0.0015318752266466618 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1416809558868408, + "epoch": 52 + }, + { + "hidden_norms": [ + 277.4100646972656, + 260.2519836425781, + 245.48947143554688, + 242.5662384033203, + 241.2648162841797 + ], + "bp_grad_norms_per_sample_med": [ + 3.732202821993269e-05, + 3.9125570765463635e-05, + 4.136607458349317e-05, + 3.977569213020615e-05, + 3.3676675229799e-05 + ], + "bp_grad_norms_F": [ + 0.002009452786296606, + 0.002076543401926756, + 0.002131648361682892, + 0.00199576816521585, + 0.0015338497469201684 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.143639087677002, + "epoch": 53 + }, + { + "hidden_norms": [ + 277.3269348144531, + 259.49072265625, + 243.7945098876953, + 240.342041015625, + 238.76239013671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.978172389906831e-05, + 4.20100441260729e-05, + 4.455841553863138e-05, + 4.2333795136073604e-05, + 3.435015969444066e-05 + ], + "bp_grad_norms_F": [ + 0.0020786102395504713, + 0.0021364488638937473, + 0.0021890606731176376, + 0.0020492339972406626, + 0.0015625122468918562 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6044921875, + "loss_eval": 1.1515132188796997, + "epoch": 54 + }, + { + "hidden_norms": [ + 276.1414489746094, + 257.6651306152344, + 242.12867736816406, + 238.3046875, + 235.9711151123047 + ], + "bp_grad_norms_per_sample_med": [ + 4.158447700319812e-05, + 4.40051153418608e-05, + 4.566523784887977e-05, + 4.3018761061830446e-05, + 3.456107515376061e-05 + ], + "bp_grad_norms_F": [ + 0.0021895321551710367, + 0.0022726275492459536, + 0.00232017133384943, + 0.002137792995199561, + 0.0015979791060090065 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.148828148841858, + "epoch": 55 + }, + { + "hidden_norms": [ + 276.29547119140625, + 257.9006652832031, + 242.25363159179688, + 237.8865966796875, + 235.57620239257812 + ], + "bp_grad_norms_per_sample_med": [ + 3.9041460695443675e-05, + 4.0436327253701165e-05, + 4.2260016925865784e-05, + 4.071593502885662e-05, + 3.461613232502714e-05 + ], + "bp_grad_norms_F": [ + 0.0021726686973124743, + 0.002256714040413499, + 0.0023172625806182623, + 0.0021478317212313414, + 0.0016112272860482335 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.165194034576416, + "epoch": 56 + }, + { + "hidden_norms": [ + 274.73480224609375, + 257.3844909667969, + 239.9276580810547, + 236.4628448486328, + 232.49490356445312 + ], + "bp_grad_norms_per_sample_med": [ + 4.182914926786907e-05, + 4.482160511543043e-05, + 4.732825618702918e-05, + 4.5475029764929786e-05, + 3.673886021715589e-05 + ], + "bp_grad_norms_F": [ + 0.002222857205197215, + 0.0022976247128099203, + 0.002366685541346669, + 0.002194431144744158, + 0.0016426561633124948 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.150635004043579, + "epoch": 57 + }, + { + "hidden_norms": [ + 273.9837341308594, + 255.2301025390625, + 239.6470184326172, + 235.07806396484375, + 232.15016174316406 + ], + "bp_grad_norms_per_sample_med": [ + 4.28417552029714e-05, + 4.5315191528061405e-05, + 4.770928717334755e-05, + 4.653819996747188e-05, + 3.727963485289365e-05 + ], + "bp_grad_norms_F": [ + 0.002205377910286188, + 0.00228099524974823, + 0.002334901597350836, + 0.0021908036433160305, + 0.001635397202335298 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6064453125, + "loss_eval": 1.150489330291748, + "epoch": 58 + }, + { + "hidden_norms": [ + 273.4665222167969, + 255.21783447265625, + 238.12306213378906, + 232.99537658691406, + 229.35629272460938 + ], + "bp_grad_norms_per_sample_med": [ + 4.174295099801384e-05, + 4.412833004607819e-05, + 4.589854142977856e-05, + 4.366271969047375e-05, + 3.4910473914351314e-05 + ], + "bp_grad_norms_F": [ + 0.0022425123024731874, + 0.002337042009457946, + 0.0024111224338412285, + 0.002237174427136779, + 0.0016597777139395475 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1445674896240234, + "epoch": 59 + }, + { + "hidden_norms": [ + 272.8526306152344, + 254.31373596191406, + 238.0008087158203, + 233.6641082763672, + 229.88113403320312 + ], + "bp_grad_norms_per_sample_med": [ + 4.274978709872812e-05, + 4.589447416947223e-05, + 4.8100573621923104e-05, + 4.519677167991176e-05, + 3.628300692071207e-05 + ], + "bp_grad_norms_F": [ + 0.0022435274440795183, + 0.0023362115025520325, + 0.0024012199137359858, + 0.00223422609269619, + 0.0016617706278339028 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1417796611785889, + "epoch": 60 + }, + { + "hidden_norms": [ + 272.5745849609375, + 253.39877319335938, + 236.8953094482422, + 231.5461883544922, + 227.8491668701172 + ], + "bp_grad_norms_per_sample_med": [ + 4.257826367393136e-05, + 4.485245153773576e-05, + 4.667421308113262e-05, + 4.5228414819575846e-05, + 3.560770346666686e-05 + ], + "bp_grad_norms_F": [ + 0.0022986247204244137, + 0.002396916039288044, + 0.0024696297477930784, + 0.0022973858285695314, + 0.0016907128738239408 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6044921875, + "loss_eval": 1.1428865194320679, + "epoch": 61 + }, + { + "hidden_norms": [ + 269.6819763183594, + 250.9730682373047, + 234.21188354492188, + 228.83775329589844, + 224.82958984375 + ], + "bp_grad_norms_per_sample_med": [ + 4.29281426477246e-05, + 4.5681605115532875e-05, + 4.7611269110348076e-05, + 4.553339022095315e-05, + 3.683664544951171e-05 + ], + "bp_grad_norms_F": [ + 0.0023400019854307175, + 0.002444769022986293, + 0.0025141045916825533, + 0.002344615990296006, + 0.0017126062884926796 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1239444017410278, + "epoch": 62 + }, + { + "hidden_norms": [ + 269.7929992675781, + 250.5220947265625, + 233.3997802734375, + 228.2130584716797, + 224.5063018798828 + ], + "bp_grad_norms_per_sample_med": [ + 4.4715372496284544e-05, + 4.6482971811201423e-05, + 4.9765483709052205e-05, + 4.759176226798445e-05, + 3.8208585465326905e-05 + ], + "bp_grad_norms_F": [ + 0.0023639060091227293, + 0.002476333873346448, + 0.0025423571933060884, + 0.00236364989541471, + 0.0017294714925810695 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6162109375, + "loss_eval": 1.1502506732940674, + "epoch": 63 + }, + { + "hidden_norms": [ + 269.24493408203125, + 251.6195831298828, + 234.21717834472656, + 228.9242401123047, + 224.33628845214844 + ], + "bp_grad_norms_per_sample_med": [ + 4.4276617700234056e-05, + 4.620026084012352e-05, + 4.972432361682877e-05, + 4.657481986214407e-05, + 3.729217132786289e-05 + ], + "bp_grad_norms_F": [ + 0.0023896305356174707, + 0.002498477231711149, + 0.0025652945041656494, + 0.002390124835073948, + 0.0017562232678756118 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.146531581878662, + "epoch": 64 + }, + { + "hidden_norms": [ + 268.0794982910156, + 250.7041778564453, + 233.16966247558594, + 227.9508056640625, + 223.48045349121094 + ], + "bp_grad_norms_per_sample_med": [ + 4.518003697739914e-05, + 4.807085497304797e-05, + 5.077984678791836e-05, + 4.9026388296624646e-05, + 3.8487425626954064e-05 + ], + "bp_grad_norms_F": [ + 0.0023859951179474592, + 0.002494273241609335, + 0.0025624327827244997, + 0.0023940331302583218, + 0.0017616016557440162 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1454447507858276, + "epoch": 65 + }, + { + "hidden_norms": [ + 267.8343811035156, + 247.6757049560547, + 231.40367126464844, + 225.93670654296875, + 220.4804229736328 + ], + "bp_grad_norms_per_sample_med": [ + 4.405072468216531e-05, + 4.688911576522514e-05, + 4.961229205946438e-05, + 4.743603858514689e-05, + 3.724359339685179e-05 + ], + "bp_grad_norms_F": [ + 0.002465154742822051, + 0.0025785581674426794, + 0.002648484194651246, + 0.0024633395951241255, + 0.0017954027280211449 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.165484070777893, + "epoch": 66 + }, + { + "hidden_norms": [ + 267.8901062011719, + 248.67857360839844, + 231.63746643066406, + 225.49383544921875, + 220.6399383544922 + ], + "bp_grad_norms_per_sample_med": [ + 4.755932604894042e-05, + 4.9960097385337576e-05, + 5.191187665332109e-05, + 4.949339563609101e-05, + 3.946756987716071e-05 + ], + "bp_grad_norms_F": [ + 0.0024303828831762075, + 0.0025356977712363005, + 0.002610789379104972, + 0.00243638688698411, + 0.0017875435296446085 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1472151279449463, + "epoch": 67 + }, + { + "hidden_norms": [ + 267.3486022949219, + 247.69305419921875, + 229.9873504638672, + 223.6610870361328, + 218.91578674316406 + ], + "bp_grad_norms_per_sample_med": [ + 4.743155659525655e-05, + 5.06583419337403e-05, + 5.422766844276339e-05, + 5.0596820074133575e-05, + 3.959470632253215e-05 + ], + "bp_grad_norms_F": [ + 0.0025001303292810917, + 0.0026160534471273422, + 0.002682509133592248, + 0.002501503797248006, + 0.0018251334549859166 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.157745599746704, + "epoch": 68 + }, + { + "hidden_norms": [ + 266.2055969238281, + 246.88201904296875, + 229.0934295654297, + 223.09255981445312, + 217.90614318847656 + ], + "bp_grad_norms_per_sample_med": [ + 4.6090037358226255e-05, + 4.8821068048710003e-05, + 5.145218892721459e-05, + 4.892798824585043e-05, + 3.874724279739894e-05 + ], + "bp_grad_norms_F": [ + 0.002517222659662366, + 0.00262960116378963, + 0.002704967511817813, + 0.002524228999391198, + 0.0018283555982634425 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1513168811798096, + "epoch": 69 + }, + { + "hidden_norms": [ + 263.8387451171875, + 244.32431030273438, + 227.78903198242188, + 222.13900756835938, + 216.27389526367188 + ], + "bp_grad_norms_per_sample_med": [ + 4.680602069129236e-05, + 5.040669202571735e-05, + 5.318928378983401e-05, + 4.9446778575656936e-05, + 3.913935870514251e-05 + ], + "bp_grad_norms_F": [ + 0.0025120435748249292, + 0.0026304670609533787, + 0.0027123456820845604, + 0.002537800231948495, + 0.001847997889854014 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.1497204303741455, + "epoch": 70 + }, + { + "hidden_norms": [ + 263.52716064453125, + 243.21226501464844, + 226.427001953125, + 220.67845153808594, + 214.70176696777344 + ], + "bp_grad_norms_per_sample_med": [ + 4.6976576413726434e-05, + 5.0085352995665744e-05, + 5.2343326387926936e-05, + 4.9784572183853015e-05, + 4.0186921978602186e-05 + ], + "bp_grad_norms_F": [ + 0.0026124012656509876, + 0.0027241536881774664, + 0.002797869499772787, + 0.002603790955618024, + 0.0018792233895510435 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.153285026550293, + "epoch": 71 + }, + { + "hidden_norms": [ + 264.0121765136719, + 243.2773895263672, + 226.7365264892578, + 220.29107666015625, + 214.1591339111328 + ], + "bp_grad_norms_per_sample_med": [ + 4.6254041080828756e-05, + 4.949727008352056e-05, + 5.206605055718683e-05, + 5.012763722334057e-05, + 3.8815273001091555e-05 + ], + "bp_grad_norms_F": [ + 0.0026143237482756376, + 0.0027275518514215946, + 0.0028062777128070593, + 0.002607470378279686, + 0.0018867084290832281 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1514866352081299, + "epoch": 72 + }, + { + "hidden_norms": [ + 263.4013671875, + 243.0095672607422, + 225.4296112060547, + 219.55067443847656, + 213.40794372558594 + ], + "bp_grad_norms_per_sample_med": [ + 4.8506815801374614e-05, + 5.151949153514579e-05, + 5.5085791245801374e-05, + 5.175785190658644e-05, + 4.0316641388926655e-05 + ], + "bp_grad_norms_F": [ + 0.002606831956654787, + 0.002728143008425832, + 0.0028109808918088675, + 0.0026184367015957832, + 0.0018970600795000792 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1346663236618042, + "epoch": 73 + }, + { + "hidden_norms": [ + 262.27703857421875, + 242.7241668701172, + 224.5229949951172, + 218.4025115966797, + 212.19247436523438 + ], + "bp_grad_norms_per_sample_med": [ + 4.704251477960497e-05, + 5.0965834816452116e-05, + 5.3327348723541945e-05, + 5.0449500122340396e-05, + 4.0479797462467104e-05 + ], + "bp_grad_norms_F": [ + 0.0026277368888258934, + 0.0027542279567569494, + 0.00283243996091187, + 0.00264621595852077, + 0.0019058829639106989 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.137591004371643, + "epoch": 74 + }, + { + "hidden_norms": [ + 262.1747131347656, + 241.88607788085938, + 224.1046142578125, + 217.9982147216797, + 211.7519989013672 + ], + "bp_grad_norms_per_sample_med": [ + 4.847371383220889e-05, + 5.121564754517749e-05, + 5.3943567763781175e-05, + 5.087414683657698e-05, + 4.037184771732427e-05 + ], + "bp_grad_norms_F": [ + 0.0026811074931174517, + 0.002809705911204219, + 0.002887698821723461, + 0.002692745067179203, + 0.0019356919219717383 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1538643836975098, + "epoch": 75 + }, + { + "hidden_norms": [ + 261.7838439941406, + 239.75706481933594, + 222.1133575439453, + 216.12124633789062, + 210.44593811035156 + ], + "bp_grad_norms_per_sample_med": [ + 4.8369467549491674e-05, + 5.07068180013448e-05, + 5.281560879666358e-05, + 5.086012970423326e-05, + 4.062180232722312e-05 + ], + "bp_grad_norms_F": [ + 0.0027064597234129906, + 0.0028339733835309744, + 0.0029109998140484095, + 0.002717787167057395, + 0.0019469966646283865 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1476709842681885, + "epoch": 76 + }, + { + "hidden_norms": [ + 260.708251953125, + 239.65792846679688, + 222.502197265625, + 216.31419372558594, + 210.15716552734375 + ], + "bp_grad_norms_per_sample_med": [ + 4.919906132272445e-05, + 5.164166941540316e-05, + 5.366719051380642e-05, + 5.108323966851458e-05, + 4.000464832643047e-05 + ], + "bp_grad_norms_F": [ + 0.002715736860409379, + 0.0028464714996516705, + 0.0029330456163734198, + 0.0027443754952400923, + 0.001961463363841176 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1511735916137695, + "epoch": 77 + }, + { + "hidden_norms": [ + 260.4088439941406, + 239.9808349609375, + 222.2389373779297, + 215.33692932128906, + 208.58534240722656 + ], + "bp_grad_norms_per_sample_med": [ + 4.8405916459159926e-05, + 5.163977766642347e-05, + 5.34093014721293e-05, + 5.167788185644895e-05, + 4.020798587589525e-05 + ], + "bp_grad_norms_F": [ + 0.0027501434087753296, + 0.0028795108664780855, + 0.0029617082327604294, + 0.002769613405689597, + 0.001984042814001441 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1523363590240479, + "epoch": 78 + }, + { + "hidden_norms": [ + 259.8567199707031, + 238.8525848388672, + 221.2687225341797, + 213.9132537841797, + 207.3290557861328 + ], + "bp_grad_norms_per_sample_med": [ + 4.8219208110822365e-05, + 5.1672555855475366e-05, + 5.364803655538708e-05, + 5.1243885536678135e-05, + 4.079756035935134e-05 + ], + "bp_grad_norms_F": [ + 0.0028046013321727514, + 0.002939376747235656, + 0.0030214993748813868, + 0.002813557395711541, + 0.0019953204318881035 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1514203548431396, + "epoch": 79 + }, + { + "hidden_norms": [ + 259.52423095703125, + 238.27757263183594, + 219.9165802001953, + 213.4214324951172, + 206.20606994628906 + ], + "bp_grad_norms_per_sample_med": [ + 4.8479021643288434e-05, + 5.219021113589406e-05, + 5.5094871640903875e-05, + 5.1899030950153247e-05, + 4.124108454561792e-05 + ], + "bp_grad_norms_F": [ + 0.0028202880639582872, + 0.002952422248199582, + 0.0030410154722630978, + 0.002832787809893489, + 0.0020088190212845802 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1545820236206055, + "epoch": 80 + }, + { + "hidden_norms": [ + 258.1958923339844, + 237.08778381347656, + 219.2870635986328, + 212.87725830078125, + 205.84408569335938 + ], + "bp_grad_norms_per_sample_med": [ + 5.005837374483235e-05, + 5.344217424863018e-05, + 5.582463927567005e-05, + 5.345495083020069e-05, + 4.113194518140517e-05 + ], + "bp_grad_norms_F": [ + 0.0028330644126981497, + 0.002965509658679366, + 0.0030466399621218443, + 0.00284536718390882, + 0.0020232615061104298 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6220703125, + "loss_eval": 1.1552448272705078, + "epoch": 81 + }, + { + "hidden_norms": [ + 258.44268798828125, + 236.90562438964844, + 218.65948486328125, + 212.63186645507812, + 204.90692138671875 + ], + "bp_grad_norms_per_sample_med": [ + 4.896440077573061e-05, + 5.1820486987708136e-05, + 5.4638629080727696e-05, + 5.3578904044115916e-05, + 4.117973367101513e-05 + ], + "bp_grad_norms_F": [ + 0.002839416265487671, + 0.0029778846073895693, + 0.003062452422454953, + 0.002849552081897855, + 0.0020236214622855186 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1515182256698608, + "epoch": 82 + }, + { + "hidden_norms": [ + 258.24615478515625, + 236.87181091308594, + 219.06484985351562, + 213.2528076171875, + 205.03671264648438 + ], + "bp_grad_norms_per_sample_med": [ + 4.8622885515214875e-05, + 5.181535379961133e-05, + 5.509376205736771e-05, + 5.2298331866040826e-05, + 4.074195385328494e-05 + ], + "bp_grad_norms_F": [ + 0.002838765038177371, + 0.00297414674423635, + 0.003058358561247587, + 0.0028491863049566746, + 0.0020313323475420475 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1609394550323486, + "epoch": 83 + }, + { + "hidden_norms": [ + 257.9989929199219, + 236.4859161376953, + 218.73072814941406, + 212.0786895751953, + 204.2919464111328 + ], + "bp_grad_norms_per_sample_med": [ + 5.0208276661578566e-05, + 5.2276191127020866e-05, + 5.509322727448307e-05, + 5.315374437486753e-05, + 4.122377504245378e-05 + ], + "bp_grad_norms_F": [ + 0.0028634185437113047, + 0.0029970910400152206, + 0.0030890253838151693, + 0.002881886437535286, + 0.0020408176351338625 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.1592046022415161, + "epoch": 84 + }, + { + "hidden_norms": [ + 257.24053955078125, + 235.7548065185547, + 217.84329223632812, + 211.033935546875, + 203.8216094970703 + ], + "bp_grad_norms_per_sample_med": [ + 5.0660164561122656e-05, + 5.414208135334775e-05, + 5.5454143875977024e-05, + 5.3000938351033255e-05, + 4.292939411243424e-05 + ], + "bp_grad_norms_F": [ + 0.0028948886319994926, + 0.003031315514817834, + 0.0031204961705952883, + 0.002907233312726021, + 0.0020496752113103867 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1583250761032104, + "epoch": 85 + }, + { + "hidden_norms": [ + 256.78289794921875, + 235.2476348876953, + 217.21603393554688, + 210.80035400390625, + 203.15478515625 + ], + "bp_grad_norms_per_sample_med": [ + 4.9510348617332056e-05, + 5.1982155127916485e-05, + 5.440499808173627e-05, + 5.1704166253330186e-05, + 4.0308059396920726e-05 + ], + "bp_grad_norms_F": [ + 0.0028964560478925705, + 0.0030334230978041887, + 0.0031210912857204676, + 0.002908239373937249, + 0.0020543786231428385 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1597179174423218, + "epoch": 86 + }, + { + "hidden_norms": [ + 256.531982421875, + 235.45941162109375, + 217.1429443359375, + 210.1690673828125, + 202.77899169921875 + ], + "bp_grad_norms_per_sample_med": [ + 4.943124076817185e-05, + 5.149367279955186e-05, + 5.385246913647279e-05, + 5.262702325126156e-05, + 4.104706385987811e-05 + ], + "bp_grad_norms_F": [ + 0.0029305708594620228, + 0.0030687344260513783, + 0.003160761669278145, + 0.002940374892205, + 0.0020649591460824013 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6220703125, + "loss_eval": 1.161116600036621, + "epoch": 87 + }, + { + "hidden_norms": [ + 256.3059387207031, + 235.24874877929688, + 217.37142944335938, + 210.53717041015625, + 203.14259338378906 + ], + "bp_grad_norms_per_sample_med": [ + 4.934536627843045e-05, + 5.2089759265072644e-05, + 5.424721530289389e-05, + 5.292960850056261e-05, + 4.041651845909655e-05 + ], + "bp_grad_norms_F": [ + 0.002913407515734434, + 0.0030489542987197638, + 0.003135726321488619, + 0.002922008978202939, + 0.002062067622318864 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.155902624130249, + "epoch": 88 + }, + { + "hidden_norms": [ + 256.7462463378906, + 235.3153839111328, + 216.87977600097656, + 210.572509765625, + 202.77845764160156 + ], + "bp_grad_norms_per_sample_med": [ + 4.990033630747348e-05, + 5.337029870133847e-05, + 5.522817809833214e-05, + 5.3465773817151785e-05, + 4.164372876402922e-05 + ], + "bp_grad_norms_F": [ + 0.0029192205984145403, + 0.0030557813588529825, + 0.003147577866911888, + 0.0029307191725820303, + 0.0020654413383454084 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6162109375, + "loss_eval": 1.1561503410339355, + "epoch": 89 + }, + { + "hidden_norms": [ + 256.68145751953125, + 234.77310180664062, + 216.7720947265625, + 209.664794921875, + 202.22833251953125 + ], + "bp_grad_norms_per_sample_med": [ + 4.9965801736107096e-05, + 5.341583164408803e-05, + 5.593279274762608e-05, + 5.420796514954418e-05, + 4.210533734294586e-05 + ], + "bp_grad_norms_F": [ + 0.002943370258435607, + 0.00308181531727314, + 0.003169203409925103, + 0.002951863221824169, + 0.0020759364124387503 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1583542823791504, + "epoch": 90 + }, + { + "hidden_norms": [ + 256.4252014160156, + 234.56448364257812, + 216.34176635742188, + 209.5242156982422, + 201.7559356689453 + ], + "bp_grad_norms_per_sample_med": [ + 4.9815931561170146e-05, + 5.2233976020943373e-05, + 5.5747830629115924e-05, + 5.41718618478626e-05, + 4.169955354882404e-05 + ], + "bp_grad_norms_F": [ + 0.0029554881621152163, + 0.0030950764194130898, + 0.0031847492791712284, + 0.0029650654178112745, + 0.002081435639411211 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.159005045890808, + "epoch": 91 + }, + { + "hidden_norms": [ + 256.15167236328125, + 234.47537231445312, + 216.2799072265625, + 209.95578002929688, + 201.94126892089844 + ], + "bp_grad_norms_per_sample_med": [ + 5.007637446396984e-05, + 5.260824036668055e-05, + 5.540058555197902e-05, + 5.322153810993768e-05, + 4.1122035327134654e-05 + ], + "bp_grad_norms_F": [ + 0.002944375155493617, + 0.00308293872512877, + 0.003174267942085862, + 0.0029555640649050474, + 0.0020777545869350433 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.1595215797424316, + "epoch": 92 + }, + { + "hidden_norms": [ + 256.1369934082031, + 234.51614379882812, + 216.30044555664062, + 209.4623565673828, + 201.70799255371094 + ], + "bp_grad_norms_per_sample_med": [ + 5.048588718636893e-05, + 5.3128016588743776e-05, + 5.624579353025183e-05, + 5.411298116086982e-05, + 4.109516885364428e-05 + ], + "bp_grad_norms_F": [ + 0.0029427227564156055, + 0.0030841128900647163, + 0.003178349928930402, + 0.0029583934228867292, + 0.002080487785860896 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1565905809402466, + "epoch": 93 + }, + { + "hidden_norms": [ + 255.9738311767578, + 234.28948974609375, + 216.3280029296875, + 209.589111328125, + 201.76205444335938 + ], + "bp_grad_norms_per_sample_med": [ + 5.070818224339746e-05, + 5.330924614099786e-05, + 5.596653136308305e-05, + 5.407314529293217e-05, + 4.100686783203855e-05 + ], + "bp_grad_norms_F": [ + 0.0029472638852894306, + 0.003088710131123662, + 0.0031828396022319794, + 0.0029631764627993107, + 0.0020829145796597004 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1584088802337646, + "epoch": 94 + }, + { + "hidden_norms": [ + 255.89332580566406, + 234.19253540039062, + 216.33103942871094, + 209.45057678222656, + 201.54258728027344 + ], + "bp_grad_norms_per_sample_med": [ + 5.041498661739752e-05, + 5.279783727019094e-05, + 5.5226330005098134e-05, + 5.407658318290487e-05, + 4.1154507925966755e-05 + ], + "bp_grad_norms_F": [ + 0.002949801040813327, + 0.00309200631454587, + 0.0031869453378021717, + 0.0029658437706530094, + 0.002085147425532341 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.158942699432373, + "epoch": 95 + }, + { + "hidden_norms": [ + 255.63841247558594, + 234.11630249023438, + 216.2378692626953, + 209.49703979492188, + 201.46917724609375 + ], + "bp_grad_norms_per_sample_med": [ + 5.020374737796374e-05, + 5.243354826234281e-05, + 5.587147097685374e-05, + 5.334949673851952e-05, + 4.121083111385815e-05 + ], + "bp_grad_norms_F": [ + 0.002950438065454364, + 0.003093136241659522, + 0.0031878354493528605, + 0.0029664800968021154, + 0.0020843464881181717 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.1582318544387817, + "epoch": 96 + }, + { + "hidden_norms": [ + 255.8027801513672, + 234.07070922851562, + 216.1463623046875, + 209.4476318359375, + 201.27279663085938 + ], + "bp_grad_norms_per_sample_med": [ + 5.0307549827266484e-05, + 5.278814569464885e-05, + 5.604944453807548e-05, + 5.306081584421918e-05, + 4.1182753193425015e-05 + ], + "bp_grad_norms_F": [ + 0.002952505135908723, + 0.003095670836046338, + 0.0031897351145744324, + 0.00296790711581707, + 0.002085329731926322 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.15840482711792, + "epoch": 97 + }, + { + "hidden_norms": [ + 255.60986328125, + 234.11065673828125, + 216.12860107421875, + 209.42921447753906, + 201.28346252441406 + ], + "bp_grad_norms_per_sample_med": [ + 5.0218295655213296e-05, + 5.269264511298388e-05, + 5.5988577514654025e-05, + 5.322946162777953e-05, + 4.136392453801818e-05 + ], + "bp_grad_norms_F": [ + 0.002954497467726469, + 0.003097717184573412, + 0.0031918887980282307, + 0.002969518303871155, + 0.00208606431260705 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1585593223571777, + "epoch": 98 + }, + { + "hidden_norms": [ + 255.57244873046875, + 234.11569213867188, + 216.13626098632812, + 209.40383911132812, + 201.28627014160156 + ], + "bp_grad_norms_per_sample_med": [ + 5.005559796700254e-05, + 5.2759678510483354e-05, + 5.5868193157948554e-05, + 5.3356721764430404e-05, + 4.125368650420569e-05 + ], + "bp_grad_norms_F": [ + 0.0029547216836363077, + 0.00309770368039608, + 0.003191797062754631, + 0.0029695071280002594, + 0.0020862380042672157 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1585021018981934, + "epoch": 99 + }, + { + "hidden_norms": [ + 255.5677947998047, + 234.11875915527344, + 216.1315460205078, + 209.4070281982422, + 201.2687530517578 + ], + "bp_grad_norms_per_sample_med": [ + 5.006368883186951e-05, + 5.279530887492001e-05, + 5.585233884630725e-05, + 5.334027810022235e-05, + 4.123226608498953e-05 + ], + "bp_grad_norms_F": [ + 0.002954971743747592, + 0.0030978918075561523, + 0.003191987983882427, + 0.002969692926853895, + 0.002086336025968194 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.1584858894348145, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 8.719978332519531, + 8.73093318939209, + 8.75937271118164, + 8.790542602539062 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009977436857298017, + 0.000992251792922616, + 0.0009848480112850666, + 0.0009761073160916567, + 0.0009735578205436468 + ], + "bp_grad_norms_F": [ + 0.035340383648872375, + 0.03499162197113037, + 0.03454425558447838, + 0.034113530069589615, + 0.033874060958623886 + ], + "gamma_dfa": 0.006830460682976991, + "acc_eval": 0.095703125, + "loss_eval": 2.486203908920288, + "epoch": 0 + }, + { + "hidden_norms": [ + 861.2440185546875, + 2373.370849609375, + 4675.99951171875, + 6090.40869140625, + 6962.984375 + ], + "bp_grad_norms_per_sample_med": [ + 2.380779051236459e-06, + 1.3197138741816161e-06, + 1.3154849511920474e-06, + 1.3285966815601569e-06, + 1.3258621720524388e-06 + ], + "bp_grad_norms_F": [ + 0.0001391920231981203, + 6.988063250901178e-05, + 6.874280370539054e-05, + 6.720778765156865e-05, + 6.707101420033723e-05 + ], + "gamma_dfa": 0.10659917898010463, + "acc_eval": 0.3037109375, + "loss_eval": 1.9665180444717407, + "epoch": 1 + }, + { + "hidden_norms": [ + 1679.144775390625, + 8850.173828125, + 31676.23046875, + 40712.2109375, + 45375.55859375 + ], + "bp_grad_norms_per_sample_med": [ + 1.1123192962259054e-06, + 2.7329409135745664e-07, + 2.7436919936008053e-07, + 2.75225175982996e-07, + 2.744452558545163e-07 + ], + "bp_grad_norms_F": [ + 7.363831537077203e-05, + 2.2035641450202093e-05, + 1.9731569409486838e-05, + 1.9022963897441514e-05, + 1.7921549442689866e-05 + ], + "gamma_dfa": 0.10788296448299661, + "acc_eval": 0.29296875, + "loss_eval": 1.972828984260559, + "epoch": 2 + }, + { + "hidden_norms": [ + 2530.16015625, + 21436.486328125, + 88828.296875, + 114079.484375, + 124374.78125 + ], + "bp_grad_norms_per_sample_med": [ + 8.110604312605574e-07, + 1.1556701196013819e-07, + 1.1451407289087001e-07, + 1.1523399479074214e-07, + 1.1543902900257308e-07 + ], + "bp_grad_norms_F": [ + 0.00011594755778787658, + 1.8132053810404614e-05, + 1.1369732419552747e-05, + 8.215727575588971e-06, + 7.219489361887099e-06 + ], + "gamma_dfa": 0.1084698709892109, + "acc_eval": 0.318359375, + "loss_eval": 1.9430747032165527, + "epoch": 3 + }, + { + "hidden_norms": [ + 3363.359375, + 41233.19921875, + 182355.03125, + 240225.46875, + 257539.390625 + ], + "bp_grad_norms_per_sample_med": [ + 6.176944111757621e-07, + 6.474806468759198e-08, + 6.307719502274267e-08, + 6.379124783961743e-08, + 6.374663996666641e-08 + ], + "bp_grad_norms_F": [ + 3.5978406231151894e-05, + 4.323610028222902e-06, + 3.5177260997443227e-06, + 3.4877305097325006e-06, + 3.479522774796351e-06 + ], + "gamma_dfa": 0.10987455540453084, + "acc_eval": 0.3173828125, + "loss_eval": 1.959622859954834, + "epoch": 4 + }, + { + "hidden_norms": [ + 4170.119140625, + 70935.8515625, + 335571.09375, + 441693.5625, + 469995.8125 + ], + "bp_grad_norms_per_sample_med": [ + 4.856212285631045e-07, + 4.0158354863706336e-08, + 3.8916198263905244e-08, + 3.9119736783277403e-08, + 3.916203894505088e-08 + ], + "bp_grad_norms_F": [ + 2.611691706988495e-05, + 2.208936621173052e-06, + 1.6750394706832594e-06, + 1.6634863868603134e-06, + 1.659758027017233e-06 + ], + "gamma_dfa": 0.1083616423420608, + "acc_eval": 0.3017578125, + "loss_eval": 1.932759165763855, + "epoch": 5 + }, + { + "hidden_norms": [ + 5013.92236328125, + 106898.6171875, + 530492.6875, + 719779.5, + 763058.3125 + ], + "bp_grad_norms_per_sample_med": [ + 4.242272950705228e-07, + 2.814423716301917e-08, + 2.683668043346188e-08, + 2.6872848835068908e-08, + 2.6873932412740942e-08 + ], + "bp_grad_norms_F": [ + 2.2560918296221644e-05, + 1.2798993793694535e-06, + 1.0339434766137856e-06, + 1.0326252777304035e-06, + 1.030524344969308e-06 + ], + "gamma_dfa": 0.11125951120629907, + "acc_eval": 0.3095703125, + "loss_eval": 1.9531997442245483, + "epoch": 6 + }, + { + "hidden_norms": [ + 5811.36279296875, + 156264.234375, + 809496.6875, + 1104418.875, + 1163013.625 + ], + "bp_grad_norms_per_sample_med": [ + 3.5694648659045924e-07, + 2.0201103012595922e-08, + 1.89678583950581e-08, + 1.8967025283700423e-08, + 1.8932304612917505e-08 + ], + "bp_grad_norms_F": [ + 1.9050115952268243e-05, + 9.341621307612513e-07, + 6.890153372296481e-07, + 6.891143584653037e-07, + 6.886222649882257e-07 + ], + "gamma_dfa": 0.11049338441807777, + "acc_eval": 0.3076171875, + "loss_eval": 1.9362893104553223, + "epoch": 7 + }, + { + "hidden_norms": [ + 6660.841796875, + 217521.65625, + 1158874.5, + 1615614.625, + 1694436.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.212987280676316e-07, + 1.5324568281016582e-08, + 1.4045938634410504e-08, + 1.4053354924215e-08, + 1.4027999206689401e-08 + ], + "bp_grad_norms_F": [ + 1.7352898794342764e-05, + 6.539408445860317e-07, + 5.044145154897706e-07, + 5.047700142313261e-07, + 5.048477760283276e-07 + ], + "gamma_dfa": 0.11245601065456867, + "acc_eval": 0.2978515625, + "loss_eval": 1.9441646337509155, + "epoch": 8 + }, + { + "hidden_norms": [ + 7480.24169921875, + 295557.40625, + 1585967.0, + 2246827.75, + 2356427.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.889860297727864e-07, + 1.193609300287335e-08, + 1.1067995409064224e-08, + 1.103960478587851e-08, + 1.1055576010221557e-08 + ], + "bp_grad_norms_F": [ + 1.5521236491622403e-05, + 4.5597263920171827e-07, + 3.8742672359148855e-07, + 3.8764648024880444e-07, + 3.877208314406744e-07 + ], + "gamma_dfa": 0.11317481694277376, + "acc_eval": 0.30078125, + "loss_eval": 1.9356626272201538, + "epoch": 9 + }, + { + "hidden_norms": [ + 8273.8408203125, + 388312.4375, + 2104540.5, + 3043837.75, + 3180222.75 + ], + "bp_grad_norms_per_sample_med": [ + 2.619119925384439e-07, + 9.19370091168048e-09, + 8.51864179196582e-09, + 8.482276214749618e-09, + 8.476813917468462e-09 + ], + "bp_grad_norms_F": [ + 1.4210399967851117e-05, + 3.5443522961031704e-07, + 3.0404962103602884e-07, + 3.0431687036980293e-07, + 3.0445681886703824e-07 + ], + "gamma_dfa": 0.11495429277420044, + "acc_eval": 0.30859375, + "loss_eval": 1.936495304107666, + "epoch": 10 + }, + { + "hidden_norms": [ + 9086.7265625, + 501434.3125, + 2767834.0, + 4046107.75, + 4214970.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.471596189934644e-07, + 7.524303846651037e-09, + 7.025830139895106e-09, + 7.019247405537499e-09, + 7.011437208603866e-09 + ], + "bp_grad_norms_F": [ + 1.3406845027930103e-05, + 4.39807990915142e-07, + 2.471441860052437e-07, + 2.474318421263888e-07, + 2.475488827258232e-07 + ], + "gamma_dfa": 0.11651878873817623, + "acc_eval": 0.30859375, + "loss_eval": 1.9542189836502075, + "epoch": 11 + }, + { + "hidden_norms": [ + 9854.2626953125, + 612623.625, + 3485830.25, + 5139234.5, + 5346583.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.3279393701614026e-07, + 6.378383154981293e-09, + 5.839252636974379e-09, + 5.8299334249056756e-09, + 5.825462778830115e-09 + ], + "bp_grad_norms_F": [ + 1.2396733836794738e-05, + 2.516441668376501e-07, + 2.0780194631697668e-07, + 2.0795941679807584e-07, + 2.080748373600727e-07 + ], + "gamma_dfa": 0.11470737145282328, + "acc_eval": 0.3046875, + "loss_eval": 1.9374217987060547, + "epoch": 12 + }, + { + "hidden_norms": [ + 10653.666015625, + 745430.125, + 4325399.0, + 6434218.5, + 6688000.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.1187355514484807e-07, + 5.294193083926757e-09, + 4.98529528769609e-09, + 4.991081326011226e-09, + 4.989251234377434e-09 + ], + "bp_grad_norms_F": [ + 1.1210328011657111e-05, + 2.000140426616781e-07, + 1.7647043648594263e-07, + 1.7654315342952032e-07, + 1.7665543339262513e-07 + ], + "gamma_dfa": 0.11383607180323452, + "acc_eval": 0.291015625, + "loss_eval": 1.9233126640319824, + "epoch": 13 + }, + { + "hidden_norms": [ + 11404.5263671875, + 893037.0625, + 5298411.0, + 7870617.0, + 8170729.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.9957101926593168e-07, + 4.642851436642559e-09, + 4.288450483613815e-09, + 4.285100718703916e-09, + 4.289933297485504e-09 + ], + "bp_grad_norms_F": [ + 1.0866175216506235e-05, + 1.758858729772328e-07, + 1.538420519864303e-07, + 1.5386244456294662e-07, + 1.5397839092656795e-07 + ], + "gamma_dfa": 0.1139617893495597, + "acc_eval": 0.30859375, + "loss_eval": 1.932279109954834, + "epoch": 14 + }, + { + "hidden_norms": [ + 12171.2412109375, + 1062066.875, + 6388639.0, + 9528923.0, + 9891447.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.9334000000981177e-07, + 4.044033108385747e-09, + 3.810601167941741e-09, + 3.801854830953744e-09, + 3.8046659156520946e-09 + ], + "bp_grad_norms_F": [ + 1.0322088201064616e-05, + 1.529211743900305e-07, + 1.350435638869385e-07, + 1.3504063645086717e-07, + 1.3514510044387862e-07 + ], + "gamma_dfa": 0.11320225725648925, + "acc_eval": 0.3193359375, + "loss_eval": 1.921454906463623, + "epoch": 15 + }, + { + "hidden_norms": [ + 12924.974609375, + 1273988.625, + 7574387.5, + 11500420.0, + 11920183.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8497563303299103e-07, + 3.6160896499382034e-09, + 3.388503477808058e-09, + 3.385580482628825e-09, + 3.3854716807724117e-09 + ], + "bp_grad_norms_F": [ + 9.76746559899766e-06, + 1.3485876593222201e-07, + 1.1896084117779537e-07, + 1.1894425000491538e-07, + 1.1903343022368063e-07 + ], + "gamma_dfa": 0.11276883230311796, + "acc_eval": 0.306640625, + "loss_eval": 1.9356281757354736, + "epoch": 16 + }, + { + "hidden_norms": [ + 13632.109375, + 1465148.75, + 8873670.0, + 13535396.0, + 14019399.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7523743167657813e-07, + 3.18161341716916e-09, + 3.0166942277531916e-09, + 3.0173783471809656e-09, + 3.0215525637089513e-09 + ], + "bp_grad_norms_F": [ + 9.427177246834617e-06, + 1.1933295240851294e-07, + 1.0663712401992598e-07, + 1.0661205607220836e-07, + 1.0669979388922002e-07 + ], + "gamma_dfa": 0.11264261469477788, + "acc_eval": 0.3203125, + "loss_eval": 1.926081657409668, + "epoch": 17 + }, + { + "hidden_norms": [ + 14394.1845703125, + 1699121.5, + 10379340.0, + 15814831.0, + 16377349.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6784264289526618e-07, + 2.8936604223872564e-09, + 2.7336535257660444e-09, + 2.7314879247342105e-09, + 2.733708148738856e-09 + ], + "bp_grad_norms_F": [ + 9.04797616385622e-06, + 1.087723191517398e-07, + 9.662341682314946e-08, + 9.658959498892727e-08, + 9.665905764677518e-08 + ], + "gamma_dfa": 0.11253939801827073, + "acc_eval": 0.3154296875, + "loss_eval": 1.922888994216919, + "epoch": 18 + }, + { + "hidden_norms": [ + 15138.509765625, + 1969752.0, + 12071423.0, + 18393228.0, + 19044056.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5837277089758572e-07, + 2.609559235366987e-09, + 2.4664128517315476e-09, + 2.4639881246457662e-09, + 2.4657431652030937e-09 + ], + "bp_grad_norms_F": [ + 8.502225682605058e-06, + 9.664965716638108e-08, + 8.704243725787819e-08, + 8.700892806245974e-08, + 8.707356613513184e-08 + ], + "gamma_dfa": 0.11155363742727786, + "acc_eval": 0.3125, + "loss_eval": 1.9243314266204834, + "epoch": 19 + }, + { + "hidden_norms": [ + 15811.982421875, + 2268261.5, + 13867645.0, + 21375086.0, + 22149420.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5073908343765652e-07, + 2.376487229227564e-09, + 2.2317030445861974e-09, + 2.2317414583028494e-09, + 2.2311954506193388e-09 + ], + "bp_grad_norms_F": [ + 8.195236659958027e-06, + 8.728681422098816e-08, + 7.846901439734211e-08, + 7.84395552955175e-08, + 7.849664029890846e-08 + ], + "gamma_dfa": 0.11315422086045146, + "acc_eval": 0.3095703125, + "loss_eval": 1.924652338027954, + "epoch": 20 + }, + { + "hidden_norms": [ + 16487.935546875, + 2556303.5, + 15702076.0, + 24321856.0, + 25185988.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.443007136003871e-07, + 2.174122659681643e-09, + 2.0514809850880056e-09, + 2.052057856971601e-09, + 2.05182382195801e-09 + ], + "bp_grad_norms_F": [ + 8.002187314559706e-06, + 8.025331510452816e-08, + 7.266314838716426e-08, + 7.2638087544874e-08, + 7.268938162496852e-08 + ], + "gamma_dfa": 0.11267373809823766, + "acc_eval": 0.310546875, + "loss_eval": 1.9348869323730469, + "epoch": 21 + }, + { + "hidden_norms": [ + 17153.216796875, + 2908610.25, + 17831918.0, + 27718528.0, + 28682196.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.43127067531168e-07, + 2.0134633960111614e-09, + 1.908325941712974e-09, + 1.9070569567958273e-09, + 1.9050578892176873e-09 + ], + "bp_grad_norms_F": [ + 7.550354439445073e-06, + 7.309487415341209e-08, + 6.660556550741603e-08, + 6.657593587533484e-08, + 6.66217090383725e-08 + ], + "gamma_dfa": 0.11266892295680009, + "acc_eval": 0.310546875, + "loss_eval": 1.9210036993026733, + "epoch": 22 + }, + { + "hidden_norms": [ + 17796.001953125, + 3236156.25, + 20246900.0, + 31494576.0, + 32571052.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3518946673229948e-07, + 1.8474217711172969e-09, + 1.7507182370479768e-09, + 1.7496273319039801e-09, + 1.7511733174657707e-09 + ], + "bp_grad_norms_F": [ + 7.284599632839672e-06, + 6.709063882226474e-08, + 6.151606157800416e-08, + 6.149030440383285e-08, + 6.153235432293513e-08 + ], + "gamma_dfa": 0.11186322406865656, + "acc_eval": 0.3115234375, + "loss_eval": 1.9283114671707153, + "epoch": 23 + }, + { + "hidden_norms": [ + 18460.63671875, + 3604280.25, + 22626418.0, + 35429216.0, + 36622356.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3137012899733236e-07, + 1.7567419741126855e-09, + 1.6593408869169934e-09, + 1.6595901319860218e-09, + 1.6608053821087765e-09 + ], + "bp_grad_norms_F": [ + 7.130098310881294e-06, + 6.264485108431472e-08, + 5.731577701340029e-08, + 5.729528851361465e-08, + 5.733248187311801e-08 + ], + "gamma_dfa": 0.11299802124267444, + "acc_eval": 0.2978515625, + "loss_eval": 1.942992925643921, + "epoch": 24 + }, + { + "hidden_norms": [ + 19115.904296875, + 4038094.25, + 25405536.0, + 39835936.0, + 41154148.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2640579427625198e-07, + 1.5953075527264104e-09, + 1.5003157605164574e-09, + 1.4991035079958692e-09, + 1.4979777418488993e-09 + ], + "bp_grad_norms_F": [ + 6.799941729696002e-06, + 5.7522207441706996e-08, + 5.297441418861126e-08, + 5.2952817242157835e-08, + 5.298943506204523e-08 + ], + "gamma_dfa": 0.11197824770351872, + "acc_eval": 0.298828125, + "loss_eval": 1.9319748878479004, + "epoch": 25 + }, + { + "hidden_norms": [ + 19780.572265625, + 4490110.5, + 28153634.0, + 44291160.0, + 45731404.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2269519800156559e-07, + 1.4798114955638653e-09, + 1.4102843337582271e-09, + 1.4097069067631196e-09, + 1.4109671209183716e-09 + ], + "bp_grad_norms_F": [ + 6.577545264008222e-06, + 5.327013141709358e-08, + 4.94958669605694e-08, + 4.9476955865657146e-08, + 4.950964083150211e-08 + ], + "gamma_dfa": 0.11252723945653997, + "acc_eval": 0.3115234375, + "loss_eval": 1.9247620105743408, + "epoch": 26 + }, + { + "hidden_norms": [ + 20381.6796875, + 4929967.0, + 30880866.0, + 48905308.0, + 50483824.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1911821928833888e-07, + 1.377626124288156e-09, + 1.3317531522005766e-09, + 1.3313244950907688e-09, + 1.3306112878197496e-09 + ], + "bp_grad_norms_F": [ + 6.326347829599399e-06, + 4.955709798082353e-08, + 4.649340468176888e-08, + 4.6477893533847237e-08, + 4.650862805988254e-08 + ], + "gamma_dfa": 0.11152978462632746, + "acc_eval": 0.2978515625, + "loss_eval": 1.9170689582824707, + "epoch": 27 + }, + { + "hidden_norms": [ + 21001.544921875, + 5444194.5, + 33907076.0, + 53832084.0, + 55554724.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1559290413742929e-07, + 1.3061883796794405e-09, + 1.2378150726632953e-09, + 1.2379912650573033e-09, + 1.2384089309591673e-09 + ], + "bp_grad_norms_F": [ + 6.23212235950632e-06, + 4.7021419646853246e-08, + 4.3998962695468435e-08, + 4.3984215380987735e-08, + 4.4011432720481025e-08 + ], + "gamma_dfa": 0.11285935762862209, + "acc_eval": 0.3193359375, + "loss_eval": 1.9198743104934692, + "epoch": 28 + }, + { + "hidden_norms": [ + 21623.64453125, + 5895143.0, + 37025488.0, + 58791348.0, + 60687928.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1377478870144841e-07, + 1.2547849426169932e-09, + 1.1888731110687445e-09, + 1.1877619998656996e-09, + 1.1896320595283782e-09 + ], + "bp_grad_norms_F": [ + 6.024939921189798e-06, + 4.443810297516393e-08, + 4.161294953064498e-08, + 4.159920763413538e-08, + 4.162497546644772e-08 + ], + "gamma_dfa": 0.11188641694025137, + "acc_eval": 0.3115234375, + "loss_eval": 1.917163372039795, + "epoch": 29 + }, + { + "hidden_norms": [ + 22195.29296875, + 6369258.5, + 40117404.0, + 64235468.0, + 66270544.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1021134582733794e-07, + 1.153794726427293e-09, + 1.1123471033158694e-09, + 1.1119479781385166e-09, + 1.1122585075185043e-09 + ], + "bp_grad_norms_F": [ + 5.96408472119947e-06, + 4.2022573865097e-08, + 3.954471239353552e-08, + 3.953241289877951e-08, + 3.955623029128219e-08 + ], + "gamma_dfa": 0.11316103948047385, + "acc_eval": 0.3125, + "loss_eval": 1.9332935810089111, + "epoch": 30 + }, + { + "hidden_norms": [ + 22786.513671875, + 6899202.5, + 43496572.0, + 69758712.0, + 71960648.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0609301170916297e-07, + 1.1096534802135238e-09, + 1.05872854927469e-09, + 1.0590027743617725e-09, + 1.0579482845329835e-09 + ], + "bp_grad_norms_F": [ + 5.711301128030755e-06, + 3.962547268088201e-08, + 3.742779952631281e-08, + 3.741677900848117e-08, + 3.743992138538488e-08 + ], + "gamma_dfa": 0.11225346029095817, + "acc_eval": 0.31640625, + "loss_eval": 1.9247596263885498, + "epoch": 31 + }, + { + "hidden_norms": [ + 23367.078125, + 7480530.0, + 47061616.0, + 75610000.0, + 77981320.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.054115728038596e-07, + 1.0618838031106748e-09, + 1.0191184562913236e-09, + 1.01949926278877e-09, + 1.0192180432966325e-09 + ], + "bp_grad_norms_F": [ + 5.768360097135883e-06, + 3.826109207238915e-08, + 3.593911657162607e-08, + 3.592855790657268e-08, + 3.594948694285449e-08 + ], + "gamma_dfa": 0.11492819089471595, + "acc_eval": 0.314453125, + "loss_eval": 1.939026117324829, + "epoch": 32 + }, + { + "hidden_norms": [ + 23912.85546875, + 8053234.0, + 51027352.0, + 81931568.0, + 84515616.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0266481353937706e-07, + 9.919576271499864e-10, + 9.572211912001194e-10, + 9.572932446744176e-10, + 9.577664217275128e-10 + ], + "bp_grad_norms_F": [ + 5.472421435115393e-06, + 3.587240016145188e-08, + 3.39712649122248e-08, + 3.396091940999213e-08, + 3.398050552050336e-08 + ], + "gamma_dfa": 0.11253271601162851, + "acc_eval": 0.3125, + "loss_eval": 1.9187253713607788, + "epoch": 33 + }, + { + "hidden_norms": [ + 24486.8359375, + 8682399.0, + 55030492.0, + 88236184.0, + 91025880.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0101911129822838e-07, + 9.702203485062455e-10, + 9.30652499508966e-10, + 9.30728105696943e-10, + 9.303261494508774e-10 + ], + "bp_grad_norms_F": [ + 5.286908617563313e-06, + 3.4072087373715476e-08, + 3.2386065385026086e-08, + 3.2376764380614986e-08, + 3.2396076932172946e-08 + ], + "gamma_dfa": 0.11125053715659305, + "acc_eval": 0.3125, + "loss_eval": 1.9214520454406738, + "epoch": 34 + }, + { + "hidden_norms": [ + 25051.91796875, + 9255517.0, + 58776788.0, + 94748472.0, + 97725744.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.793318156425812e-08, + 9.150468716079274e-10, + 8.747003676923271e-10, + 8.746902091516517e-10, + 8.743750723461119e-10 + ], + "bp_grad_norms_F": [ + 5.294927632348845e-06, + 3.279593840943562e-08, + 3.115108881956985e-08, + 3.114205782139834e-08, + 3.115993862934374e-08 + ], + "gamma_dfa": 0.11356210591475246, + "acc_eval": 0.314453125, + "loss_eval": 1.9334189891815186, + "epoch": 35 + }, + { + "hidden_norms": [ + 25539.400390625, + 9852175.0, + 62733436.0, + 101270040.0, + 104412528.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.590952032567657e-08, + 8.831190223546059e-10, + 8.506708115696426e-10, + 8.503630022360653e-10, + 8.506205184666271e-10 + ], + "bp_grad_norms_F": [ + 5.156022325536469e-06, + 3.1347209272780674e-08, + 2.992178593785866e-08, + 2.9913682197957314e-08, + 2.9930919964726854e-08 + ], + "gamma_dfa": 0.11300312746607233, + "acc_eval": 0.3291015625, + "loss_eval": 1.9240946769714355, + "epoch": 36 + }, + { + "hidden_norms": [ + 26058.23046875, + 10503947.0, + 66954420.0, + 108182184.0, + 111535672.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.312070403666439e-08, + 8.298656206662258e-10, + 8.076765367626138e-10, + 8.076487811869981e-10, + 8.083505531608637e-10 + ], + "bp_grad_norms_F": [ + 5.084062195237493e-06, + 3.008365112577849e-08, + 2.8773875726528786e-08, + 2.8766294235538226e-08, + 2.878227967073599e-08 + ], + "gamma_dfa": 0.11286510003083094, + "acc_eval": 0.322265625, + "loss_eval": 1.9284429550170898, + "epoch": 37 + }, + { + "hidden_norms": [ + 26547.951171875, + 11128081.0, + 71119440.0, + 115305784.0, + 118851064.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.278523549482998e-08, + 8.024952369289906e-10, + 7.701798643289237e-10, + 7.699446635811569e-10, + 7.706733029522184e-10 + ], + "bp_grad_norms_F": [ + 4.915013960271608e-06, + 2.8781727223758935e-08, + 2.7522533585511155e-08, + 2.751522920618754e-08, + 2.7530596469205193e-08 + ], + "gamma_dfa": 0.11193350053144968, + "acc_eval": 0.3046875, + "loss_eval": 1.9189305305480957, + "epoch": 38 + }, + { + "hidden_norms": [ + 27052.158203125, + 11815623.0, + 75267568.0, + 122747224.0, + 126538816.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.042137349979384e-08, + 7.699976212194315e-10, + 7.406790181185841e-10, + 7.406811275423308e-10, + 7.407266466863405e-10 + ], + "bp_grad_norms_F": [ + 4.783120857609902e-06, + 2.7648876965713498e-08, + 2.6492134708178128e-08, + 2.6485189152936073e-08, + 2.6500073246893407e-08 + ], + "gamma_dfa": 0.1119252087228233, + "acc_eval": 0.3076171875, + "loss_eval": 1.9200191497802734, + "epoch": 39 + }, + { + "hidden_norms": [ + 27573.439453125, + 12446571.0, + 79631776.0, + 129906592.0, + 133912576.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.999781897500725e-08, + 7.431448234562765e-10, + 7.212022645752825e-10, + 7.211930497241781e-10, + 7.215293917894883e-10 + ], + "bp_grad_norms_F": [ + 4.7411135710717645e-06, + 2.6746526771148638e-08, + 2.567137080689008e-08, + 2.566465262532347e-08, + 2.5678824400188205e-08 + ], + "gamma_dfa": 0.1126710368462227, + "acc_eval": 0.3291015625, + "loss_eval": 1.9156131744384766, + "epoch": 40 + }, + { + "hidden_norms": [ + 28020.1953125, + 13139046.0, + 84357848.0, + 137652880.0, + 141892912.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.93968845616655e-08, + 7.234106647047156e-10, + 7.015109604324721e-10, + 7.013014613477253e-10, + 7.019884118442121e-10 + ], + "bp_grad_norms_F": [ + 4.706852905655978e-06, + 2.5948086346261334e-08, + 2.480862271170281e-08, + 2.4802661258149783e-08, + 2.4816182886411298e-08 + ], + "gamma_dfa": 0.11299434299689892, + "acc_eval": 0.3134765625, + "loss_eval": 1.917637825012207, + "epoch": 41 + }, + { + "hidden_norms": [ + 28489.8828125, + 13728548.0, + 88388480.0, + 144432224.0, + 148906448.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.832166287220389e-08, + 7.007013858029154e-10, + 6.849794620400473e-10, + 6.849559253119253e-10, + 6.857461820608535e-10 + ], + "bp_grad_norms_F": [ + 4.678155619330937e-06, + 2.5201579489930737e-08, + 2.418770428391781e-08, + 2.4181909807907687e-08, + 2.419472266979028e-08 + ], + "gamma_dfa": 0.11410953500489995, + "acc_eval": 0.314453125, + "loss_eval": 1.9333336353302002, + "epoch": 42 + }, + { + "hidden_norms": [ + 28918.5546875, + 14414132.0, + 92681240.0, + 151898304.0, + 156571040.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.454645694655483e-08, + 6.792187368098723e-10, + 6.553820264265653e-10, + 6.554308207284976e-10, + 6.556304388283252e-10 + ], + "bp_grad_norms_F": [ + 4.511462066147942e-06, + 2.4275013998931172e-08, + 2.338800797474505e-08, + 2.338238225263467e-08, + 2.3394919779207157e-08 + ], + "gamma_dfa": 0.11213390928969602, + "acc_eval": 0.3037109375, + "loss_eval": 1.9155462980270386, + "epoch": 43 + }, + { + "hidden_norms": [ + 29332.80078125, + 15055747.0, + 96975336.0, + 159279984.0, + 164189344.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.274933804841567e-08, + 6.447524736330479e-10, + 6.278008113369538e-10, + 6.277455777414787e-10, + 6.275664987676066e-10 + ], + "bp_grad_norms_F": [ + 4.426053692441201e-06, + 2.3487833900048827e-08, + 2.272233956546188e-08, + 2.2717028258512073e-08, + 2.272915367029782e-08 + ], + "gamma_dfa": 0.11223121372131573, + "acc_eval": 0.3173828125, + "loss_eval": 1.9162096977233887, + "epoch": 44 + }, + { + "hidden_norms": [ + 29736.349609375, + 15823423.0, + 101458080.0, + 166481584.0, + 171638352.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.434898290943238e-08, + 6.55440757224568e-10, + 6.384029416217629e-10, + 6.384751061183636e-10, + 6.382625539202991e-10 + ], + "bp_grad_norms_F": [ + 4.4675143726635724e-06, + 2.308258295613541e-08, + 2.2235047580920764e-08, + 2.2229942331364327e-08, + 2.2241332331418562e-08 + ], + "gamma_dfa": 0.11349940555010107, + "acc_eval": 0.3134765625, + "loss_eval": 1.935542106628418, + "epoch": 45 + }, + { + "hidden_norms": [ + 30168.33984375, + 16512403.0, + 106240736.0, + 174293312.0, + 179686352.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.255891259523196e-08, + 6.180955192114368e-10, + 6.070984825967685e-10, + 6.070359770404821e-10, + 6.068190394614703e-10 + ], + "bp_grad_norms_F": [ + 4.380563041195273e-06, + 2.227099038520919e-08, + 2.156298606337259e-08, + 2.1558207663474604e-08, + 2.1569489305761635e-08 + ], + "gamma_dfa": 0.11322060551538016, + "acc_eval": 0.3212890625, + "loss_eval": 1.9260894060134888, + "epoch": 46 + }, + { + "hidden_norms": [ + 30560.10546875, + 17240642.0, + 111300408.0, + 182109792.0, + 187762288.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.14508851476603e-08, + 6.030238530740917e-10, + 5.890909982042558e-10, + 5.890405385677866e-10, + 5.88881721164114e-10 + ], + "bp_grad_norms_F": [ + 4.2523201955191325e-06, + 2.1578937747790405e-08, + 2.0878760054188206e-08, + 2.0874194817110947e-08, + 2.08853556671329e-08 + ], + "gamma_dfa": 0.11227845895700739, + "acc_eval": 0.3193359375, + "loss_eval": 1.9136857986450195, + "epoch": 47 + }, + { + "hidden_norms": [ + 30927.453125, + 17981622.0, + 115698520.0, + 189446720.0, + 195329056.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.999796736157805e-08, + 5.827110460820961e-10, + 5.688347570753649e-10, + 5.688115534141502e-10, + 5.69402469619007e-10 + ], + "bp_grad_norms_F": [ + 4.254153282090556e-06, + 2.1111715042820833e-08, + 2.044158087244341e-08, + 2.043698899001356e-08, + 2.0447874504725405e-08 + ], + "gamma_dfa": 0.11285097184736514, + "acc_eval": 0.3251953125, + "loss_eval": 1.9130818843841553, + "epoch": 48 + }, + { + "hidden_norms": [ + 31297.09765625, + 18680606.0, + 120312440.0, + 197032272.0, + 203114064.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.911415877970285e-08, + 5.74776504169705e-10, + 5.532440061628563e-10, + 5.531197722064007e-10, + 5.533422053893844e-10 + ], + "bp_grad_norms_F": [ + 4.17833052779315e-06, + 2.0621358842731752e-08, + 1.9960678443453617e-08, + 1.9956562624656726e-08, + 1.9966993392017685e-08 + ], + "gamma_dfa": 0.11243592749451636, + "acc_eval": 0.3125, + "loss_eval": 1.9191365242004395, + "epoch": 49 + }, + { + "hidden_norms": [ + 31637.244140625, + 19360764.0, + 124754384.0, + 204064768.0, + 210382992.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.003268447964729e-08, + 5.749308251701279e-10, + 5.599746222273438e-10, + 5.599968821989876e-10, + 5.599694041791281e-10 + ], + "bp_grad_norms_F": [ + 4.128593900531996e-06, + 2.0178502424528233e-08, + 1.9575201903876405e-08, + 1.9571228193626666e-08, + 1.9581117172151608e-08 + ], + "gamma_dfa": 0.11233749791426817, + "acc_eval": 0.330078125, + "loss_eval": 1.9152377843856812, + "epoch": 50 + }, + { + "hidden_norms": [ + 31964.60546875, + 20067444.0, + 128969536.0, + 211772368.0, + 218247696.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.774531951554309e-08, + 5.427598370744136e-10, + 5.298457228519737e-10, + 5.297982053065198e-10, + 5.30141264221129e-10 + ], + "bp_grad_norms_F": [ + 4.058078957314137e-06, + 1.9621586133666824e-08, + 1.90722975190738e-08, + 1.9068517431719556e-08, + 1.907839575210346e-08 + ], + "gamma_dfa": 0.11183859535958618, + "acc_eval": 0.328125, + "loss_eval": 1.9089019298553467, + "epoch": 51 + }, + { + "hidden_norms": [ + 32292.658203125, + 20829408.0, + 133566216.0, + 219264704.0, + 225938912.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.692310788343093e-08, + 5.312774109533791e-10, + 5.173871886476888e-10, + 5.171740258269608e-10, + 5.173406147918058e-10 + ], + "bp_grad_norms_F": [ + 4.047169568366371e-06, + 1.926170511978853e-08, + 1.867934962263007e-08, + 1.8675748947316606e-08, + 1.868521692927061e-08 + ], + "gamma_dfa": 0.11216733865148854, + "acc_eval": 0.330078125, + "loss_eval": 1.917893886566162, + "epoch": 52 + }, + { + "hidden_norms": [ + 32582.02734375, + 21555154.0, + 138235216.0, + 226622112.0, + 233550816.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.588336359276582e-08, + 5.294207294781472e-10, + 5.160025184913763e-10, + 5.156744475875996e-10, + 5.168100947194887e-10 + ], + "bp_grad_norms_F": [ + 3.991732683061855e-06, + 1.8877956975416055e-08, + 1.8321758332717764e-08, + 1.831830331866513e-08, + 1.832757234865312e-08 + ], + "gamma_dfa": 0.11230919507215731, + "acc_eval": 0.314453125, + "loss_eval": 1.913461685180664, + "epoch": 53 + }, + { + "hidden_norms": [ + 32871.28125, + 22246662.0, + 142493184.0, + 233885040.0, + 241005264.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.552973357860537e-08, + 5.124695112712629e-10, + 4.966513311721599e-10, + 4.966223543512172e-10, + 4.969377687125132e-10 + ], + "bp_grad_norms_F": [ + 4.012842964584706e-06, + 1.8570215587487837e-08, + 1.8001765411668202e-08, + 1.799840099181438e-08, + 1.800739823920594e-08 + ], + "gamma_dfa": 0.11296637258055853, + "acc_eval": 0.33203125, + "loss_eval": 1.9206554889678955, + "epoch": 54 + }, + { + "hidden_norms": [ + 33169.98828125, + 22902584.0, + 146822496.0, + 241191920.0, + 248487904.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.486269026912851e-08, + 4.992010138593628e-10, + 4.874242676145002e-10, + 4.874663450671335e-10, + 4.884102011715186e-10 + ], + "bp_grad_norms_F": [ + 3.938752797694178e-06, + 1.8166964821375586e-08, + 1.767327617585579e-08, + 1.7670013008341812e-08, + 1.7678777552987412e-08 + ], + "gamma_dfa": 0.11258088904469332, + "acc_eval": 0.3134765625, + "loss_eval": 1.913904070854187, + "epoch": 55 + }, + { + "hidden_norms": [ + 33456.9140625, + 23628216.0, + 151346624.0, + 248325424.0, + 255824304.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.482947239623172e-08, + 5.02439700955648e-10, + 4.890933769097217e-10, + 4.891700933207233e-10, + 4.892242166931737e-10 + ], + "bp_grad_norms_F": [ + 3.895439022016944e-06, + 1.781435265968412e-08, + 1.7326955870089478e-08, + 1.7324007117736073e-08, + 1.7332443036366385e-08 + ], + "gamma_dfa": 0.11223017568408977, + "acc_eval": 0.314453125, + "loss_eval": 1.9154590368270874, + "epoch": 56 + }, + { + "hidden_norms": [ + 33716.85546875, + 24280678.0, + 155270816.0, + 255050304.0, + 262737184.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.482827157900829e-08, + 4.958616850458952e-10, + 4.826584132366918e-10, + 4.826221089437865e-10, + 4.828137889489881e-10 + ], + "bp_grad_norms_F": [ + 3.898983777617104e-06, + 1.7600514823357116e-08, + 1.7106302152569697e-08, + 1.7103344518432095e-08, + 1.7111482009113388e-08 + ], + "gamma_dfa": 0.11287979638109391, + "acc_eval": 0.30859375, + "loss_eval": 1.9285999536514282, + "epoch": 57 + }, + { + "hidden_norms": [ + 33981.390625, + 24925848.0, + 159148752.0, + 261662432.0, + 269540768.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.396101153744894e-08, + 4.846232304345222e-10, + 4.728849534174628e-10, + 4.72891226177552e-10, + 4.725210223099907e-10 + ], + "bp_grad_norms_F": [ + 3.847520019917283e-06, + 1.7274359720431676e-08, + 1.6806101399424733e-08, + 1.6803195279635474e-08, + 1.681126526875687e-08 + ], + "gamma_dfa": 0.11251267153238587, + "acc_eval": 0.330078125, + "loss_eval": 1.913767695426941, + "epoch": 58 + }, + { + "hidden_norms": [ + 34242.87890625, + 25494510.0, + 162965072.0, + 268190960.0, + 276245600.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.276207725226413e-08, + 4.64974586611433e-10, + 4.573621481540613e-10, + 4.5720988106623395e-10, + 4.578690204759539e-10 + ], + "bp_grad_norms_F": [ + 3.846054823952727e-06, + 1.7068730429059542e-08, + 1.6637597965996065e-08, + 1.663470783341836e-08, + 1.6642776046182917e-08 + ], + "gamma_dfa": 0.11268835317605408, + "acc_eval": 0.318359375, + "loss_eval": 1.9175846576690674, + "epoch": 59 + }, + { + "hidden_norms": [ + 34498.37890625, + 26013872.0, + 166717360.0, + 274736192.0, + 282985952.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.275441760157264e-08, + 4.638447681504232e-10, + 4.554343846496778e-10, + 4.5541673210358624e-10, + 4.558452226799403e-10 + ], + "bp_grad_norms_F": [ + 3.7814804727531737e-06, + 1.6729790885960938e-08, + 1.629800472358056e-08, + 1.629528156854576e-08, + 1.630315793477166e-08 + ], + "gamma_dfa": 0.11192971542368468, + "acc_eval": 0.3125, + "loss_eval": 1.9148613214492798, + "epoch": 60 + }, + { + "hidden_norms": [ + 34741.75390625, + 26574266.0, + 170266464.0, + 280835296.0, + 289264896.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.206668328763044e-08, + 4.543688481017938e-10, + 4.4642781138470866e-10, + 4.464762171085823e-10, + 4.4638817642272954e-10 + ], + "bp_grad_norms_F": [ + 3.800365902861813e-06, + 1.6550599113429598e-08, + 1.6135599523181554e-08, + 1.6132924329781417e-08, + 1.6140655034746487e-08 + ], + "gamma_dfa": 0.11263992198291817, + "acc_eval": 0.328125, + "loss_eval": 1.9202332496643066, + "epoch": 61 + }, + { + "hidden_norms": [ + 34981.7578125, + 27132752.0, + 173824032.0, + 286969856.0, + 295549056.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.146741154429037e-08, + 4.5107212409689623e-10, + 4.4140177624107935e-10, + 4.4141457156143815e-10, + 4.4168110835407504e-10 + ], + "bp_grad_norms_F": [ + 3.7655997857655166e-06, + 1.6349241960256222e-08, + 1.5922701379622595e-08, + 1.5920058160645567e-08, + 1.592757570278991e-08 + ], + "gamma_dfa": 0.11310465578208095, + "acc_eval": 0.314453125, + "loss_eval": 1.9224812984466553, + "epoch": 62 + }, + { + "hidden_norms": [ + 35201.25, + 27683016.0, + 177040880.0, + 292723872.0, + 301473504.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.122528700165276e-08, + 4.486005733550513e-10, + 4.4048292791032395e-10, + 4.4043477198663084e-10, + 4.4109013663806707e-10 + ], + "bp_grad_norms_F": [ + 3.748537892533932e-06, + 1.6115603074240425e-08, + 1.5725172275438126e-08, + 1.572264451965566e-08, + 1.5729948898979274e-08 + ], + "gamma_dfa": 0.11326105792613816, + "acc_eval": 0.3095703125, + "loss_eval": 1.9233062267303467, + "epoch": 63 + }, + { + "hidden_norms": [ + 35399.75390625, + 28156860.0, + 180111792.0, + 298457728.0, + 307298976.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.082014974457707e-08, + 4.4495629403229486e-10, + 4.324987312731565e-10, + 4.3260212079232474e-10, + 4.3259393289751813e-10 + ], + "bp_grad_norms_F": [ + 3.685790488816565e-06, + 1.5895359695150546e-08, + 1.5473323955461638e-08, + 1.547100403342938e-08, + 1.5478214265840506e-08 + ], + "gamma_dfa": 0.11222807004196511, + "acc_eval": 0.3125, + "loss_eval": 1.9198863506317139, + "epoch": 64 + }, + { + "hidden_norms": [ + 35584.6640625, + 28666806.0, + 183522992.0, + 303940064.0, + 312955008.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.149574088316513e-08, + 4.4883607941414994e-10, + 4.353337967888393e-10, + 4.3539158389727106e-10, + 4.35594643688475e-10 + ], + "bp_grad_norms_F": [ + 3.6930814530933276e-06, + 1.5769751726679715e-08, + 1.5353194271483517e-08, + 1.535078197889561e-08, + 1.5357914051605803e-08 + ], + "gamma_dfa": 0.11321029500413715, + "acc_eval": 0.3095703125, + "loss_eval": 1.9162211418151855, + "epoch": 65 + }, + { + "hidden_norms": [ + 35768.86328125, + 29145662.0, + 186551392.0, + 308909184.0, + 318089856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.985555245364594e-08, + 4.355726057614362e-10, + 4.2523776166980554e-10, + 4.251851093428627e-10, + 4.2568140679044575e-10 + ], + "bp_grad_norms_F": [ + 3.7230390717013506e-06, + 1.5615523096812467e-08, + 1.523139303571952e-08, + 1.522908021911462e-08, + 1.5236116368555486e-08 + ], + "gamma_dfa": 0.11393742701784504, + "acc_eval": 0.31640625, + "loss_eval": 1.9276196956634521, + "epoch": 66 + }, + { + "hidden_norms": [ + 35944.30859375, + 29545796.0, + 189503824.0, + 313822880.0, + 323180096.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.027381343505112e-08, + 4.2508935260698877e-10, + 4.156285593470699e-10, + 4.156731903126598e-10, + 4.1562600583411324e-10 + ], + "bp_grad_norms_F": [ + 3.67820075553027e-06, + 1.5450812185235918e-08, + 1.5081118576176777e-08, + 1.5078812864999236e-08, + 1.5085870330722173e-08 + ], + "gamma_dfa": 0.11295431066082529, + "acc_eval": 0.3251953125, + "loss_eval": 1.9145984649658203, + "epoch": 67 + }, + { + "hidden_norms": [ + 36107.91015625, + 29963964.0, + 192509232.0, + 318614048.0, + 328116416.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.995779955332182e-08, + 4.257695862541766e-10, + 4.1527120631101866e-10, + 4.1522696392348735e-10, + 4.1541275974665837e-10 + ], + "bp_grad_norms_F": [ + 3.6363949220685754e-06, + 1.5271682585193957e-08, + 1.4899570466297973e-08, + 1.4897324263074552e-08, + 1.4904214751254585e-08 + ], + "gamma_dfa": 0.11261070579712396, + "acc_eval": 0.322265625, + "loss_eval": 1.9148796796798706, + "epoch": 68 + }, + { + "hidden_norms": [ + 36263.38671875, + 30397186.0, + 195132224.0, + 323205344.0, + 332809856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.94296602432587e-08, + 4.221426264106043e-10, + 4.1666703420872864e-10, + 4.166992584320184e-10, + 4.166444134146019e-10 + ], + "bp_grad_norms_F": [ + 3.677051836348255e-06, + 1.5217779036902357e-08, + 1.486149248108859e-08, + 1.4859250718757266e-08, + 1.4866162523219373e-08 + ], + "gamma_dfa": 0.11349719034842565, + "acc_eval": 0.3134765625, + "loss_eval": 1.9238262176513672, + "epoch": 69 + }, + { + "hidden_norms": [ + 36417.9921875, + 30770712.0, + 197719328.0, + 327539232.0, + 337245152.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.906716976118332e-08, + 4.1953429619212557e-10, + 4.080901727654407e-10, + 4.080701054842706e-10, + 4.0843109450072745e-10 + ], + "bp_grad_norms_F": [ + 3.6080327845411375e-06, + 1.500828084033401e-08, + 1.4656276192681617e-08, + 1.465407439837918e-08, + 1.466091692492455e-08 + ], + "gamma_dfa": 0.11264980123269197, + "acc_eval": 0.3115234375, + "loss_eval": 1.9172749519348145, + "epoch": 70 + }, + { + "hidden_norms": [ + 36554.734375, + 31127202.0, + 200166992.0, + 331766240.0, + 341638624.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.895474768953136e-08, + 4.153002663986882e-10, + 4.053070101761591e-10, + 4.0528172484677327e-10, + 4.0563402636806245e-10 + ], + "bp_grad_norms_F": [ + 3.5790299079963006e-06, + 1.4871366360580396e-08, + 1.4521869928785236e-08, + 1.4519704549798007e-08, + 1.4526481351140319e-08 + ], + "gamma_dfa": 0.1125820265888251, + "acc_eval": 0.3291015625, + "loss_eval": 1.90960693359375, + "epoch": 71 + }, + { + "hidden_norms": [ + 36685.06640625, + 31478428.0, + 202703456.0, + 335890528.0, + 345860736.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.840604527269534e-08, + 4.11831152513642e-10, + 4.0155134772845713e-10, + 4.014005239305618e-10, + 4.018080868029017e-10 + ], + "bp_grad_norms_F": [ + 3.5732464311877266e-06, + 1.4777253198872131e-08, + 1.4430981742918902e-08, + 1.4428859884674239e-08, + 1.443555053270984e-08 + ], + "gamma_dfa": 0.11229235199152754, + "acc_eval": 0.3095703125, + "loss_eval": 1.912062644958496, + "epoch": 72 + }, + { + "hidden_norms": [ + 36808.640625, + 31756406.0, + 205006400.0, + 339625888.0, + 349722048.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.845510824859957e-08, + 4.056126268192628e-10, + 3.9775802096464474e-10, + 3.9773195847914167e-10, + 3.978435358931165e-10 + ], + "bp_grad_norms_F": [ + 3.601402113417862e-06, + 1.4699119255112691e-08, + 1.434870711136682e-08, + 1.4346603904868971e-08, + 1.4353199517813664e-08 + ], + "gamma_dfa": 0.11323098125649267, + "acc_eval": 0.3271484375, + "loss_eval": 1.9194645881652832, + "epoch": 73 + }, + { + "hidden_norms": [ + 36922.67578125, + 32105574.0, + 207090144.0, + 343260640.0, + 353436544.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.8447327805643e-08, + 4.050982882475296e-10, + 3.977037865698918e-10, + 3.9765896131527256e-10, + 3.979234441953139e-10 + ], + "bp_grad_norms_F": [ + 3.603466893764562e-06, + 1.4652233204515142e-08, + 1.4306199780378392e-08, + 1.4304094797523703e-08, + 1.4310627349800598e-08 + ], + "gamma_dfa": 0.11329636031587142, + "acc_eval": 0.3056640625, + "loss_eval": 1.922640323638916, + "epoch": 74 + }, + { + "hidden_norms": [ + 37024.05859375, + 32409028.0, + 208845456.0, + 346325312.0, + 356587104.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.819700359983472e-08, + 4.0326031403026263e-10, + 3.9583156197231517e-10, + 3.9586384170675615e-10, + 3.9581374289276994e-10 + ], + "bp_grad_norms_F": [ + 3.5432237837085268e-06, + 1.4486117194678627e-08, + 1.4156262828635136e-08, + 1.4154186267489877e-08, + 1.4160684180808403e-08 + ], + "gamma_dfa": 0.11267639175457589, + "acc_eval": 0.31640625, + "loss_eval": 1.9154051542282104, + "epoch": 75 + }, + { + "hidden_norms": [ + 37125.02734375, + 32663892.0, + 210781344.0, + 349533728.0, + 359873568.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.772787486397647e-08, + 3.9591485645473767e-10, + 3.875866017022389e-10, + 3.8754283115949306e-10, + 3.8766378995802597e-10 + ], + "bp_grad_norms_F": [ + 3.5503553590388037e-06, + 1.4420066918319208e-08, + 1.40893732236691e-08, + 1.4087291333453322e-08, + 1.4093810563053921e-08 + ], + "gamma_dfa": 0.11297615164312447, + "acc_eval": 0.32421875, + "loss_eval": 1.913941502571106, + "epoch": 76 + }, + { + "hidden_norms": [ + 37216.296875, + 32930840.0, + 212456432.0, + 352475008.0, + 362884992.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.74248425980295e-08, + 3.9426073517034865e-10, + 3.872507869928654e-10, + 3.8720734951702696e-10, + 3.8765768373139053e-10 + ], + "bp_grad_norms_F": [ + 3.55011752617429e-06, + 1.4357588895563822e-08, + 1.402936344874206e-08, + 1.402732330291201e-08, + 1.4033815887160017e-08 + ], + "gamma_dfa": 0.11311322844358074, + "acc_eval": 0.3203125, + "loss_eval": 1.914380431175232, + "epoch": 77 + }, + { + "hidden_norms": [ + 37298.37890625, + 33147848.0, + 214118832.0, + 355022880.0, + 365529568.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.774458682912154e-08, + 3.987353780487979e-10, + 3.904769285689724e-10, + 3.904657153164237e-10, + 3.907260348601227e-10 + ], + "bp_grad_norms_F": [ + 3.509487669361988e-06, + 1.4249152968659473e-08, + 1.3931584774695693e-08, + 1.3929625453101835e-08, + 1.3936028331329453e-08 + ], + "gamma_dfa": 0.11238172389857937, + "acc_eval": 0.314453125, + "loss_eval": 1.9106721878051758, + "epoch": 78 + }, + { + "hidden_norms": [ + 37372.10546875, + 33388374.0, + 215761392.0, + 357596800.0, + 368190304.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.751073300392818e-08, + 3.9374201121766816e-10, + 3.8655822987010424e-10, + 3.866116038420131e-10, + 3.8653891198947576e-10 + ], + "bp_grad_norms_F": [ + 3.537302973199985e-06, + 1.4222394817409167e-08, + 1.3910858243093571e-08, + 1.3908881157931319e-08, + 1.3915280483445258e-08 + ], + "gamma_dfa": 0.11306001050525083, + "acc_eval": 0.322265625, + "loss_eval": 1.9138463735580444, + "epoch": 79 + }, + { + "hidden_norms": [ + 37442.84375, + 33566284.0, + 216908128.0, + 359755968.0, + 370379136.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.704155453007843e-08, + 3.923593672183756e-10, + 3.850708640840139e-10, + 3.8509884170423447e-10, + 3.849042473635933e-10 + ], + "bp_grad_norms_F": [ + 3.509628641040763e-06, + 1.4144676541150147e-08, + 1.3834353218555862e-08, + 1.3832397449675682e-08, + 1.3838723056380786e-08 + ], + "gamma_dfa": 0.11266809623703011, + "acc_eval": 0.3251953125, + "loss_eval": 1.9121947288513184, + "epoch": 80 + }, + { + "hidden_norms": [ + 37512.11328125, + 33717608.0, + 218115872.0, + 361736960.0, + 372400416.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.701832688804643e-08, + 3.917752788851203e-10, + 3.835655681960759e-10, + 3.835243511662867e-10, + 3.835320394607322e-10 + ], + "bp_grad_norms_F": [ + 3.5144942103215726e-06, + 1.4111047441645042e-08, + 1.3798888254257236e-08, + 1.3796943143518092e-08, + 1.3803241216692186e-08 + ], + "gamma_dfa": 0.11281233225781762, + "acc_eval": 0.3193359375, + "loss_eval": 1.9152591228485107, + "epoch": 81 + }, + { + "hidden_norms": [ + 37568.84375, + 33899664.0, + 219258560.0, + 363709504.0, + 374424128.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.695909604559347e-08, + 3.8868031015937277e-10, + 3.823757421805851e-10, + 3.8241659838789133e-10, + 3.8222841558521736e-10 + ], + "bp_grad_norms_F": [ + 3.516150854920852e-06, + 1.40706539752955e-08, + 1.3756586092483758e-08, + 1.375462410635464e-08, + 1.3760891093284044e-08 + ], + "gamma_dfa": 0.11307295318874822, + "acc_eval": 0.326171875, + "loss_eval": 1.9149377346038818, + "epoch": 82 + }, + { + "hidden_norms": [ + 37613.421875, + 34060644.0, + 220322080.0, + 365325472.0, + 376109056.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.71154296583154e-08, + 3.8974332094987574e-10, + 3.834943751446218e-10, + 3.8340422503502225e-10, + 3.8375369548759863e-10 + ], + "bp_grad_norms_F": [ + 3.4982940633199178e-06, + 1.4013506799415154e-08, + 1.370163893454901e-08, + 1.3699707146486162e-08, + 1.3705942158992457e-08 + ], + "gamma_dfa": 0.1128659905607492, + "acc_eval": 0.3212890625, + "loss_eval": 1.912517786026001, + "epoch": 83 + }, + { + "hidden_norms": [ + 37660.46875, + 34177292.0, + 221168784.0, + 366778016.0, + 377600544.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.68943869186478e-08, + 3.894674860394076e-10, + 3.8076572450584933e-10, + 3.8073258434856427e-10, + 3.8100084198688933e-10 + ], + "bp_grad_norms_F": [ + 3.4944750950671732e-06, + 1.397998961039093e-08, + 1.3671985321650482e-08, + 1.3670069520799188e-08, + 1.3676272558882374e-08 + ], + "gamma_dfa": 0.11273636969053769, + "acc_eval": 0.318359375, + "loss_eval": 1.9171113967895508, + "epoch": 84 + }, + { + "hidden_norms": [ + 37701.8671875, + 34327872.0, + 222020640.0, + 368143552.0, + 379001216.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.639802307972786e-08, + 3.87883669628053e-10, + 3.8044753458699176e-10, + 3.804264403495239e-10, + 3.8037359373355173e-10 + ], + "bp_grad_norms_F": [ + 3.4919537483801832e-06, + 1.3943878052202763e-08, + 1.3639727569625393e-08, + 1.3637805551525162e-08, + 1.364400148418099e-08 + ], + "gamma_dfa": 0.11286781356830033, + "acc_eval": 0.328125, + "loss_eval": 1.9123945236206055, + "epoch": 85 + }, + { + "hidden_norms": [ + 37739.8125, + 34429904.0, + 222737072.0, + 369295712.0, + 380185984.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.741821323430486e-08, + 3.8846115213431176e-10, + 3.8069486452130263e-10, + 3.8060576912357647e-10, + 3.809500215279371e-10 + ], + "bp_grad_norms_F": [ + 3.500515958876349e-06, + 1.3945418153582523e-08, + 1.364027113481825e-08, + 1.3638369544821671e-08, + 1.364453350305439e-08 + ], + "gamma_dfa": 0.11293645015939546, + "acc_eval": 0.3154296875, + "loss_eval": 1.917877197265625, + "epoch": 86 + }, + { + "hidden_norms": [ + 37773.1484375, + 34523684.0, + 223309680.0, + 370332384.0, + 381249280.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.685363729275196e-08, + 3.8528755186284513e-10, + 3.7927344598287505e-10, + 3.7934516639026583e-10, + 3.7926364826468273e-10 + ], + "bp_grad_norms_F": [ + 3.4931999834952876e-06, + 1.3911479967987361e-08, + 1.360801249461474e-08, + 1.3606110904618163e-08, + 1.3612289961884017e-08 + ], + "gamma_dfa": 0.11282484548610228, + "acc_eval": 0.322265625, + "loss_eval": 1.9136494398117065, + "epoch": 87 + }, + { + "hidden_norms": [ + 37800.29296875, + 34600436.0, + 223845264.0, + 371228288.0, + 382171744.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.65767956320451e-08, + 3.853606878045923e-10, + 3.7911099259879677e-10, + 3.789283054000947e-10, + 3.791919833684432e-10 + ], + "bp_grad_norms_F": [ + 3.4772997423715424e-06, + 1.3876966242776234e-08, + 1.3575736979021258e-08, + 1.3573847823522556e-08, + 1.3580010893576855e-08 + ], + "gamma_dfa": 0.11266115616490424, + "acc_eval": 0.318359375, + "loss_eval": 1.912358045578003, + "epoch": 88 + }, + { + "hidden_norms": [ + 37822.953125, + 34659448.0, + 224278352.0, + 371994688.0, + 382956800.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.695878340678973e-08, + 3.8400196911148043e-10, + 3.7754030457470833e-10, + 3.775957047036371e-10, + 3.7752789783240814e-10 + ], + "bp_grad_norms_F": [ + 3.488719130473328e-06, + 1.387363113281026e-08, + 1.3571511026100325e-08, + 1.3569623646958462e-08, + 1.3575775170693305e-08 + ], + "gamma_dfa": 0.11286654848299804, + "acc_eval": 0.318359375, + "loss_eval": 1.9152348041534424, + "epoch": 89 + }, + { + "hidden_norms": [ + 37843.71484375, + 34715836.0, + 224633712.0, + 372602496.0, + 383583840.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.682009967562408e-08, + 3.831650552399424e-10, + 3.7603772873318064e-10, + 3.7600736413345714e-10, + 3.763372669052245e-10 + ], + "bp_grad_norms_F": [ + 3.4864976896642474e-06, + 1.3852580416084948e-08, + 1.355203504971314e-08, + 1.3550148558749697e-08, + 1.3556297417949281e-08 + ], + "gamma_dfa": 0.11291119743145828, + "acc_eval": 0.326171875, + "loss_eval": 1.914948582649231, + "epoch": 90 + }, + { + "hidden_norms": [ + 37859.484375, + 34761876.0, + 224938096.0, + 373110784.0, + 384106720.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.677319674963655e-08, + 3.8410433167435087e-10, + 3.768680645332978e-10, + 3.768474976517666e-10, + 3.767945122579164e-10 + ], + "bp_grad_norms_F": [ + 3.480063014649204e-06, + 1.3833711953736838e-08, + 1.3534608989118624e-08, + 1.3532734044474637e-08, + 1.3538858922856889e-08 + ], + "gamma_dfa": 0.1127637956833496, + "acc_eval": 0.322265625, + "loss_eval": 1.9153952598571777, + "epoch": 91 + }, + { + "hidden_norms": [ + 37872.0625, + 34797108.0, + 225202544.0, + 373570400.0, + 384579200.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.67909034746117e-08, + 3.821318816932262e-10, + 3.753052590926842e-10, + 3.7535435870594824e-10, + 3.7532754681990355e-10 + ], + "bp_grad_norms_F": [ + 3.4843556022678968e-06, + 1.3827068379157481e-08, + 1.352985190550271e-08, + 1.3527971631788205e-08, + 1.3534107168311493e-08 + ], + "gamma_dfa": 0.1129197701375233, + "acc_eval": 0.318359375, + "loss_eval": 1.9156945943832397, + "epoch": 92 + }, + { + "hidden_norms": [ + 37881.54296875, + 34826116.0, + 225403072.0, + 373889952.0, + 384906848.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.663099583192889e-08, + 3.844494445015556e-10, + 3.765425748980533e-10, + 3.7651176620911997e-10, + 3.7661743168548867e-10 + ], + "bp_grad_norms_F": [ + 3.480702616798226e-06, + 1.382177039488397e-08, + 1.3523890451949683e-08, + 1.3522016395484115e-08, + 1.3528141273866368e-08 + ], + "gamma_dfa": 0.11285195982236473, + "acc_eval": 0.322265625, + "loss_eval": 1.9148646593093872, + "epoch": 93 + }, + { + "hidden_norms": [ + 37889.18359375, + 34847784.0, + 225551344.0, + 374143840.0, + 385168448.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.623226767032975e-08, + 3.819731198007048e-10, + 3.7512581929632915e-10, + 3.752123889366743e-10, + 3.7511962980296687e-10 + ], + "bp_grad_norms_F": [ + 3.4782924558385275e-06, + 1.3813751031932497e-08, + 1.3516644692401769e-08, + 1.3514763530508844e-08, + 1.3520896402496874e-08 + ], + "gamma_dfa": 0.11281965267244232, + "acc_eval": 0.318359375, + "loss_eval": 1.9142093658447266, + "epoch": 94 + }, + { + "hidden_norms": [ + 37895.046875, + 34865808.0, + 225670928.0, + 374345440.0, + 385375392.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.64825137164371e-08, + 3.829765116147854e-10, + 3.7528671836817296e-10, + 3.7535685670775365e-10, + 3.752768373832538e-10 + ], + "bp_grad_norms_F": [ + 3.4792733458743896e-06, + 1.3809607679604596e-08, + 1.3512363672418815e-08, + 1.3510485175061149e-08, + 1.351661271797866e-08 + ], + "gamma_dfa": 0.11288163481003721, + "acc_eval": 0.32421875, + "loss_eval": 1.9146695137023926, + "epoch": 95 + }, + { + "hidden_norms": [ + 37898.87109375, + 34878456.0, + 225750400.0, + 374473248.0, + 385506496.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.652722817079848e-08, + 3.8302755411834255e-10, + 3.759152988891401e-10, + 3.7595143664859165e-10, + 3.7588568368995823e-10 + ], + "bp_grad_norms_F": [ + 3.480078930806485e-06, + 1.3808159060602065e-08, + 1.3511034957502943e-08, + 1.3509157348323697e-08, + 1.351528045034911e-08 + ], + "gamma_dfa": 0.1128929610213163, + "acc_eval": 0.3203125, + "loss_eval": 1.9147298336029053, + "epoch": 96 + }, + { + "hidden_norms": [ + 37900.7109375, + 34885860.0, + 225787696.0, + 374537472.0, + 385572896.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.630104820715133e-08, + 3.8308795025088216e-10, + 3.7579228617801164e-10, + 3.7582850720419003e-10, + 3.7576297629016153e-10 + ], + "bp_grad_norms_F": [ + 3.4770955608109944e-06, + 1.3803015619373582e-08, + 1.3505847995531894e-08, + 1.3503973050887907e-08, + 1.3510093488378061e-08 + ], + "gamma_dfa": 0.11285188281362935, + "acc_eval": 0.3212890625, + "loss_eval": 1.9143996238708496, + "epoch": 97 + }, + { + "hidden_norms": [ + 37902.46875, + 34890740.0, + 225820192.0, + 374593792.0, + 385630976.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.624973991620209e-08, + 3.8267702895389277e-10, + 3.7545791475857015e-10, + 3.7555664134103495e-10, + 3.75430270205257e-10 + ], + "bp_grad_norms_F": [ + 3.476953224890167e-06, + 1.3801756182374447e-08, + 1.350452816240022e-08, + 1.3502653217756233e-08, + 1.3508774543424806e-08 + ], + "gamma_dfa": 0.11284657929081732, + "acc_eval": 0.3203125, + "loss_eval": 1.9143402576446533, + "epoch": 98 + }, + { + "hidden_norms": [ + 37903.22265625, + 34893256.0, + 225836736.0, + 374620576.0, + 385658624.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.627380599866228e-08, + 3.8272779390169376e-10, + 3.7550038078926207e-10, + 3.7559910737172686e-10, + 3.7547268072479767e-10 + ], + "bp_grad_norms_F": [ + 3.477006657703896e-06, + 1.3801344067587706e-08, + 1.3504034335198867e-08, + 1.350215939055488e-08, + 1.3508279828045033e-08 + ], + "gamma_dfa": 0.11284785682073561, + "acc_eval": 0.3203125, + "loss_eval": 1.9143691062927246, + "epoch": 99 + }, + { + "hidden_norms": [ + 37903.25, + 34893376.0, + 225837280.0, + 374621408.0, + 385659456.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.626758874972438e-08, + 3.826984007471168e-10, + 3.755481758904722e-10, + 3.756469302285126e-10, + 3.755204758260078e-10 + ], + "bp_grad_norms_F": [ + 3.476960500847781e-06, + 1.3801311204986177e-08, + 1.3503997919883659e-08, + 1.3502122975239672e-08, + 1.3508243412729826e-08 + ], + "gamma_dfa": 0.11284651984533411, + "acc_eval": 0.3203125, + "loss_eval": 1.9143500328063965, + "epoch": 100 + } + ] +}
\ No newline at end of file |
