{ "config": { "output_dir": "results/snapshot_evolution_v2", "epochs": 100, "lr": 0.001, "wd": 0.01, "seed": 123, "depth": 4, "d_hidden": 256, "log_every": 1 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.690464973449707, 8.719978332519531, 8.73093318939209, 8.75937271118164, 8.790542602539062 ], "bp_grad_norms_per_sample_med": [ 0.0009977436857298017, 0.000992251792922616, 0.0009848480112850666, 0.0009761073160916567, 0.0009735578205436468 ], "bp_grad_norms_F": [ 0.035340383648872375, 0.03499162197113037, 0.03454425558447838, 0.034113530069589615, 0.033874060958623886 ], "gamma_dfa": NaN, "acc_eval": 0.095703125, "loss_eval": 2.486203908920288, "epoch": 0 }, { "hidden_norms": [ 78.8471908569336, 81.27874755859375, 85.74082946777344, 93.0085678100586, 99.78337860107422 ], "bp_grad_norms_per_sample_med": [ 5.44870927114971e-05, 5.06363830936607e-05, 4.9749945901567116e-05, 5.010423774365336e-05, 5.131187572260387e-05 ], "bp_grad_norms_F": [ 0.0025542855728417635, 0.0021727080456912518, 0.002010831143707037, 0.0019116367911919951, 0.0019338354468345642 ], "gamma_dfa": NaN, "acc_eval": 0.396484375, "loss_eval": 1.6637382507324219, "epoch": 1 }, { "hidden_norms": [ 94.79721069335938, 98.6406021118164, 103.38369750976562, 111.4940185546875, 118.88549041748047 ], "bp_grad_norms_per_sample_med": [ 4.842087219003588e-05, 4.405825529829599e-05, 4.263824666850269e-05, 4.2027873860206455e-05, 4.283937960281037e-05 ], "bp_grad_norms_F": [ 0.0020658739376813173, 0.001806268934160471, 0.001665781601332128, 0.0015872427029535174, 0.0015909546054899693 ], "gamma_dfa": NaN, "acc_eval": 0.4541015625, "loss_eval": 1.5350896120071411, "epoch": 2 }, { "hidden_norms": [ 112.59109497070312, 116.00851440429688, 118.50328063964844, 125.58804321289062, 132.86842346191406 ], "bp_grad_norms_per_sample_med": [ 4.3564141378737986e-05, 4.136884308536537e-05, 4.064830864081159e-05, 3.9523682062281296e-05, 3.8838741602376103e-05 ], "bp_grad_norms_F": [ 0.00200729351490736, 0.001785867614671588, 0.0016562910750508308, 0.0015452943043783307, 0.0015010037459433079 ], "gamma_dfa": NaN, "acc_eval": 0.4814453125, "loss_eval": 1.449176549911499, "epoch": 3 }, { "hidden_norms": [ 124.81511688232422, 128.57049560546875, 129.71421813964844, 136.4766387939453, 142.1854705810547 ], "bp_grad_norms_per_sample_med": [ 4.382780389278196e-05, 4.2459021642571315e-05, 4.143684418522753e-05, 4.0614067984279245e-05, 3.921420648111962e-05 ], "bp_grad_norms_F": [ 0.0018197334138676524, 0.0016814853297546506, 0.0015934663824737072, 0.0015063106548041105, 0.0014485444407910109 ], "gamma_dfa": NaN, "acc_eval": 0.4970703125, "loss_eval": 1.4218697547912598, "epoch": 4 }, { "hidden_norms": [ 138.24440002441406, 140.13018798828125, 141.3839874267578, 147.2488555908203, 155.097412109375 ], "bp_grad_norms_per_sample_med": [ 4.045376044814475e-05, 4.011149940197356e-05, 3.9452468627132475e-05, 3.831404319498688e-05, 3.721412576851435e-05 ], "bp_grad_norms_F": [ 0.0017204430187121034, 0.0016258049290627241, 0.001551075023598969, 0.0014644934562966228, 0.0013933938462287188 ], "gamma_dfa": NaN, "acc_eval": 0.5078125, "loss_eval": 1.3836241960525513, "epoch": 5 }, { "hidden_norms": [ 152.11605834960938, 153.1806182861328, 153.2488555908203, 159.2217559814453, 167.07318115234375 ], "bp_grad_norms_per_sample_med": [ 3.981084591941908e-05, 3.969454701291397e-05, 3.9165588532341644e-05, 3.808845940511674e-05, 3.58163051714655e-05 ], "bp_grad_norms_F": [ 0.0017226944910362363, 0.001611364888958633, 0.0015574879944324493, 0.001471089432016015, 0.001374671934172511 ], "gamma_dfa": NaN, "acc_eval": 0.525390625, "loss_eval": 1.372281551361084, "epoch": 6 }, { "hidden_norms": [ 161.75347900390625, 163.58787536621094, 163.35731506347656, 170.1693115234375, 177.47879028320312 ], "bp_grad_norms_per_sample_med": [ 3.749227471416816e-05, 3.707691575982608e-05, 3.776738958549686e-05, 3.692766040330753e-05, 3.5146917070960626e-05 ], "bp_grad_norms_F": [ 0.0016339722787961364, 0.00156014587264508, 0.0015048144850879908, 0.00141648028511554, 0.0013256004313006997 ], "gamma_dfa": NaN, "acc_eval": 0.515625, "loss_eval": 1.345876693725586, "epoch": 7 }, { "hidden_norms": [ 171.66441345214844, 171.10499572753906, 169.24270629882812, 175.52674865722656, 182.4739990234375 ], "bp_grad_norms_per_sample_med": [ 3.675510379252955e-05, 3.6888646718580276e-05, 3.695035775308497e-05, 3.644685784820467e-05, 3.359343099873513e-05 ], "bp_grad_norms_F": [ 0.0016642085975036025, 0.0015915494877845049, 0.0015412021894007921, 0.0014428672147914767, 0.0013226643204689026 ], "gamma_dfa": NaN, "acc_eval": 0.548828125, "loss_eval": 1.323807954788208, "epoch": 8 }, { "hidden_norms": [ 177.58766174316406, 178.5358123779297, 176.316650390625, 182.18365478515625, 188.81033325195312 ], "bp_grad_norms_per_sample_med": [ 3.550657493178733e-05, 3.561190533218905e-05, 3.632329753600061e-05, 3.5655833926284686e-05, 3.342977652209811e-05 ], "bp_grad_norms_F": [ 0.0016174933407455683, 0.0015753052430227399, 0.0015375673538073897, 0.001461501931771636, 0.0013270385097712278 ], "gamma_dfa": NaN, "acc_eval": 0.54296875, "loss_eval": 1.323765754699707, "epoch": 9 }, { "hidden_norms": [ 186.0078125, 185.2810821533203, 182.9329833984375, 188.10736083984375, 195.3680877685547 ], "bp_grad_norms_per_sample_med": [ 3.5615968954516575e-05, 3.5252433008281514e-05, 3.600740819820203e-05, 3.5232467780588195e-05, 3.2765579817350954e-05 ], "bp_grad_norms_F": [ 0.0015362550038844347, 0.001510681351646781, 0.0014847773127257824, 0.0014146054163575172, 0.00128385319840163 ], "gamma_dfa": NaN, "acc_eval": 0.544921875, "loss_eval": 1.2933119535446167, "epoch": 10 }, { "hidden_norms": [ 193.46343994140625, 194.1528778076172, 190.9546661376953, 196.03440856933594, 201.5336151123047 ], "bp_grad_norms_per_sample_med": [ 3.449141877354123e-05, 3.581260534701869e-05, 3.6061541322851554e-05, 3.5576940717874095e-05, 3.29486902046483e-05 ], "bp_grad_norms_F": [ 0.0015161881456151605, 0.0014996343525126576, 0.001473701442591846, 0.0013998147333040833, 0.0012604170478880405 ], "gamma_dfa": NaN, "acc_eval": 0.5556640625, "loss_eval": 1.2653318643569946, "epoch": 11 }, { "hidden_norms": [ 200.17047119140625, 198.5863037109375, 196.08795166015625, 200.61297607421875, 208.13084411621094 ], "bp_grad_norms_per_sample_med": [ 3.377814937266521e-05, 3.471539093879983e-05, 3.4731467167148367e-05, 3.4925535146612674e-05, 3.2187374017667025e-05 ], "bp_grad_norms_F": [ 0.0014635181287303567, 0.0014519579708576202, 0.001435206620953977, 0.0013784168986603618, 0.0012511539971455932 ], "gamma_dfa": NaN, "acc_eval": 0.546875, "loss_eval": 1.2704923152923584, "epoch": 12 }, { "hidden_norms": [ 203.8260955810547, 203.86688232421875, 200.01004028320312, 204.2325439453125, 211.52891540527344 ], "bp_grad_norms_per_sample_med": [ 3.5213015507906675e-05, 3.635779648902826e-05, 3.70470697816927e-05, 3.6254354199627414e-05, 3.324731005704962e-05 ], "bp_grad_norms_F": [ 0.0014951277989894152, 0.0014758999459445477, 0.0014606777112931013, 0.0014066072180867195, 0.0012636061292141676 ], "gamma_dfa": NaN, "acc_eval": 0.533203125, "loss_eval": 1.2718024253845215, "epoch": 13 }, { "hidden_norms": [ 211.8421630859375, 209.4982147216797, 206.025634765625, 210.11019897460938, 216.48568725585938 ], "bp_grad_norms_per_sample_med": [ 3.425328395678662e-05, 3.4357526601525024e-05, 3.5312823456479236e-05, 3.490734161459841e-05, 3.1354313250631094e-05 ], "bp_grad_norms_F": [ 0.0015326166758313775, 0.0015238082269206643, 0.0015112065011635423, 0.0014346316456794739, 0.0012716582277789712 ], "gamma_dfa": NaN, "acc_eval": 0.5595703125, "loss_eval": 1.2611415386199951, "epoch": 14 }, { "hidden_norms": [ 220.0836639404297, 218.3101806640625, 212.22019958496094, 216.97576904296875, 224.16114807128906 ], "bp_grad_norms_per_sample_med": [ 3.320865289424546e-05, 3.393836959730834e-05, 3.4554454032331705e-05, 3.380324415047653e-05, 3.0850649636704475e-05 ], "bp_grad_norms_F": [ 0.0015296684578061104, 0.0015227487310767174, 0.0015054721152409911, 0.0014223494799807668, 0.0012559365713968873 ], "gamma_dfa": NaN, "acc_eval": 0.5615234375, "loss_eval": 1.2511423826217651, "epoch": 15 }, { "hidden_norms": [ 223.3075714111328, 219.4958953857422, 213.75701904296875, 219.41580200195312, 223.92572021484375 ], "bp_grad_norms_per_sample_med": [ 3.406661926419474e-05, 3.485638080746867e-05, 3.5736342397285625e-05, 3.5617544199340045e-05, 3.142367859254591e-05 ], "bp_grad_norms_F": [ 0.001539028249680996, 0.0015256714541465044, 0.0015207449905574322, 0.001449243980459869, 0.0012804584112018347 ], "gamma_dfa": NaN, "acc_eval": 0.5478515625, "loss_eval": 1.2619048357009888, "epoch": 16 }, { "hidden_norms": [ 229.43417358398438, 224.83290100097656, 218.015869140625, 221.56915283203125, 228.59274291992188 ], "bp_grad_norms_per_sample_med": [ 3.325551369925961e-05, 3.411810757825151e-05, 3.506721623125486e-05, 3.451627344475128e-05, 3.0976541893323883e-05 ], "bp_grad_norms_F": [ 0.001564670237712562, 0.0015591747360303998, 0.0015565806534141302, 0.001464744214899838, 0.0012746548745781183 ], "gamma_dfa": NaN, "acc_eval": 0.5498046875, "loss_eval": 1.2594949007034302, "epoch": 17 }, { "hidden_norms": [ 233.65724182128906, 228.65892028808594, 223.14169311523438, 227.2765350341797, 233.75588989257812 ], "bp_grad_norms_per_sample_med": [ 3.4493146813474596e-05, 3.510132592055015e-05, 3.669387297122739e-05, 3.577200186555274e-05, 3.192189251421951e-05 ], "bp_grad_norms_F": [ 0.0015125939389690757, 0.0015123466728255153, 0.0015171029372140765, 0.0014489478198811412, 0.001258584321476519 ], "gamma_dfa": NaN, "acc_eval": 0.5595703125, "loss_eval": 1.2556639909744263, "epoch": 18 }, { "hidden_norms": [ 237.43548583984375, 232.39987182617188, 227.10951232910156, 230.72291564941406, 237.13616943359375 ], "bp_grad_norms_per_sample_med": [ 3.340727198519744e-05, 3.450348594924435e-05, 3.5213739465689287e-05, 3.445050970185548e-05, 3.137766179861501e-05 ], "bp_grad_norms_F": [ 0.0015336342621594667, 0.0015343877021223307, 0.0015299322549253702, 0.0014644783223047853, 0.0012699750950559974 ], "gamma_dfa": NaN, "acc_eval": 0.560546875, "loss_eval": 1.2415752410888672, "epoch": 19 }, { "hidden_norms": [ 240.3662109375, 235.49240112304688, 227.54061889648438, 233.16600036621094, 239.60838317871094 ], "bp_grad_norms_per_sample_med": [ 3.387282777111977e-05, 3.518611265462823e-05, 3.594699956011027e-05, 3.514933632686734e-05, 3.159138941555284e-05 ], "bp_grad_norms_F": [ 0.0015161214396357536, 0.0015244479291141033, 0.0015337818767875433, 0.0014538948889821768, 0.0012562318006530404 ], "gamma_dfa": NaN, "acc_eval": 0.560546875, "loss_eval": 1.2436577081680298, "epoch": 20 }, { "hidden_norms": [ 246.6840057373047, 239.0929412841797, 228.7230682373047, 233.1182403564453, 237.92440795898438 ], "bp_grad_norms_per_sample_med": [ 3.365568773006089e-05, 3.4782005968736485e-05, 3.604988887673244e-05, 3.48928188032005e-05, 3.140935586998239e-05 ], "bp_grad_norms_F": [ 0.0015826384769752622, 0.0015907500637695193, 0.0016004826175048947, 0.0015078946016728878, 0.0012762312544509768 ], "gamma_dfa": NaN, "acc_eval": 0.578125, "loss_eval": 1.2292213439941406, "epoch": 21 }, { "hidden_norms": [ 248.95265197753906, 241.59408569335938, 233.2073211669922, 236.39898681640625, 243.02566528320312 ], "bp_grad_norms_per_sample_med": [ 3.3556283597135916e-05, 3.463738539721817e-05, 3.5712662793230265e-05, 3.4992117434740067e-05, 3.1405961635755375e-05 ], "bp_grad_norms_F": [ 0.0015417077811434865, 0.0015624086372554302, 0.00158181122969836, 0.0014982762513682246, 0.001269534695893526 ], "gamma_dfa": NaN, "acc_eval": 0.5712890625, "loss_eval": 1.201985239982605, "epoch": 22 }, { "hidden_norms": [ 250.6766815185547, 243.67706298828125, 236.90567016601562, 240.1038360595703, 244.89207458496094 ], "bp_grad_norms_per_sample_med": [ 3.3543499739607796e-05, 3.4865890484070405e-05, 3.564134021871723e-05, 3.4787921322276816e-05, 3.112335252808407e-05 ], "bp_grad_norms_F": [ 0.0015237597981467843, 0.0015382410492748022, 0.0015483599854633212, 0.0014793339651077986, 0.0012637422187253833 ], "gamma_dfa": NaN, "acc_eval": 0.55859375, "loss_eval": 1.2245514392852783, "epoch": 23 }, { "hidden_norms": [ 256.1240539550781, 248.83609008789062, 240.2549285888672, 243.1914825439453, 248.11964416503906 ], "bp_grad_norms_per_sample_med": [ 3.322990596643649e-05, 3.523347186273895e-05, 3.6828067095484585e-05, 3.5215769457863644e-05, 3.133456266368739e-05 ], "bp_grad_norms_F": [ 0.0015543467598035932, 0.0015818241517990828, 0.0015992531552910805, 0.001527936663478613, 0.0012819069670513272 ], "gamma_dfa": NaN, "acc_eval": 0.5732421875, "loss_eval": 1.2261133193969727, "epoch": 24 }, { "hidden_norms": [ 256.9990234375, 248.78497314453125, 239.55239868164062, 243.13818359375, 249.48153686523438 ], "bp_grad_norms_per_sample_med": [ 3.39320904458873e-05, 3.600086711230688e-05, 3.7119287298992276e-05, 3.6292254662839696e-05, 3.193991506122984e-05 ], "bp_grad_norms_F": [ 0.0015332578914240003, 0.00156042305752635, 0.001574728754349053, 0.0015015782555565238, 0.0012670031283050776 ], "gamma_dfa": NaN, "acc_eval": 0.5771484375, "loss_eval": 1.2080682516098022, "epoch": 25 }, { "hidden_norms": [ 260.4493103027344, 251.83595275878906, 240.95025634765625, 242.58055114746094, 247.42816162109375 ], "bp_grad_norms_per_sample_med": [ 3.4877586585935205e-05, 3.68267938029021e-05, 3.760240360861644e-05, 3.5770553949987516e-05, 3.202233710908331e-05 ], "bp_grad_norms_F": [ 0.0016203002305701375, 0.0016500651836395264, 0.0016584799159318209, 0.0015617734752595425, 0.00129653827752918 ], "gamma_dfa": NaN, "acc_eval": 0.5576171875, "loss_eval": 1.2154628038406372, "epoch": 26 }, { "hidden_norms": [ 263.1241760253906, 253.4596405029297, 243.6095733642578, 245.4304656982422, 250.32362365722656 ], "bp_grad_norms_per_sample_med": [ 3.480416853562929e-05, 3.640647264546715e-05, 3.738802479347214e-05, 3.5808730899589136e-05, 3.25721557601355e-05 ], "bp_grad_norms_F": [ 0.0015986696816980839, 0.0016261462587863207, 0.0016554947942495346, 0.0015633245930075645, 0.0013003128115087748 ], "gamma_dfa": NaN, "acc_eval": 0.5634765625, "loss_eval": 1.2160842418670654, "epoch": 27 }, { "hidden_norms": [ 266.5273132324219, 256.0182189941406, 245.50253295898438, 246.18280029296875, 251.716064453125 ], "bp_grad_norms_per_sample_med": [ 3.359848051331937e-05, 3.572113564587198e-05, 3.695064515341073e-05, 3.506165376165882e-05, 3.114769424428232e-05 ], "bp_grad_norms_F": [ 0.0016088238917291164, 0.0016375494888052344, 0.0016567507991567254, 0.0015764845302328467, 0.001285399659536779 ], "gamma_dfa": NaN, "acc_eval": 0.58203125, "loss_eval": 1.2021496295928955, "epoch": 28 }, { "hidden_norms": [ 267.4769592285156, 258.21368408203125, 248.0418701171875, 248.66949462890625, 253.77452087402344 ], "bp_grad_norms_per_sample_med": [ 3.400501736905426e-05, 3.611011925386265e-05, 3.7168374547036365e-05, 3.569516775314696e-05, 3.031879896298051e-05 ], "bp_grad_norms_F": [ 0.0015880028950050473, 0.0016197538934648037, 0.001652923645451665, 0.0015723761171102524, 0.00128253607545048 ], "gamma_dfa": NaN, "acc_eval": 0.5771484375, "loss_eval": 1.2029783725738525, "epoch": 29 }, { "hidden_norms": [ 268.6047668457031, 256.4200744628906, 246.27796936035156, 246.51229858398438, 250.08482360839844 ], "bp_grad_norms_per_sample_med": [ 3.425245813559741e-05, 3.6405861465027556e-05, 3.752295742742717e-05, 3.6318160709924996e-05, 3.103434937656857e-05 ], "bp_grad_norms_F": [ 0.0017358324257656932, 0.0017647893400862813, 0.0017767423996701837, 0.0016745994798839092, 0.0013456137385219336 ], "gamma_dfa": NaN, "acc_eval": 0.5859375, "loss_eval": 1.2118260860443115, "epoch": 30 }, { "hidden_norms": [ 270.9348449707031, 260.40045166015625, 250.72512817382812, 251.9379425048828, 254.6614227294922 ], "bp_grad_norms_per_sample_med": [ 3.491883762762882e-05, 3.647417179308832e-05, 3.8068057619966567e-05, 3.653564635897055e-05, 3.172537253703922e-05 ], "bp_grad_norms_F": [ 0.0015994011191651225, 0.0016339519061148167, 0.0016624036943539977, 0.0015806201845407486, 0.0013034256407991052 ], "gamma_dfa": NaN, "acc_eval": 0.5849609375, "loss_eval": 1.1830923557281494, "epoch": 31 }, { "hidden_norms": [ 274.6016845703125, 262.9326477050781, 250.766357421875, 252.1786346435547, 254.2251739501953 ], "bp_grad_norms_per_sample_med": [ 3.4794014936778694e-05, 3.6746245314134285e-05, 3.771794217755087e-05, 3.6664638173533604e-05, 3.1814517569728196e-05 ], "bp_grad_norms_F": [ 0.0016584239201620221, 0.0016917918110266328, 0.001726189162582159, 0.0016276866663247347, 0.0013194811763241887 ], "gamma_dfa": NaN, "acc_eval": 0.578125, "loss_eval": 1.1851024627685547, "epoch": 32 }, { "hidden_norms": [ 273.59783935546875, 261.92218017578125, 250.27320861816406, 251.19146728515625, 255.70233154296875 ], "bp_grad_norms_per_sample_med": [ 3.505383210722357e-05, 3.6710382119053975e-05, 3.839766577584669e-05, 3.708387885126285e-05, 3.1251351174432784e-05 ], "bp_grad_norms_F": [ 0.0016781548038125038, 0.0017169808270409703, 0.0017399545758962631, 0.0016386040952056646, 0.0013246783055365086 ], "gamma_dfa": NaN, "acc_eval": 0.5712890625, "loss_eval": 1.1789460182189941, "epoch": 33 }, { "hidden_norms": [ 274.9112854003906, 262.3539123535156, 251.67474365234375, 253.08824157714844, 255.4647979736328 ], "bp_grad_norms_per_sample_med": [ 3.4545508242445067e-05, 3.622366421041079e-05, 3.7300182157196105e-05, 3.594972440623678e-05, 3.1557658076053485e-05 ], "bp_grad_norms_F": [ 0.001666227588430047, 0.0016955926548689604, 0.0017251977697014809, 0.0016294753877446055, 0.001327820005826652 ], "gamma_dfa": NaN, "acc_eval": 0.583984375, "loss_eval": 1.1757192611694336, "epoch": 34 }, { "hidden_norms": [ 273.9092712402344, 261.26507568359375, 250.60923767089844, 250.5943145751953, 253.19862365722656 ], "bp_grad_norms_per_sample_med": [ 3.532320988597348e-05, 3.7557252653641626e-05, 3.882365126628429e-05, 3.676790583995171e-05, 3.2376574381487444e-05 ], "bp_grad_norms_F": [ 0.001686039031483233, 0.0017200085567310452, 0.0017563666915521026, 0.0016565105179324746, 0.0013397492002695799 ], "gamma_dfa": NaN, "acc_eval": 0.5986328125, "loss_eval": 1.1719229221343994, "epoch": 35 }, { "hidden_norms": [ 275.9344177246094, 265.1002502441406, 253.2598114013672, 253.86024475097656, 257.8154296875 ], "bp_grad_norms_per_sample_med": [ 3.419027416384779e-05, 3.54782423528377e-05, 3.770734474528581e-05, 3.707608630065806e-05, 3.1706651498097926e-05 ], "bp_grad_norms_F": [ 0.0016564616234973073, 0.001694328966550529, 0.001729298266582191, 0.0016409243689849973, 0.0013242866843938828 ], "gamma_dfa": NaN, "acc_eval": 0.59375, "loss_eval": 1.169456958770752, "epoch": 36 }, { "hidden_norms": [ 277.0843200683594, 263.2900390625, 250.48553466796875, 251.51341247558594, 253.14413452148438 ], "bp_grad_norms_per_sample_med": [ 3.5850312997354195e-05, 3.7839381548110396e-05, 3.925598502974026e-05, 3.7184508983045816e-05, 3.174091762048192e-05 ], "bp_grad_norms_F": [ 0.0017717990558594465, 0.0018099851440638304, 0.0018417692044749856, 0.0017209915677085519, 0.0013732420047745109 ], "gamma_dfa": NaN, "acc_eval": 0.5869140625, "loss_eval": 1.1764099597930908, "epoch": 37 }, { "hidden_norms": [ 280.2084655761719, 265.3043518066406, 254.26673889160156, 253.3932342529297, 255.91488647460938 ], "bp_grad_norms_per_sample_med": [ 3.4716471418505535e-05, 3.675218249554746e-05, 3.84828781534452e-05, 3.653839303296991e-05, 3.1539821065962315e-05 ], "bp_grad_norms_F": [ 0.00171388138551265, 0.0017648075008764863, 0.00180675252340734, 0.0016973463352769613, 0.0013539392966777086 ], "gamma_dfa": NaN, "acc_eval": 0.591796875, "loss_eval": 1.1670037508010864, "epoch": 38 }, { "hidden_norms": [ 278.0702209472656, 264.4510498046875, 250.75350952148438, 248.73284912109375, 253.1072540283203 ], "bp_grad_norms_per_sample_med": [ 3.694290717248805e-05, 3.843691956717521e-05, 3.982238922617398e-05, 3.8299614971037954e-05, 3.253731847507879e-05 ], "bp_grad_norms_F": [ 0.0017997974064201117, 0.0018521619495004416, 0.0018853276269510388, 0.001754313474521041, 0.0013789198128506541 ], "gamma_dfa": NaN, "acc_eval": 0.576171875, "loss_eval": 1.168372631072998, "epoch": 39 }, { "hidden_norms": [ 279.5745849609375, 265.3549499511719, 252.89109802246094, 250.0029296875, 251.57737731933594 ], "bp_grad_norms_per_sample_med": [ 3.5274497349746525e-05, 3.741122054634616e-05, 3.8946731365285814e-05, 3.7627731217071414e-05, 3.1920495530357584e-05 ], "bp_grad_norms_F": [ 0.0017959685064852238, 0.0018515808042138815, 0.001886399113573134, 0.0017732164124026895, 0.001389715587720275 ], "gamma_dfa": NaN, "acc_eval": 0.5966796875, "loss_eval": 1.1735193729400635, "epoch": 40 }, { "hidden_norms": [ 280.56402587890625, 265.1068115234375, 251.912353515625, 248.08627319335938, 250.21177673339844 ], "bp_grad_norms_per_sample_med": [ 3.672741513582878e-05, 3.8823065551696345e-05, 4.041267675347626e-05, 3.835778989014216e-05, 3.2424144592368975e-05 ], "bp_grad_norms_F": [ 0.0018404219299554825, 0.0018969813827425241, 0.0019448500825092196, 0.0018052044324576855, 0.0014045372372493148 ], "gamma_dfa": NaN, "acc_eval": 0.5966796875, "loss_eval": 1.163725733757019, "epoch": 41 }, { "hidden_norms": [ 281.2812194824219, 266.5726623535156, 253.18124389648438, 252.3292694091797, 254.1314697265625 ], "bp_grad_norms_per_sample_med": [ 3.6245146475266665e-05, 3.849809218081646e-05, 4.034954326925799e-05, 3.857027695630677e-05, 3.267046849941835e-05 ], "bp_grad_norms_F": [ 0.0018043599557131529, 0.0018654613522812724, 0.0018976799910888076, 0.0017763315699994564, 0.0013986497651785612 ], "gamma_dfa": NaN, "acc_eval": 0.5830078125, "loss_eval": 1.172363519668579, "epoch": 42 }, { "hidden_norms": [ 278.3638916015625, 264.4734802246094, 250.60198974609375, 248.59568786621094, 249.39353942871094 ], "bp_grad_norms_per_sample_med": [ 3.7236037314869463e-05, 3.946686410927214e-05, 4.103714309167117e-05, 3.970286707044579e-05, 3.281752287875861e-05 ], "bp_grad_norms_F": [ 0.0018646781099960208, 0.0019272645004093647, 0.0019672266207635403, 0.001839098404161632, 0.0014395405305549502 ], "gamma_dfa": NaN, "acc_eval": 0.5830078125, "loss_eval": 1.1776624917984009, "epoch": 43 }, { "hidden_norms": [ 280.8514099121094, 269.1718444824219, 253.03790283203125, 251.60220336914062, 251.88168334960938 ], "bp_grad_norms_per_sample_med": [ 3.689880759338848e-05, 3.937961082556285e-05, 4.092283779755235e-05, 3.866894985549152e-05, 3.262344398535788e-05 ], "bp_grad_norms_F": [ 0.0018725661793723702, 0.0019201217219233513, 0.0019532060250639915, 0.0018317755311727524, 0.001439971849322319 ], "gamma_dfa": NaN, "acc_eval": 0.595703125, "loss_eval": 1.1693906784057617, "epoch": 44 }, { "hidden_norms": [ 280.3335266113281, 263.89471435546875, 253.01638793945312, 250.5576171875, 251.4005889892578 ], "bp_grad_norms_per_sample_med": [ 3.6666475352831185e-05, 3.875952461385168e-05, 4.0531358536100015e-05, 3.9068203477654606e-05, 3.450641088420525e-05 ], "bp_grad_norms_F": [ 0.0018578553572297096, 0.0019184533739462495, 0.001965942559763789, 0.0018550093518570065, 0.0014542803401127458 ], "gamma_dfa": NaN, "acc_eval": 0.5732421875, "loss_eval": 1.1839377880096436, "epoch": 45 }, { "hidden_norms": [ 280.3553771972656, 263.3617248535156, 248.94859313964844, 246.9832000732422, 246.24644470214844 ], "bp_grad_norms_per_sample_med": [ 3.8412734284065664e-05, 4.001844354206696e-05, 4.220755727146752e-05, 4.0393635572399944e-05, 3.391467180335894e-05 ], "bp_grad_norms_F": [ 0.001917686895467341, 0.0019766101613640785, 0.0020170181524008512, 0.0018900329014286399, 0.001476101577281952 ], "gamma_dfa": NaN, "acc_eval": 0.6005859375, "loss_eval": 1.1689397096633911, "epoch": 46 }, { "hidden_norms": [ 278.8861389160156, 263.3866882324219, 249.24301147460938, 246.43963623046875, 246.34503173828125 ], "bp_grad_norms_per_sample_med": [ 3.77853139070794e-05, 4.044857996632345e-05, 4.182702468824573e-05, 4.050548523082398e-05, 3.3606509532546625e-05 ], "bp_grad_norms_F": [ 0.0019284948939457536, 0.001992136472836137, 0.0020461773965507746, 0.001900508883409202, 0.001466717105358839 ], "gamma_dfa": NaN, "acc_eval": 0.599609375, "loss_eval": 1.1585946083068848, "epoch": 47 }, { "hidden_norms": [ 279.963623046875, 263.52496337890625, 249.6890869140625, 245.60646057128906, 245.52540588378906 ], "bp_grad_norms_per_sample_med": [ 3.724947964656167e-05, 3.964625648222864e-05, 4.1545175918145105e-05, 3.953047780669294e-05, 3.275729977758601e-05 ], "bp_grad_norms_F": [ 0.0019616533536463976, 0.002027863636612892, 0.0020759752951562405, 0.0019283785950392485, 0.001484199776314199 ], "gamma_dfa": NaN, "acc_eval": 0.6123046875, "loss_eval": 1.157920002937317, "epoch": 48 }, { "hidden_norms": [ 279.7983093261719, 263.42352294921875, 247.6257781982422, 244.5139923095703, 242.93429565429688 ], "bp_grad_norms_per_sample_med": [ 3.738125451491214e-05, 4.007351162726991e-05, 4.2600284359650686e-05, 4.0704209823161364e-05, 3.302833283669315e-05 ], "bp_grad_norms_F": [ 0.001973477192223072, 0.002032764023169875, 0.0020790304988622665, 0.0019371822709217668, 0.0014914683997631073 ], "gamma_dfa": NaN, "acc_eval": 0.6005859375, "loss_eval": 1.1545627117156982, "epoch": 49 }, { "hidden_norms": [ 278.16461181640625, 259.95208740234375, 246.212890625, 243.02810668945312, 242.42227172851562 ], "bp_grad_norms_per_sample_med": [ 3.896220732713118e-05, 4.0713552152737975e-05, 4.242185241309926e-05, 4.1096616769209504e-05, 3.4584638342494145e-05 ], "bp_grad_norms_F": [ 0.0020273446571081877, 0.0020888603758066893, 0.0021337512880563736, 0.0019914479926228523, 0.0015125740319490433 ], "gamma_dfa": NaN, "acc_eval": 0.599609375, "loss_eval": 1.1588966846466064, "epoch": 50 }, { "hidden_norms": [ 278.74609375, 259.810302734375, 244.75640869140625, 241.40191650390625, 241.2429962158203 ], "bp_grad_norms_per_sample_med": [ 4.005424489150755e-05, 4.289989738026634e-05, 4.383309351396747e-05, 4.207885649520904e-05, 3.527112494339235e-05 ], "bp_grad_norms_F": [ 0.002059010788798332, 0.002119551645591855, 0.002172222128137946, 0.0020189452916383743, 0.0015335450880229473 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1555505990982056, "epoch": 51 }, { "hidden_norms": [ 277.6565246582031, 262.0436096191406, 246.2357635498047, 241.67991638183594, 240.23500061035156 ], "bp_grad_norms_per_sample_med": [ 4.1031005821423605e-05, 4.313238605391234e-05, 4.465782694751397e-05, 4.2896612285403535e-05, 3.4334370866417885e-05 ], "bp_grad_norms_F": [ 0.002025892725214362, 0.0020990471821278334, 0.0021509609650820494, 0.002011507283896208, 0.0015318752266466618 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1416809558868408, "epoch": 52 }, { "hidden_norms": [ 277.4100646972656, 260.2519836425781, 245.48947143554688, 242.5662384033203, 241.2648162841797 ], "bp_grad_norms_per_sample_med": [ 3.732202821993269e-05, 3.9125570765463635e-05, 4.136607458349317e-05, 3.977569213020615e-05, 3.3676675229799e-05 ], "bp_grad_norms_F": [ 0.002009452786296606, 0.002076543401926756, 0.002131648361682892, 0.00199576816521585, 0.0015338497469201684 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.143639087677002, "epoch": 53 }, { "hidden_norms": [ 277.3269348144531, 259.49072265625, 243.7945098876953, 240.342041015625, 238.76239013671875 ], "bp_grad_norms_per_sample_med": [ 3.978172389906831e-05, 4.20100441260729e-05, 4.455841553863138e-05, 4.2333795136073604e-05, 3.435015969444066e-05 ], "bp_grad_norms_F": [ 0.0020786102395504713, 0.0021364488638937473, 0.0021890606731176376, 0.0020492339972406626, 0.0015625122468918562 ], "gamma_dfa": NaN, "acc_eval": 0.6044921875, "loss_eval": 1.1515132188796997, "epoch": 54 }, { "hidden_norms": [ 276.1414489746094, 257.6651306152344, 242.12867736816406, 238.3046875, 235.9711151123047 ], "bp_grad_norms_per_sample_med": [ 4.158447700319812e-05, 4.40051153418608e-05, 4.566523784887977e-05, 4.3018761061830446e-05, 3.456107515376061e-05 ], "bp_grad_norms_F": [ 0.0021895321551710367, 0.0022726275492459536, 0.00232017133384943, 0.002137792995199561, 0.0015979791060090065 ], "gamma_dfa": NaN, "acc_eval": 0.6025390625, "loss_eval": 1.148828148841858, "epoch": 55 }, { "hidden_norms": [ 276.29547119140625, 257.9006652832031, 242.25363159179688, 237.8865966796875, 235.57620239257812 ], "bp_grad_norms_per_sample_med": [ 3.9041460695443675e-05, 4.0436327253701165e-05, 4.2260016925865784e-05, 4.071593502885662e-05, 3.461613232502714e-05 ], "bp_grad_norms_F": [ 0.0021726686973124743, 0.002256714040413499, 0.0023172625806182623, 0.0021478317212313414, 0.0016112272860482335 ], "gamma_dfa": NaN, "acc_eval": 0.6015625, "loss_eval": 1.165194034576416, "epoch": 56 }, { "hidden_norms": [ 274.73480224609375, 257.3844909667969, 239.9276580810547, 236.4628448486328, 232.49490356445312 ], "bp_grad_norms_per_sample_med": [ 4.182914926786907e-05, 4.482160511543043e-05, 4.732825618702918e-05, 4.5475029764929786e-05, 3.673886021715589e-05 ], "bp_grad_norms_F": [ 0.002222857205197215, 0.0022976247128099203, 0.002366685541346669, 0.002194431144744158, 0.0016426561633124948 ], "gamma_dfa": NaN, "acc_eval": 0.6015625, "loss_eval": 1.150635004043579, "epoch": 57 }, { "hidden_norms": [ 273.9837341308594, 255.2301025390625, 239.6470184326172, 235.07806396484375, 232.15016174316406 ], "bp_grad_norms_per_sample_med": [ 4.28417552029714e-05, 4.5315191528061405e-05, 4.770928717334755e-05, 4.653819996747188e-05, 3.727963485289365e-05 ], "bp_grad_norms_F": [ 0.002205377910286188, 0.00228099524974823, 0.002334901597350836, 0.0021908036433160305, 0.001635397202335298 ], "gamma_dfa": NaN, "acc_eval": 0.6064453125, "loss_eval": 1.150489330291748, "epoch": 58 }, { "hidden_norms": [ 273.4665222167969, 255.21783447265625, 238.12306213378906, 232.99537658691406, 229.35629272460938 ], "bp_grad_norms_per_sample_med": [ 4.174295099801384e-05, 4.412833004607819e-05, 4.589854142977856e-05, 4.366271969047375e-05, 3.4910473914351314e-05 ], "bp_grad_norms_F": [ 0.0022425123024731874, 0.002337042009457946, 0.0024111224338412285, 0.002237174427136779, 0.0016597777139395475 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1445674896240234, "epoch": 59 }, { "hidden_norms": [ 272.8526306152344, 254.31373596191406, 238.0008087158203, 233.6641082763672, 229.88113403320312 ], "bp_grad_norms_per_sample_med": [ 4.274978709872812e-05, 4.589447416947223e-05, 4.8100573621923104e-05, 4.519677167991176e-05, 3.628300692071207e-05 ], "bp_grad_norms_F": [ 0.0022435274440795183, 0.0023362115025520325, 0.0024012199137359858, 0.00223422609269619, 0.0016617706278339028 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.1417796611785889, "epoch": 60 }, { "hidden_norms": [ 272.5745849609375, 253.39877319335938, 236.8953094482422, 231.5461883544922, 227.8491668701172 ], "bp_grad_norms_per_sample_med": [ 4.257826367393136e-05, 4.485245153773576e-05, 4.667421308113262e-05, 4.5228414819575846e-05, 3.560770346666686e-05 ], "bp_grad_norms_F": [ 0.0022986247204244137, 0.002396916039288044, 0.0024696297477930784, 0.0022973858285695314, 0.0016907128738239408 ], "gamma_dfa": NaN, "acc_eval": 0.6044921875, "loss_eval": 1.1428865194320679, "epoch": 61 }, { "hidden_norms": [ 269.6819763183594, 250.9730682373047, 234.21188354492188, 228.83775329589844, 224.82958984375 ], "bp_grad_norms_per_sample_med": [ 4.29281426477246e-05, 4.5681605115532875e-05, 4.7611269110348076e-05, 4.553339022095315e-05, 3.683664544951171e-05 ], "bp_grad_norms_F": [ 0.0023400019854307175, 0.002444769022986293, 0.0025141045916825533, 0.002344615990296006, 0.0017126062884926796 ], "gamma_dfa": NaN, "acc_eval": 0.625, "loss_eval": 1.1239444017410278, "epoch": 62 }, { "hidden_norms": [ 269.7929992675781, 250.5220947265625, 233.3997802734375, 228.2130584716797, 224.5063018798828 ], "bp_grad_norms_per_sample_med": [ 4.4715372496284544e-05, 4.6482971811201423e-05, 4.9765483709052205e-05, 4.759176226798445e-05, 3.8208585465326905e-05 ], "bp_grad_norms_F": [ 0.0023639060091227293, 0.002476333873346448, 0.0025423571933060884, 0.00236364989541471, 0.0017294714925810695 ], "gamma_dfa": NaN, "acc_eval": 0.6162109375, "loss_eval": 1.1502506732940674, "epoch": 63 }, { "hidden_norms": [ 269.24493408203125, 251.6195831298828, 234.21717834472656, 228.9242401123047, 224.33628845214844 ], "bp_grad_norms_per_sample_med": [ 4.4276617700234056e-05, 4.620026084012352e-05, 4.972432361682877e-05, 4.657481986214407e-05, 3.729217132786289e-05 ], "bp_grad_norms_F": [ 0.0023896305356174707, 0.002498477231711149, 0.0025652945041656494, 0.002390124835073948, 0.0017562232678756118 ], "gamma_dfa": NaN, "acc_eval": 0.6171875, "loss_eval": 1.146531581878662, "epoch": 64 }, { "hidden_norms": [ 268.0794982910156, 250.7041778564453, 233.16966247558594, 227.9508056640625, 223.48045349121094 ], "bp_grad_norms_per_sample_med": [ 4.518003697739914e-05, 4.807085497304797e-05, 5.077984678791836e-05, 4.9026388296624646e-05, 3.8487425626954064e-05 ], "bp_grad_norms_F": [ 0.0023859951179474592, 0.002494273241609335, 0.0025624327827244997, 0.0023940331302583218, 0.0017616016557440162 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1454447507858276, "epoch": 65 }, { "hidden_norms": [ 267.8343811035156, 247.6757049560547, 231.40367126464844, 225.93670654296875, 220.4804229736328 ], "bp_grad_norms_per_sample_med": [ 4.405072468216531e-05, 4.688911576522514e-05, 4.961229205946438e-05, 4.743603858514689e-05, 3.724359339685179e-05 ], "bp_grad_norms_F": [ 0.002465154742822051, 0.0025785581674426794, 0.002648484194651246, 0.0024633395951241255, 0.0017954027280211449 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.165484070777893, "epoch": 66 }, { "hidden_norms": [ 267.8901062011719, 248.67857360839844, 231.63746643066406, 225.49383544921875, 220.6399383544922 ], "bp_grad_norms_per_sample_med": [ 4.755932604894042e-05, 4.9960097385337576e-05, 5.191187665332109e-05, 4.949339563609101e-05, 3.946756987716071e-05 ], "bp_grad_norms_F": [ 0.0024303828831762075, 0.0025356977712363005, 0.002610789379104972, 0.00243638688698411, 0.0017875435296446085 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1472151279449463, "epoch": 67 }, { "hidden_norms": [ 267.3486022949219, 247.69305419921875, 229.9873504638672, 223.6610870361328, 218.91578674316406 ], "bp_grad_norms_per_sample_med": [ 4.743155659525655e-05, 5.06583419337403e-05, 5.422766844276339e-05, 5.0596820074133575e-05, 3.959470632253215e-05 ], "bp_grad_norms_F": [ 0.0025001303292810917, 0.0026160534471273422, 0.002682509133592248, 0.002501503797248006, 0.0018251334549859166 ], "gamma_dfa": NaN, "acc_eval": 0.6201171875, "loss_eval": 1.157745599746704, "epoch": 68 }, { "hidden_norms": [ 266.2055969238281, 246.88201904296875, 229.0934295654297, 223.09255981445312, 217.90614318847656 ], "bp_grad_norms_per_sample_med": [ 4.6090037358226255e-05, 4.8821068048710003e-05, 5.145218892721459e-05, 4.892798824585043e-05, 3.874724279739894e-05 ], "bp_grad_norms_F": [ 0.002517222659662366, 0.00262960116378963, 0.002704967511817813, 0.002524228999391198, 0.0018283555982634425 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1513168811798096, "epoch": 69 }, { "hidden_norms": [ 263.8387451171875, 244.32431030273438, 227.78903198242188, 222.13900756835938, 216.27389526367188 ], "bp_grad_norms_per_sample_med": [ 4.680602069129236e-05, 5.040669202571735e-05, 5.318928378983401e-05, 4.9446778575656936e-05, 3.913935870514251e-05 ], "bp_grad_norms_F": [ 0.0025120435748249292, 0.0026304670609533787, 0.0027123456820845604, 0.002537800231948495, 0.001847997889854014 ], "gamma_dfa": NaN, "acc_eval": 0.6240234375, "loss_eval": 1.1497204303741455, "epoch": 70 }, { "hidden_norms": [ 263.52716064453125, 243.21226501464844, 226.427001953125, 220.67845153808594, 214.70176696777344 ], "bp_grad_norms_per_sample_med": [ 4.6976576413726434e-05, 5.0085352995665744e-05, 5.2343326387926936e-05, 4.9784572183853015e-05, 4.0186921978602186e-05 ], "bp_grad_norms_F": [ 0.0026124012656509876, 0.0027241536881774664, 0.002797869499772787, 0.002603790955618024, 0.0018792233895510435 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.153285026550293, "epoch": 71 }, { "hidden_norms": [ 264.0121765136719, 243.2773895263672, 226.7365264892578, 220.29107666015625, 214.1591339111328 ], "bp_grad_norms_per_sample_med": [ 4.6254041080828756e-05, 4.949727008352056e-05, 5.206605055718683e-05, 5.012763722334057e-05, 3.8815273001091555e-05 ], "bp_grad_norms_F": [ 0.0026143237482756376, 0.0027275518514215946, 0.0028062777128070593, 0.002607470378279686, 0.0018867084290832281 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1514866352081299, "epoch": 72 }, { "hidden_norms": [ 263.4013671875, 243.0095672607422, 225.4296112060547, 219.55067443847656, 213.40794372558594 ], "bp_grad_norms_per_sample_med": [ 4.8506815801374614e-05, 5.151949153514579e-05, 5.5085791245801374e-05, 5.175785190658644e-05, 4.0316641388926655e-05 ], "bp_grad_norms_F": [ 0.002606831956654787, 0.002728143008425832, 0.0028109808918088675, 0.0026184367015957832, 0.0018970600795000792 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1346663236618042, "epoch": 73 }, { "hidden_norms": [ 262.27703857421875, 242.7241668701172, 224.5229949951172, 218.4025115966797, 212.19247436523438 ], "bp_grad_norms_per_sample_med": [ 4.704251477960497e-05, 5.0965834816452116e-05, 5.3327348723541945e-05, 5.0449500122340396e-05, 4.0479797462467104e-05 ], "bp_grad_norms_F": [ 0.0026277368888258934, 0.0027542279567569494, 0.00283243996091187, 0.00264621595852077, 0.0019058829639106989 ], "gamma_dfa": NaN, "acc_eval": 0.6240234375, "loss_eval": 1.137591004371643, "epoch": 74 }, { "hidden_norms": [ 262.1747131347656, 241.88607788085938, 224.1046142578125, 217.9982147216797, 211.7519989013672 ], "bp_grad_norms_per_sample_med": [ 4.847371383220889e-05, 5.121564754517749e-05, 5.3943567763781175e-05, 5.087414683657698e-05, 4.037184771732427e-05 ], "bp_grad_norms_F": [ 0.0026811074931174517, 0.002809705911204219, 0.002887698821723461, 0.002692745067179203, 0.0019356919219717383 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1538643836975098, "epoch": 75 }, { "hidden_norms": [ 261.7838439941406, 239.75706481933594, 222.1133575439453, 216.12124633789062, 210.44593811035156 ], "bp_grad_norms_per_sample_med": [ 4.8369467549491674e-05, 5.07068180013448e-05, 5.281560879666358e-05, 5.086012970423326e-05, 4.062180232722312e-05 ], "bp_grad_norms_F": [ 0.0027064597234129906, 0.0028339733835309744, 0.0029109998140484095, 0.002717787167057395, 0.0019469966646283865 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1476709842681885, "epoch": 76 }, { "hidden_norms": [ 260.708251953125, 239.65792846679688, 222.502197265625, 216.31419372558594, 210.15716552734375 ], "bp_grad_norms_per_sample_med": [ 4.919906132272445e-05, 5.164166941540316e-05, 5.366719051380642e-05, 5.108323966851458e-05, 4.000464832643047e-05 ], "bp_grad_norms_F": [ 0.002715736860409379, 0.0028464714996516705, 0.0029330456163734198, 0.0027443754952400923, 0.001961463363841176 ], "gamma_dfa": NaN, "acc_eval": 0.6181640625, "loss_eval": 1.1511735916137695, "epoch": 77 }, { "hidden_norms": [ 260.4088439941406, 239.9808349609375, 222.2389373779297, 215.33692932128906, 208.58534240722656 ], "bp_grad_norms_per_sample_med": [ 4.8405916459159926e-05, 5.163977766642347e-05, 5.34093014721293e-05, 5.167788185644895e-05, 4.020798587589525e-05 ], "bp_grad_norms_F": [ 0.0027501434087753296, 0.0028795108664780855, 0.0029617082327604294, 0.002769613405689597, 0.001984042814001441 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1523363590240479, "epoch": 78 }, { "hidden_norms": [ 259.8567199707031, 238.8525848388672, 221.2687225341797, 213.9132537841797, 207.3290557861328 ], "bp_grad_norms_per_sample_med": [ 4.8219208110822365e-05, 5.1672555855475366e-05, 5.364803655538708e-05, 5.1243885536678135e-05, 4.079756035935134e-05 ], "bp_grad_norms_F": [ 0.0028046013321727514, 0.002939376747235656, 0.0030214993748813868, 0.002813557395711541, 0.0019953204318881035 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1514203548431396, "epoch": 79 }, { "hidden_norms": [ 259.52423095703125, 238.27757263183594, 219.9165802001953, 213.4214324951172, 206.20606994628906 ], "bp_grad_norms_per_sample_med": [ 4.8479021643288434e-05, 5.219021113589406e-05, 5.5094871640903875e-05, 5.1899030950153247e-05, 4.124108454561792e-05 ], "bp_grad_norms_F": [ 0.0028202880639582872, 0.002952422248199582, 0.0030410154722630978, 0.002832787809893489, 0.0020088190212845802 ], "gamma_dfa": NaN, "acc_eval": 0.625, "loss_eval": 1.1545820236206055, "epoch": 80 }, { "hidden_norms": [ 258.1958923339844, 237.08778381347656, 219.2870635986328, 212.87725830078125, 205.84408569335938 ], "bp_grad_norms_per_sample_med": [ 5.005837374483235e-05, 5.344217424863018e-05, 5.582463927567005e-05, 5.345495083020069e-05, 4.113194518140517e-05 ], "bp_grad_norms_F": [ 0.0028330644126981497, 0.002965509658679366, 0.0030466399621218443, 0.00284536718390882, 0.0020232615061104298 ], "gamma_dfa": NaN, "acc_eval": 0.6220703125, "loss_eval": 1.1552448272705078, "epoch": 81 }, { "hidden_norms": [ 258.44268798828125, 236.90562438964844, 218.65948486328125, 212.63186645507812, 204.90692138671875 ], "bp_grad_norms_per_sample_med": [ 4.896440077573061e-05, 5.1820486987708136e-05, 5.4638629080727696e-05, 5.3578904044115916e-05, 4.117973367101513e-05 ], "bp_grad_norms_F": [ 0.002839416265487671, 0.0029778846073895693, 0.003062452422454953, 0.002849552081897855, 0.0020236214622855186 ], "gamma_dfa": NaN, "acc_eval": 0.62109375, "loss_eval": 1.1515182256698608, "epoch": 82 }, { "hidden_norms": [ 258.24615478515625, 236.87181091308594, 219.06484985351562, 213.2528076171875, 205.03671264648438 ], "bp_grad_norms_per_sample_med": [ 4.8622885515214875e-05, 5.181535379961133e-05, 5.509376205736771e-05, 5.2298331866040826e-05, 4.074195385328494e-05 ], "bp_grad_norms_F": [ 0.002838765038177371, 0.00297414674423635, 0.003058358561247587, 0.0028491863049566746, 0.0020313323475420475 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1609394550323486, "epoch": 83 }, { "hidden_norms": [ 257.9989929199219, 236.4859161376953, 218.73072814941406, 212.0786895751953, 204.2919464111328 ], "bp_grad_norms_per_sample_med": [ 5.0208276661578566e-05, 5.2276191127020866e-05, 5.509322727448307e-05, 5.315374437486753e-05, 4.122377504245378e-05 ], "bp_grad_norms_F": [ 0.0028634185437113047, 0.0029970910400152206, 0.0030890253838151693, 0.002881886437535286, 0.0020408176351338625 ], "gamma_dfa": NaN, "acc_eval": 0.6171875, "loss_eval": 1.1592046022415161, "epoch": 84 }, { "hidden_norms": [ 257.24053955078125, 235.7548065185547, 217.84329223632812, 211.033935546875, 203.8216094970703 ], "bp_grad_norms_per_sample_med": [ 5.0660164561122656e-05, 5.414208135334775e-05, 5.5454143875977024e-05, 5.3000938351033255e-05, 4.292939411243424e-05 ], "bp_grad_norms_F": [ 0.0028948886319994926, 0.003031315514817834, 0.0031204961705952883, 0.002907233312726021, 0.0020496752113103867 ], "gamma_dfa": NaN, "acc_eval": 0.619140625, "loss_eval": 1.1583250761032104, "epoch": 85 }, { "hidden_norms": [ 256.78289794921875, 235.2476348876953, 217.21603393554688, 210.80035400390625, 203.15478515625 ], "bp_grad_norms_per_sample_med": [ 4.9510348617332056e-05, 5.1982155127916485e-05, 5.440499808173627e-05, 5.1704166253330186e-05, 4.0308059396920726e-05 ], "bp_grad_norms_F": [ 0.0028964560478925705, 0.0030334230978041887, 0.0031210912857204676, 0.002908239373937249, 0.0020543786231428385 ], "gamma_dfa": NaN, "acc_eval": 0.6181640625, "loss_eval": 1.1597179174423218, "epoch": 86 }, { "hidden_norms": [ 256.531982421875, 235.45941162109375, 217.1429443359375, 210.1690673828125, 202.77899169921875 ], "bp_grad_norms_per_sample_med": [ 4.943124076817185e-05, 5.149367279955186e-05, 5.385246913647279e-05, 5.262702325126156e-05, 4.104706385987811e-05 ], "bp_grad_norms_F": [ 0.0029305708594620228, 0.0030687344260513783, 0.003160761669278145, 0.002940374892205, 0.0020649591460824013 ], "gamma_dfa": NaN, "acc_eval": 0.6220703125, "loss_eval": 1.161116600036621, "epoch": 87 }, { "hidden_norms": [ 256.3059387207031, 235.24874877929688, 217.37142944335938, 210.53717041015625, 203.14259338378906 ], "bp_grad_norms_per_sample_med": [ 4.934536627843045e-05, 5.2089759265072644e-05, 5.424721530289389e-05, 5.292960850056261e-05, 4.041651845909655e-05 ], "bp_grad_norms_F": [ 0.002913407515734434, 0.0030489542987197638, 0.003135726321488619, 0.002922008978202939, 0.002062067622318864 ], "gamma_dfa": NaN, "acc_eval": 0.61328125, "loss_eval": 1.155902624130249, "epoch": 88 }, { "hidden_norms": [ 256.7462463378906, 235.3153839111328, 216.87977600097656, 210.572509765625, 202.77845764160156 ], "bp_grad_norms_per_sample_med": [ 4.990033630747348e-05, 5.337029870133847e-05, 5.522817809833214e-05, 5.3465773817151785e-05, 4.164372876402922e-05 ], "bp_grad_norms_F": [ 0.0029192205984145403, 0.0030557813588529825, 0.003147577866911888, 0.0029307191725820303, 0.0020654413383454084 ], "gamma_dfa": NaN, "acc_eval": 0.6162109375, "loss_eval": 1.1561503410339355, "epoch": 89 }, { "hidden_norms": [ 256.68145751953125, 234.77310180664062, 216.7720947265625, 209.664794921875, 202.22833251953125 ], "bp_grad_norms_per_sample_med": [ 4.9965801736107096e-05, 5.341583164408803e-05, 5.593279274762608e-05, 5.420796514954418e-05, 4.210533734294586e-05 ], "bp_grad_norms_F": [ 0.002943370258435607, 0.00308181531727314, 0.003169203409925103, 0.002951863221824169, 0.0020759364124387503 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1583542823791504, "epoch": 90 }, { "hidden_norms": [ 256.4252014160156, 234.56448364257812, 216.34176635742188, 209.5242156982422, 201.7559356689453 ], "bp_grad_norms_per_sample_med": [ 4.9815931561170146e-05, 5.2233976020943373e-05, 5.5747830629115924e-05, 5.41718618478626e-05, 4.169955354882404e-05 ], "bp_grad_norms_F": [ 0.0029554881621152163, 0.0030950764194130898, 0.0031847492791712284, 0.0029650654178112745, 0.002081435639411211 ], "gamma_dfa": NaN, "acc_eval": 0.619140625, "loss_eval": 1.159005045890808, "epoch": 91 }, { "hidden_norms": [ 256.15167236328125, 234.47537231445312, 216.2799072265625, 209.95578002929688, 201.94126892089844 ], "bp_grad_norms_per_sample_med": [ 5.007637446396984e-05, 5.260824036668055e-05, 5.540058555197902e-05, 5.322153810993768e-05, 4.1122035327134654e-05 ], "bp_grad_norms_F": [ 0.002944375155493617, 0.00308293872512877, 0.003174267942085862, 0.0029555640649050474, 0.0020777545869350433 ], "gamma_dfa": NaN, "acc_eval": 0.6259765625, "loss_eval": 1.1595215797424316, "epoch": 92 }, { "hidden_norms": [ 256.1369934082031, 234.51614379882812, 216.30044555664062, 209.4623565673828, 201.70799255371094 ], "bp_grad_norms_per_sample_med": [ 5.048588718636893e-05, 5.3128016588743776e-05, 5.624579353025183e-05, 5.411298116086982e-05, 4.109516885364428e-05 ], "bp_grad_norms_F": [ 0.0029427227564156055, 0.0030841128900647163, 0.003178349928930402, 0.0029583934228867292, 0.002080487785860896 ], "gamma_dfa": NaN, "acc_eval": 0.62109375, "loss_eval": 1.1565905809402466, "epoch": 93 }, { "hidden_norms": [ 255.9738311767578, 234.28948974609375, 216.3280029296875, 209.589111328125, 201.76205444335938 ], "bp_grad_norms_per_sample_med": [ 5.070818224339746e-05, 5.330924614099786e-05, 5.596653136308305e-05, 5.407314529293217e-05, 4.100686783203855e-05 ], "bp_grad_norms_F": [ 0.0029472638852894306, 0.003088710131123662, 0.0031828396022319794, 0.0029631764627993107, 0.0020829145796597004 ], "gamma_dfa": NaN, "acc_eval": 0.619140625, "loss_eval": 1.1584088802337646, "epoch": 94 }, { "hidden_norms": [ 255.89332580566406, 234.19253540039062, 216.33103942871094, 209.45057678222656, 201.54258728027344 ], "bp_grad_norms_per_sample_med": [ 5.041498661739752e-05, 5.279783727019094e-05, 5.5226330005098134e-05, 5.407658318290487e-05, 4.1154507925966755e-05 ], "bp_grad_norms_F": [ 0.002949801040813327, 0.00309200631454587, 0.0031869453378021717, 0.0029658437706530094, 0.002085147425532341 ], "gamma_dfa": NaN, "acc_eval": 0.6201171875, "loss_eval": 1.158942699432373, "epoch": 95 }, { "hidden_norms": [ 255.63841247558594, 234.11630249023438, 216.2378692626953, 209.49703979492188, 201.46917724609375 ], "bp_grad_norms_per_sample_med": [ 5.020374737796374e-05, 5.243354826234281e-05, 5.587147097685374e-05, 5.334949673851952e-05, 4.121083111385815e-05 ], "bp_grad_norms_F": [ 0.002950438065454364, 0.003093136241659522, 0.0031878354493528605, 0.0029664800968021154, 0.0020843464881181717 ], "gamma_dfa": NaN, "acc_eval": 0.6201171875, "loss_eval": 1.1582318544387817, "epoch": 96 }, { "hidden_norms": [ 255.8027801513672, 234.07070922851562, 216.1463623046875, 209.4476318359375, 201.27279663085938 ], "bp_grad_norms_per_sample_med": [ 5.0307549827266484e-05, 5.278814569464885e-05, 5.604944453807548e-05, 5.306081584421918e-05, 4.1182753193425015e-05 ], "bp_grad_norms_F": [ 0.002952505135908723, 0.003095670836046338, 0.0031897351145744324, 0.00296790711581707, 0.002085329731926322 ], "gamma_dfa": NaN, "acc_eval": 0.619140625, "loss_eval": 1.15840482711792, "epoch": 97 }, { "hidden_norms": [ 255.60986328125, 234.11065673828125, 216.12860107421875, 209.42921447753906, 201.28346252441406 ], "bp_grad_norms_per_sample_med": [ 5.0218295655213296e-05, 5.269264511298388e-05, 5.5988577514654025e-05, 5.322946162777953e-05, 4.136392453801818e-05 ], "bp_grad_norms_F": [ 0.002954497467726469, 0.003097717184573412, 0.0031918887980282307, 0.002969518303871155, 0.00208606431260705 ], "gamma_dfa": NaN, "acc_eval": 0.6181640625, "loss_eval": 1.1585593223571777, "epoch": 98 }, { "hidden_norms": [ 255.57244873046875, 234.11569213867188, 216.13626098632812, 209.40383911132812, 201.28627014160156 ], "bp_grad_norms_per_sample_med": [ 5.005559796700254e-05, 5.2759678510483354e-05, 5.5868193157948554e-05, 5.3356721764430404e-05, 4.125368650420569e-05 ], "bp_grad_norms_F": [ 0.0029547216836363077, 0.00309770368039608, 0.003191797062754631, 0.0029695071280002594, 0.0020862380042672157 ], "gamma_dfa": NaN, "acc_eval": 0.6181640625, "loss_eval": 1.1585021018981934, "epoch": 99 }, { "hidden_norms": [ 255.5677947998047, 234.11875915527344, 216.1315460205078, 209.4070281982422, 201.2687530517578 ], "bp_grad_norms_per_sample_med": [ 5.006368883186951e-05, 5.279530887492001e-05, 5.585233884630725e-05, 5.334027810022235e-05, 4.123226608498953e-05 ], "bp_grad_norms_F": [ 0.002954971743747592, 0.0030978918075561523, 0.003191987983882427, 0.002969692926853895, 0.002086336025968194 ], "gamma_dfa": NaN, "acc_eval": 0.6181640625, "loss_eval": 1.1584858894348145, "epoch": 100 } ], "dfa_log": [ { "hidden_norms": [ 8.690464973449707, 8.719978332519531, 8.73093318939209, 8.75937271118164, 8.790542602539062 ], "bp_grad_norms_per_sample_med": [ 0.0009977436857298017, 0.000992251792922616, 0.0009848480112850666, 0.0009761073160916567, 0.0009735578205436468 ], "bp_grad_norms_F": [ 0.035340383648872375, 0.03499162197113037, 0.03454425558447838, 0.034113530069589615, 0.033874060958623886 ], "gamma_dfa": 0.006830460682976991, "acc_eval": 0.095703125, "loss_eval": 2.486203908920288, "epoch": 0 }, { "hidden_norms": [ 861.2440185546875, 2373.370849609375, 4675.99951171875, 6090.40869140625, 6962.984375 ], "bp_grad_norms_per_sample_med": [ 2.380779051236459e-06, 1.3197138741816161e-06, 1.3154849511920474e-06, 1.3285966815601569e-06, 1.3258621720524388e-06 ], "bp_grad_norms_F": [ 0.0001391920231981203, 6.988063250901178e-05, 6.874280370539054e-05, 6.720778765156865e-05, 6.707101420033723e-05 ], "gamma_dfa": 0.10659917898010463, "acc_eval": 0.3037109375, "loss_eval": 1.9665180444717407, "epoch": 1 }, { "hidden_norms": [ 1679.144775390625, 8850.173828125, 31676.23046875, 40712.2109375, 45375.55859375 ], "bp_grad_norms_per_sample_med": [ 1.1123192962259054e-06, 2.7329409135745664e-07, 2.7436919936008053e-07, 2.75225175982996e-07, 2.744452558545163e-07 ], "bp_grad_norms_F": [ 7.363831537077203e-05, 2.2035641450202093e-05, 1.9731569409486838e-05, 1.9022963897441514e-05, 1.7921549442689866e-05 ], "gamma_dfa": 0.10788296448299661, "acc_eval": 0.29296875, "loss_eval": 1.972828984260559, "epoch": 2 }, { "hidden_norms": [ 2530.16015625, 21436.486328125, 88828.296875, 114079.484375, 124374.78125 ], "bp_grad_norms_per_sample_med": [ 8.110604312605574e-07, 1.1556701196013819e-07, 1.1451407289087001e-07, 1.1523399479074214e-07, 1.1543902900257308e-07 ], "bp_grad_norms_F": [ 0.00011594755778787658, 1.8132053810404614e-05, 1.1369732419552747e-05, 8.215727575588971e-06, 7.219489361887099e-06 ], "gamma_dfa": 0.1084698709892109, "acc_eval": 0.318359375, "loss_eval": 1.9430747032165527, "epoch": 3 }, { "hidden_norms": [ 3363.359375, 41233.19921875, 182355.03125, 240225.46875, 257539.390625 ], "bp_grad_norms_per_sample_med": [ 6.176944111757621e-07, 6.474806468759198e-08, 6.307719502274267e-08, 6.379124783961743e-08, 6.374663996666641e-08 ], "bp_grad_norms_F": [ 3.5978406231151894e-05, 4.323610028222902e-06, 3.5177260997443227e-06, 3.4877305097325006e-06, 3.479522774796351e-06 ], "gamma_dfa": 0.10987455540453084, "acc_eval": 0.3173828125, "loss_eval": 1.959622859954834, "epoch": 4 }, { "hidden_norms": [ 4170.119140625, 70935.8515625, 335571.09375, 441693.5625, 469995.8125 ], "bp_grad_norms_per_sample_med": [ 4.856212285631045e-07, 4.0158354863706336e-08, 3.8916198263905244e-08, 3.9119736783277403e-08, 3.916203894505088e-08 ], "bp_grad_norms_F": [ 2.611691706988495e-05, 2.208936621173052e-06, 1.6750394706832594e-06, 1.6634863868603134e-06, 1.659758027017233e-06 ], "gamma_dfa": 0.1083616423420608, "acc_eval": 0.3017578125, "loss_eval": 1.932759165763855, "epoch": 5 }, { "hidden_norms": [ 5013.92236328125, 106898.6171875, 530492.6875, 719779.5, 763058.3125 ], "bp_grad_norms_per_sample_med": [ 4.242272950705228e-07, 2.814423716301917e-08, 2.683668043346188e-08, 2.6872848835068908e-08, 2.6873932412740942e-08 ], "bp_grad_norms_F": [ 2.2560918296221644e-05, 1.2798993793694535e-06, 1.0339434766137856e-06, 1.0326252777304035e-06, 1.030524344969308e-06 ], "gamma_dfa": 0.11125951120629907, "acc_eval": 0.3095703125, "loss_eval": 1.9531997442245483, "epoch": 6 }, { "hidden_norms": [ 5811.36279296875, 156264.234375, 809496.6875, 1104418.875, 1163013.625 ], "bp_grad_norms_per_sample_med": [ 3.5694648659045924e-07, 2.0201103012595922e-08, 1.89678583950581e-08, 1.8967025283700423e-08, 1.8932304612917505e-08 ], "bp_grad_norms_F": [ 1.9050115952268243e-05, 9.341621307612513e-07, 6.890153372296481e-07, 6.891143584653037e-07, 6.886222649882257e-07 ], "gamma_dfa": 0.11049338441807777, "acc_eval": 0.3076171875, "loss_eval": 1.9362893104553223, "epoch": 7 }, { "hidden_norms": [ 6660.841796875, 217521.65625, 1158874.5, 1615614.625, 1694436.0 ], "bp_grad_norms_per_sample_med": [ 3.212987280676316e-07, 1.5324568281016582e-08, 1.4045938634410504e-08, 1.4053354924215e-08, 1.4027999206689401e-08 ], "bp_grad_norms_F": [ 1.7352898794342764e-05, 6.539408445860317e-07, 5.044145154897706e-07, 5.047700142313261e-07, 5.048477760283276e-07 ], "gamma_dfa": 0.11245601065456867, "acc_eval": 0.2978515625, "loss_eval": 1.9441646337509155, "epoch": 8 }, { "hidden_norms": [ 7480.24169921875, 295557.40625, 1585967.0, 2246827.75, 2356427.0 ], "bp_grad_norms_per_sample_med": [ 2.889860297727864e-07, 1.193609300287335e-08, 1.1067995409064224e-08, 1.103960478587851e-08, 1.1055576010221557e-08 ], "bp_grad_norms_F": [ 1.5521236491622403e-05, 4.5597263920171827e-07, 3.8742672359148855e-07, 3.8764648024880444e-07, 3.877208314406744e-07 ], "gamma_dfa": 0.11317481694277376, "acc_eval": 0.30078125, "loss_eval": 1.9356626272201538, "epoch": 9 }, { "hidden_norms": [ 8273.8408203125, 388312.4375, 2104540.5, 3043837.75, 3180222.75 ], "bp_grad_norms_per_sample_med": [ 2.619119925384439e-07, 9.19370091168048e-09, 8.51864179196582e-09, 8.482276214749618e-09, 8.476813917468462e-09 ], "bp_grad_norms_F": [ 1.4210399967851117e-05, 3.5443522961031704e-07, 3.0404962103602884e-07, 3.0431687036980293e-07, 3.0445681886703824e-07 ], "gamma_dfa": 0.11495429277420044, "acc_eval": 0.30859375, "loss_eval": 1.936495304107666, "epoch": 10 }, { "hidden_norms": [ 9086.7265625, 501434.3125, 2767834.0, 4046107.75, 4214970.5 ], "bp_grad_norms_per_sample_med": [ 2.471596189934644e-07, 7.524303846651037e-09, 7.025830139895106e-09, 7.019247405537499e-09, 7.011437208603866e-09 ], "bp_grad_norms_F": [ 1.3406845027930103e-05, 4.39807990915142e-07, 2.471441860052437e-07, 2.474318421263888e-07, 2.475488827258232e-07 ], "gamma_dfa": 0.11651878873817623, "acc_eval": 0.30859375, "loss_eval": 1.9542189836502075, "epoch": 11 }, { "hidden_norms": [ 9854.2626953125, 612623.625, 3485830.25, 5139234.5, 5346583.0 ], "bp_grad_norms_per_sample_med": [ 2.3279393701614026e-07, 6.378383154981293e-09, 5.839252636974379e-09, 5.8299334249056756e-09, 5.825462778830115e-09 ], "bp_grad_norms_F": [ 1.2396733836794738e-05, 2.516441668376501e-07, 2.0780194631697668e-07, 2.0795941679807584e-07, 2.080748373600727e-07 ], "gamma_dfa": 0.11470737145282328, "acc_eval": 0.3046875, "loss_eval": 1.9374217987060547, "epoch": 12 }, { "hidden_norms": [ 10653.666015625, 745430.125, 4325399.0, 6434218.5, 6688000.5 ], "bp_grad_norms_per_sample_med": [ 2.1187355514484807e-07, 5.294193083926757e-09, 4.98529528769609e-09, 4.991081326011226e-09, 4.989251234377434e-09 ], "bp_grad_norms_F": [ 1.1210328011657111e-05, 2.000140426616781e-07, 1.7647043648594263e-07, 1.7654315342952032e-07, 1.7665543339262513e-07 ], "gamma_dfa": 0.11383607180323452, "acc_eval": 0.291015625, "loss_eval": 1.9233126640319824, "epoch": 13 }, { "hidden_norms": [ 11404.5263671875, 893037.0625, 5298411.0, 7870617.0, 8170729.5 ], "bp_grad_norms_per_sample_med": [ 1.9957101926593168e-07, 4.642851436642559e-09, 4.288450483613815e-09, 4.285100718703916e-09, 4.289933297485504e-09 ], "bp_grad_norms_F": [ 1.0866175216506235e-05, 1.758858729772328e-07, 1.538420519864303e-07, 1.5386244456294662e-07, 1.5397839092656795e-07 ], "gamma_dfa": 0.1139617893495597, "acc_eval": 0.30859375, "loss_eval": 1.932279109954834, "epoch": 14 }, { "hidden_norms": [ 12171.2412109375, 1062066.875, 6388639.0, 9528923.0, 9891447.0 ], "bp_grad_norms_per_sample_med": [ 1.9334000000981177e-07, 4.044033108385747e-09, 3.810601167941741e-09, 3.801854830953744e-09, 3.8046659156520946e-09 ], "bp_grad_norms_F": [ 1.0322088201064616e-05, 1.529211743900305e-07, 1.350435638869385e-07, 1.3504063645086717e-07, 1.3514510044387862e-07 ], "gamma_dfa": 0.11320225725648925, "acc_eval": 0.3193359375, "loss_eval": 1.921454906463623, "epoch": 15 }, { "hidden_norms": [ 12924.974609375, 1273988.625, 7574387.5, 11500420.0, 11920183.0 ], "bp_grad_norms_per_sample_med": [ 1.8497563303299103e-07, 3.6160896499382034e-09, 3.388503477808058e-09, 3.385580482628825e-09, 3.3854716807724117e-09 ], "bp_grad_norms_F": [ 9.76746559899766e-06, 1.3485876593222201e-07, 1.1896084117779537e-07, 1.1894425000491538e-07, 1.1903343022368063e-07 ], "gamma_dfa": 0.11276883230311796, "acc_eval": 0.306640625, "loss_eval": 1.9356281757354736, "epoch": 16 }, { "hidden_norms": [ 13632.109375, 1465148.75, 8873670.0, 13535396.0, 14019399.0 ], "bp_grad_norms_per_sample_med": [ 1.7523743167657813e-07, 3.18161341716916e-09, 3.0166942277531916e-09, 3.0173783471809656e-09, 3.0215525637089513e-09 ], "bp_grad_norms_F": [ 9.427177246834617e-06, 1.1933295240851294e-07, 1.0663712401992598e-07, 1.0661205607220836e-07, 1.0669979388922002e-07 ], "gamma_dfa": 0.11264261469477788, "acc_eval": 0.3203125, "loss_eval": 1.926081657409668, "epoch": 17 }, { "hidden_norms": [ 14394.1845703125, 1699121.5, 10379340.0, 15814831.0, 16377349.0 ], "bp_grad_norms_per_sample_med": [ 1.6784264289526618e-07, 2.8936604223872564e-09, 2.7336535257660444e-09, 2.7314879247342105e-09, 2.733708148738856e-09 ], "bp_grad_norms_F": [ 9.04797616385622e-06, 1.087723191517398e-07, 9.662341682314946e-08, 9.658959498892727e-08, 9.665905764677518e-08 ], "gamma_dfa": 0.11253939801827073, "acc_eval": 0.3154296875, "loss_eval": 1.922888994216919, "epoch": 18 }, { "hidden_norms": [ 15138.509765625, 1969752.0, 12071423.0, 18393228.0, 19044056.0 ], "bp_grad_norms_per_sample_med": [ 1.5837277089758572e-07, 2.609559235366987e-09, 2.4664128517315476e-09, 2.4639881246457662e-09, 2.4657431652030937e-09 ], "bp_grad_norms_F": [ 8.502225682605058e-06, 9.664965716638108e-08, 8.704243725787819e-08, 8.700892806245974e-08, 8.707356613513184e-08 ], "gamma_dfa": 0.11155363742727786, "acc_eval": 0.3125, "loss_eval": 1.9243314266204834, "epoch": 19 }, { "hidden_norms": [ 15811.982421875, 2268261.5, 13867645.0, 21375086.0, 22149420.0 ], "bp_grad_norms_per_sample_med": [ 1.5073908343765652e-07, 2.376487229227564e-09, 2.2317030445861974e-09, 2.2317414583028494e-09, 2.2311954506193388e-09 ], "bp_grad_norms_F": [ 8.195236659958027e-06, 8.728681422098816e-08, 7.846901439734211e-08, 7.84395552955175e-08, 7.849664029890846e-08 ], "gamma_dfa": 0.11315422086045146, "acc_eval": 0.3095703125, "loss_eval": 1.924652338027954, "epoch": 20 }, { "hidden_norms": [ 16487.935546875, 2556303.5, 15702076.0, 24321856.0, 25185988.0 ], "bp_grad_norms_per_sample_med": [ 1.443007136003871e-07, 2.174122659681643e-09, 2.0514809850880056e-09, 2.052057856971601e-09, 2.05182382195801e-09 ], "bp_grad_norms_F": [ 8.002187314559706e-06, 8.025331510452816e-08, 7.266314838716426e-08, 7.2638087544874e-08, 7.268938162496852e-08 ], "gamma_dfa": 0.11267373809823766, "acc_eval": 0.310546875, "loss_eval": 1.9348869323730469, "epoch": 21 }, { "hidden_norms": [ 17153.216796875, 2908610.25, 17831918.0, 27718528.0, 28682196.0 ], "bp_grad_norms_per_sample_med": [ 1.43127067531168e-07, 2.0134633960111614e-09, 1.908325941712974e-09, 1.9070569567958273e-09, 1.9050578892176873e-09 ], "bp_grad_norms_F": [ 7.550354439445073e-06, 7.309487415341209e-08, 6.660556550741603e-08, 6.657593587533484e-08, 6.66217090383725e-08 ], "gamma_dfa": 0.11266892295680009, "acc_eval": 0.310546875, "loss_eval": 1.9210036993026733, "epoch": 22 }, { "hidden_norms": [ 17796.001953125, 3236156.25, 20246900.0, 31494576.0, 32571052.0 ], "bp_grad_norms_per_sample_med": [ 1.3518946673229948e-07, 1.8474217711172969e-09, 1.7507182370479768e-09, 1.7496273319039801e-09, 1.7511733174657707e-09 ], "bp_grad_norms_F": [ 7.284599632839672e-06, 6.709063882226474e-08, 6.151606157800416e-08, 6.149030440383285e-08, 6.153235432293513e-08 ], "gamma_dfa": 0.11186322406865656, "acc_eval": 0.3115234375, "loss_eval": 1.9283114671707153, "epoch": 23 }, { "hidden_norms": [ 18460.63671875, 3604280.25, 22626418.0, 35429216.0, 36622356.0 ], "bp_grad_norms_per_sample_med": [ 1.3137012899733236e-07, 1.7567419741126855e-09, 1.6593408869169934e-09, 1.6595901319860218e-09, 1.6608053821087765e-09 ], "bp_grad_norms_F": [ 7.130098310881294e-06, 6.264485108431472e-08, 5.731577701340029e-08, 5.729528851361465e-08, 5.733248187311801e-08 ], "gamma_dfa": 0.11299802124267444, "acc_eval": 0.2978515625, "loss_eval": 1.942992925643921, "epoch": 24 }, { "hidden_norms": [ 19115.904296875, 4038094.25, 25405536.0, 39835936.0, 41154148.0 ], "bp_grad_norms_per_sample_med": [ 1.2640579427625198e-07, 1.5953075527264104e-09, 1.5003157605164574e-09, 1.4991035079958692e-09, 1.4979777418488993e-09 ], "bp_grad_norms_F": [ 6.799941729696002e-06, 5.7522207441706996e-08, 5.297441418861126e-08, 5.2952817242157835e-08, 5.298943506204523e-08 ], "gamma_dfa": 0.11197824770351872, "acc_eval": 0.298828125, "loss_eval": 1.9319748878479004, "epoch": 25 }, { "hidden_norms": [ 19780.572265625, 4490110.5, 28153634.0, 44291160.0, 45731404.0 ], "bp_grad_norms_per_sample_med": [ 1.2269519800156559e-07, 1.4798114955638653e-09, 1.4102843337582271e-09, 1.4097069067631196e-09, 1.4109671209183716e-09 ], "bp_grad_norms_F": [ 6.577545264008222e-06, 5.327013141709358e-08, 4.94958669605694e-08, 4.9476955865657146e-08, 4.950964083150211e-08 ], "gamma_dfa": 0.11252723945653997, "acc_eval": 0.3115234375, "loss_eval": 1.9247620105743408, "epoch": 26 }, { "hidden_norms": [ 20381.6796875, 4929967.0, 30880866.0, 48905308.0, 50483824.0 ], "bp_grad_norms_per_sample_med": [ 1.1911821928833888e-07, 1.377626124288156e-09, 1.3317531522005766e-09, 1.3313244950907688e-09, 1.3306112878197496e-09 ], "bp_grad_norms_F": [ 6.326347829599399e-06, 4.955709798082353e-08, 4.649340468176888e-08, 4.6477893533847237e-08, 4.650862805988254e-08 ], "gamma_dfa": 0.11152978462632746, "acc_eval": 0.2978515625, "loss_eval": 1.9170689582824707, "epoch": 27 }, { "hidden_norms": [ 21001.544921875, 5444194.5, 33907076.0, 53832084.0, 55554724.0 ], "bp_grad_norms_per_sample_med": [ 1.1559290413742929e-07, 1.3061883796794405e-09, 1.2378150726632953e-09, 1.2379912650573033e-09, 1.2384089309591673e-09 ], "bp_grad_norms_F": [ 6.23212235950632e-06, 4.7021419646853246e-08, 4.3998962695468435e-08, 4.3984215380987735e-08, 4.4011432720481025e-08 ], "gamma_dfa": 0.11285935762862209, "acc_eval": 0.3193359375, "loss_eval": 1.9198743104934692, "epoch": 28 }, { "hidden_norms": [ 21623.64453125, 5895143.0, 37025488.0, 58791348.0, 60687928.0 ], "bp_grad_norms_per_sample_med": [ 1.1377478870144841e-07, 1.2547849426169932e-09, 1.1888731110687445e-09, 1.1877619998656996e-09, 1.1896320595283782e-09 ], "bp_grad_norms_F": [ 6.024939921189798e-06, 4.443810297516393e-08, 4.161294953064498e-08, 4.159920763413538e-08, 4.162497546644772e-08 ], "gamma_dfa": 0.11188641694025137, "acc_eval": 0.3115234375, "loss_eval": 1.917163372039795, "epoch": 29 }, { "hidden_norms": [ 22195.29296875, 6369258.5, 40117404.0, 64235468.0, 66270544.0 ], "bp_grad_norms_per_sample_med": [ 1.1021134582733794e-07, 1.153794726427293e-09, 1.1123471033158694e-09, 1.1119479781385166e-09, 1.1122585075185043e-09 ], "bp_grad_norms_F": [ 5.96408472119947e-06, 4.2022573865097e-08, 3.954471239353552e-08, 3.953241289877951e-08, 3.955623029128219e-08 ], "gamma_dfa": 0.11316103948047385, "acc_eval": 0.3125, "loss_eval": 1.9332935810089111, "epoch": 30 }, { "hidden_norms": [ 22786.513671875, 6899202.5, 43496572.0, 69758712.0, 71960648.0 ], "bp_grad_norms_per_sample_med": [ 1.0609301170916297e-07, 1.1096534802135238e-09, 1.05872854927469e-09, 1.0590027743617725e-09, 1.0579482845329835e-09 ], "bp_grad_norms_F": [ 5.711301128030755e-06, 3.962547268088201e-08, 3.742779952631281e-08, 3.741677900848117e-08, 3.743992138538488e-08 ], "gamma_dfa": 0.11225346029095817, "acc_eval": 0.31640625, "loss_eval": 1.9247596263885498, "epoch": 31 }, { "hidden_norms": [ 23367.078125, 7480530.0, 47061616.0, 75610000.0, 77981320.0 ], "bp_grad_norms_per_sample_med": [ 1.054115728038596e-07, 1.0618838031106748e-09, 1.0191184562913236e-09, 1.01949926278877e-09, 1.0192180432966325e-09 ], "bp_grad_norms_F": [ 5.768360097135883e-06, 3.826109207238915e-08, 3.593911657162607e-08, 3.592855790657268e-08, 3.594948694285449e-08 ], "gamma_dfa": 0.11492819089471595, "acc_eval": 0.314453125, "loss_eval": 1.939026117324829, "epoch": 32 }, { "hidden_norms": [ 23912.85546875, 8053234.0, 51027352.0, 81931568.0, 84515616.0 ], "bp_grad_norms_per_sample_med": [ 1.0266481353937706e-07, 9.919576271499864e-10, 9.572211912001194e-10, 9.572932446744176e-10, 9.577664217275128e-10 ], "bp_grad_norms_F": [ 5.472421435115393e-06, 3.587240016145188e-08, 3.39712649122248e-08, 3.396091940999213e-08, 3.398050552050336e-08 ], "gamma_dfa": 0.11253271601162851, "acc_eval": 0.3125, "loss_eval": 1.9187253713607788, "epoch": 33 }, { "hidden_norms": [ 24486.8359375, 8682399.0, 55030492.0, 88236184.0, 91025880.0 ], "bp_grad_norms_per_sample_med": [ 1.0101911129822838e-07, 9.702203485062455e-10, 9.30652499508966e-10, 9.30728105696943e-10, 9.303261494508774e-10 ], "bp_grad_norms_F": [ 5.286908617563313e-06, 3.4072087373715476e-08, 3.2386065385026086e-08, 3.2376764380614986e-08, 3.2396076932172946e-08 ], "gamma_dfa": 0.11125053715659305, "acc_eval": 0.3125, "loss_eval": 1.9214520454406738, "epoch": 34 }, { "hidden_norms": [ 25051.91796875, 9255517.0, 58776788.0, 94748472.0, 97725744.0 ], "bp_grad_norms_per_sample_med": [ 9.793318156425812e-08, 9.150468716079274e-10, 8.747003676923271e-10, 8.746902091516517e-10, 8.743750723461119e-10 ], "bp_grad_norms_F": [ 5.294927632348845e-06, 3.279593840943562e-08, 3.115108881956985e-08, 3.114205782139834e-08, 3.115993862934374e-08 ], "gamma_dfa": 0.11356210591475246, "acc_eval": 0.314453125, "loss_eval": 1.9334189891815186, "epoch": 35 }, { "hidden_norms": [ 25539.400390625, 9852175.0, 62733436.0, 101270040.0, 104412528.0 ], "bp_grad_norms_per_sample_med": [ 9.590952032567657e-08, 8.831190223546059e-10, 8.506708115696426e-10, 8.503630022360653e-10, 8.506205184666271e-10 ], "bp_grad_norms_F": [ 5.156022325536469e-06, 3.1347209272780674e-08, 2.992178593785866e-08, 2.9913682197957314e-08, 2.9930919964726854e-08 ], "gamma_dfa": 0.11300312746607233, "acc_eval": 0.3291015625, "loss_eval": 1.9240946769714355, "epoch": 36 }, { "hidden_norms": [ 26058.23046875, 10503947.0, 66954420.0, 108182184.0, 111535672.0 ], "bp_grad_norms_per_sample_med": [ 9.312070403666439e-08, 8.298656206662258e-10, 8.076765367626138e-10, 8.076487811869981e-10, 8.083505531608637e-10 ], "bp_grad_norms_F": [ 5.084062195237493e-06, 3.008365112577849e-08, 2.8773875726528786e-08, 2.8766294235538226e-08, 2.878227967073599e-08 ], "gamma_dfa": 0.11286510003083094, "acc_eval": 0.322265625, "loss_eval": 1.9284429550170898, "epoch": 37 }, { "hidden_norms": [ 26547.951171875, 11128081.0, 71119440.0, 115305784.0, 118851064.0 ], "bp_grad_norms_per_sample_med": [ 9.278523549482998e-08, 8.024952369289906e-10, 7.701798643289237e-10, 7.699446635811569e-10, 7.706733029522184e-10 ], "bp_grad_norms_F": [ 4.915013960271608e-06, 2.8781727223758935e-08, 2.7522533585511155e-08, 2.751522920618754e-08, 2.7530596469205193e-08 ], "gamma_dfa": 0.11193350053144968, "acc_eval": 0.3046875, "loss_eval": 1.9189305305480957, "epoch": 38 }, { "hidden_norms": [ 27052.158203125, 11815623.0, 75267568.0, 122747224.0, 126538816.0 ], "bp_grad_norms_per_sample_med": [ 9.042137349979384e-08, 7.699976212194315e-10, 7.406790181185841e-10, 7.406811275423308e-10, 7.407266466863405e-10 ], "bp_grad_norms_F": [ 4.783120857609902e-06, 2.7648876965713498e-08, 2.6492134708178128e-08, 2.6485189152936073e-08, 2.6500073246893407e-08 ], "gamma_dfa": 0.1119252087228233, "acc_eval": 0.3076171875, "loss_eval": 1.9200191497802734, "epoch": 39 }, { "hidden_norms": [ 27573.439453125, 12446571.0, 79631776.0, 129906592.0, 133912576.0 ], "bp_grad_norms_per_sample_med": [ 8.999781897500725e-08, 7.431448234562765e-10, 7.212022645752825e-10, 7.211930497241781e-10, 7.215293917894883e-10 ], "bp_grad_norms_F": [ 4.7411135710717645e-06, 2.6746526771148638e-08, 2.567137080689008e-08, 2.566465262532347e-08, 2.5678824400188205e-08 ], "gamma_dfa": 0.1126710368462227, "acc_eval": 0.3291015625, "loss_eval": 1.9156131744384766, "epoch": 40 }, { "hidden_norms": [ 28020.1953125, 13139046.0, 84357848.0, 137652880.0, 141892912.0 ], "bp_grad_norms_per_sample_med": [ 8.93968845616655e-08, 7.234106647047156e-10, 7.015109604324721e-10, 7.013014613477253e-10, 7.019884118442121e-10 ], "bp_grad_norms_F": [ 4.706852905655978e-06, 2.5948086346261334e-08, 2.480862271170281e-08, 2.4802661258149783e-08, 2.4816182886411298e-08 ], "gamma_dfa": 0.11299434299689892, "acc_eval": 0.3134765625, "loss_eval": 1.917637825012207, "epoch": 41 }, { "hidden_norms": [ 28489.8828125, 13728548.0, 88388480.0, 144432224.0, 148906448.0 ], "bp_grad_norms_per_sample_med": [ 8.832166287220389e-08, 7.007013858029154e-10, 6.849794620400473e-10, 6.849559253119253e-10, 6.857461820608535e-10 ], "bp_grad_norms_F": [ 4.678155619330937e-06, 2.5201579489930737e-08, 2.418770428391781e-08, 2.4181909807907687e-08, 2.419472266979028e-08 ], "gamma_dfa": 0.11410953500489995, "acc_eval": 0.314453125, "loss_eval": 1.9333336353302002, "epoch": 42 }, { "hidden_norms": [ 28918.5546875, 14414132.0, 92681240.0, 151898304.0, 156571040.0 ], "bp_grad_norms_per_sample_med": [ 8.454645694655483e-08, 6.792187368098723e-10, 6.553820264265653e-10, 6.554308207284976e-10, 6.556304388283252e-10 ], "bp_grad_norms_F": [ 4.511462066147942e-06, 2.4275013998931172e-08, 2.338800797474505e-08, 2.338238225263467e-08, 2.3394919779207157e-08 ], "gamma_dfa": 0.11213390928969602, "acc_eval": 0.3037109375, "loss_eval": 1.9155462980270386, "epoch": 43 }, { "hidden_norms": [ 29332.80078125, 15055747.0, 96975336.0, 159279984.0, 164189344.0 ], "bp_grad_norms_per_sample_med": [ 8.274933804841567e-08, 6.447524736330479e-10, 6.278008113369538e-10, 6.277455777414787e-10, 6.275664987676066e-10 ], "bp_grad_norms_F": [ 4.426053692441201e-06, 2.3487833900048827e-08, 2.272233956546188e-08, 2.2717028258512073e-08, 2.272915367029782e-08 ], "gamma_dfa": 0.11223121372131573, "acc_eval": 0.3173828125, "loss_eval": 1.9162096977233887, "epoch": 44 }, { "hidden_norms": [ 29736.349609375, 15823423.0, 101458080.0, 166481584.0, 171638352.0 ], "bp_grad_norms_per_sample_med": [ 8.434898290943238e-08, 6.55440757224568e-10, 6.384029416217629e-10, 6.384751061183636e-10, 6.382625539202991e-10 ], "bp_grad_norms_F": [ 4.4675143726635724e-06, 2.308258295613541e-08, 2.2235047580920764e-08, 2.2229942331364327e-08, 2.2241332331418562e-08 ], "gamma_dfa": 0.11349940555010107, "acc_eval": 0.3134765625, "loss_eval": 1.935542106628418, "epoch": 45 }, { "hidden_norms": [ 30168.33984375, 16512403.0, 106240736.0, 174293312.0, 179686352.0 ], "bp_grad_norms_per_sample_med": [ 8.255891259523196e-08, 6.180955192114368e-10, 6.070984825967685e-10, 6.070359770404821e-10, 6.068190394614703e-10 ], "bp_grad_norms_F": [ 4.380563041195273e-06, 2.227099038520919e-08, 2.156298606337259e-08, 2.1558207663474604e-08, 2.1569489305761635e-08 ], "gamma_dfa": 0.11322060551538016, "acc_eval": 0.3212890625, "loss_eval": 1.9260894060134888, "epoch": 46 }, { "hidden_norms": [ 30560.10546875, 17240642.0, 111300408.0, 182109792.0, 187762288.0 ], "bp_grad_norms_per_sample_med": [ 8.14508851476603e-08, 6.030238530740917e-10, 5.890909982042558e-10, 5.890405385677866e-10, 5.88881721164114e-10 ], "bp_grad_norms_F": [ 4.2523201955191325e-06, 2.1578937747790405e-08, 2.0878760054188206e-08, 2.0874194817110947e-08, 2.08853556671329e-08 ], "gamma_dfa": 0.11227845895700739, "acc_eval": 0.3193359375, "loss_eval": 1.9136857986450195, "epoch": 47 }, { "hidden_norms": [ 30927.453125, 17981622.0, 115698520.0, 189446720.0, 195329056.0 ], "bp_grad_norms_per_sample_med": [ 7.999796736157805e-08, 5.827110460820961e-10, 5.688347570753649e-10, 5.688115534141502e-10, 5.69402469619007e-10 ], "bp_grad_norms_F": [ 4.254153282090556e-06, 2.1111715042820833e-08, 2.044158087244341e-08, 2.043698899001356e-08, 2.0447874504725405e-08 ], "gamma_dfa": 0.11285097184736514, "acc_eval": 0.3251953125, "loss_eval": 1.9130818843841553, "epoch": 48 }, { "hidden_norms": [ 31297.09765625, 18680606.0, 120312440.0, 197032272.0, 203114064.0 ], "bp_grad_norms_per_sample_med": [ 7.911415877970285e-08, 5.74776504169705e-10, 5.532440061628563e-10, 5.531197722064007e-10, 5.533422053893844e-10 ], "bp_grad_norms_F": [ 4.17833052779315e-06, 2.0621358842731752e-08, 1.9960678443453617e-08, 1.9956562624656726e-08, 1.9966993392017685e-08 ], "gamma_dfa": 0.11243592749451636, "acc_eval": 0.3125, "loss_eval": 1.9191365242004395, "epoch": 49 }, { "hidden_norms": [ 31637.244140625, 19360764.0, 124754384.0, 204064768.0, 210382992.0 ], "bp_grad_norms_per_sample_med": [ 8.003268447964729e-08, 5.749308251701279e-10, 5.599746222273438e-10, 5.599968821989876e-10, 5.599694041791281e-10 ], "bp_grad_norms_F": [ 4.128593900531996e-06, 2.0178502424528233e-08, 1.9575201903876405e-08, 1.9571228193626666e-08, 1.9581117172151608e-08 ], "gamma_dfa": 0.11233749791426817, "acc_eval": 0.330078125, "loss_eval": 1.9152377843856812, "epoch": 50 }, { "hidden_norms": [ 31964.60546875, 20067444.0, 128969536.0, 211772368.0, 218247696.0 ], "bp_grad_norms_per_sample_med": [ 7.774531951554309e-08, 5.427598370744136e-10, 5.298457228519737e-10, 5.297982053065198e-10, 5.30141264221129e-10 ], "bp_grad_norms_F": [ 4.058078957314137e-06, 1.9621586133666824e-08, 1.90722975190738e-08, 1.9068517431719556e-08, 1.907839575210346e-08 ], "gamma_dfa": 0.11183859535958618, "acc_eval": 0.328125, "loss_eval": 1.9089019298553467, "epoch": 51 }, { "hidden_norms": [ 32292.658203125, 20829408.0, 133566216.0, 219264704.0, 225938912.0 ], "bp_grad_norms_per_sample_med": [ 7.692310788343093e-08, 5.312774109533791e-10, 5.173871886476888e-10, 5.171740258269608e-10, 5.173406147918058e-10 ], "bp_grad_norms_F": [ 4.047169568366371e-06, 1.926170511978853e-08, 1.867934962263007e-08, 1.8675748947316606e-08, 1.868521692927061e-08 ], "gamma_dfa": 0.11216733865148854, "acc_eval": 0.330078125, "loss_eval": 1.917893886566162, "epoch": 52 }, { "hidden_norms": [ 32582.02734375, 21555154.0, 138235216.0, 226622112.0, 233550816.0 ], "bp_grad_norms_per_sample_med": [ 7.588336359276582e-08, 5.294207294781472e-10, 5.160025184913763e-10, 5.156744475875996e-10, 5.168100947194887e-10 ], "bp_grad_norms_F": [ 3.991732683061855e-06, 1.8877956975416055e-08, 1.8321758332717764e-08, 1.831830331866513e-08, 1.832757234865312e-08 ], "gamma_dfa": 0.11230919507215731, "acc_eval": 0.314453125, "loss_eval": 1.913461685180664, "epoch": 53 }, { "hidden_norms": [ 32871.28125, 22246662.0, 142493184.0, 233885040.0, 241005264.0 ], "bp_grad_norms_per_sample_med": [ 7.552973357860537e-08, 5.124695112712629e-10, 4.966513311721599e-10, 4.966223543512172e-10, 4.969377687125132e-10 ], "bp_grad_norms_F": [ 4.012842964584706e-06, 1.8570215587487837e-08, 1.8001765411668202e-08, 1.799840099181438e-08, 1.800739823920594e-08 ], "gamma_dfa": 0.11296637258055853, "acc_eval": 0.33203125, "loss_eval": 1.9206554889678955, "epoch": 54 }, { "hidden_norms": [ 33169.98828125, 22902584.0, 146822496.0, 241191920.0, 248487904.0 ], "bp_grad_norms_per_sample_med": [ 7.486269026912851e-08, 4.992010138593628e-10, 4.874242676145002e-10, 4.874663450671335e-10, 4.884102011715186e-10 ], "bp_grad_norms_F": [ 3.938752797694178e-06, 1.8166964821375586e-08, 1.767327617585579e-08, 1.7670013008341812e-08, 1.7678777552987412e-08 ], "gamma_dfa": 0.11258088904469332, "acc_eval": 0.3134765625, "loss_eval": 1.913904070854187, "epoch": 55 }, { "hidden_norms": [ 33456.9140625, 23628216.0, 151346624.0, 248325424.0, 255824304.0 ], "bp_grad_norms_per_sample_med": [ 7.482947239623172e-08, 5.02439700955648e-10, 4.890933769097217e-10, 4.891700933207233e-10, 4.892242166931737e-10 ], "bp_grad_norms_F": [ 3.895439022016944e-06, 1.781435265968412e-08, 1.7326955870089478e-08, 1.7324007117736073e-08, 1.7332443036366385e-08 ], "gamma_dfa": 0.11223017568408977, "acc_eval": 0.314453125, "loss_eval": 1.9154590368270874, "epoch": 56 }, { "hidden_norms": [ 33716.85546875, 24280678.0, 155270816.0, 255050304.0, 262737184.0 ], "bp_grad_norms_per_sample_med": [ 7.482827157900829e-08, 4.958616850458952e-10, 4.826584132366918e-10, 4.826221089437865e-10, 4.828137889489881e-10 ], "bp_grad_norms_F": [ 3.898983777617104e-06, 1.7600514823357116e-08, 1.7106302152569697e-08, 1.7103344518432095e-08, 1.7111482009113388e-08 ], "gamma_dfa": 0.11287979638109391, "acc_eval": 0.30859375, "loss_eval": 1.9285999536514282, "epoch": 57 }, { "hidden_norms": [ 33981.390625, 24925848.0, 159148752.0, 261662432.0, 269540768.0 ], "bp_grad_norms_per_sample_med": [ 7.396101153744894e-08, 4.846232304345222e-10, 4.728849534174628e-10, 4.72891226177552e-10, 4.725210223099907e-10 ], "bp_grad_norms_F": [ 3.847520019917283e-06, 1.7274359720431676e-08, 1.6806101399424733e-08, 1.6803195279635474e-08, 1.681126526875687e-08 ], "gamma_dfa": 0.11251267153238587, "acc_eval": 0.330078125, "loss_eval": 1.913767695426941, "epoch": 58 }, { "hidden_norms": [ 34242.87890625, 25494510.0, 162965072.0, 268190960.0, 276245600.0 ], "bp_grad_norms_per_sample_med": [ 7.276207725226413e-08, 4.64974586611433e-10, 4.573621481540613e-10, 4.5720988106623395e-10, 4.578690204759539e-10 ], "bp_grad_norms_F": [ 3.846054823952727e-06, 1.7068730429059542e-08, 1.6637597965996065e-08, 1.663470783341836e-08, 1.6642776046182917e-08 ], "gamma_dfa": 0.11268835317605408, "acc_eval": 0.318359375, "loss_eval": 1.9175846576690674, "epoch": 59 }, { "hidden_norms": [ 34498.37890625, 26013872.0, 166717360.0, 274736192.0, 282985952.0 ], "bp_grad_norms_per_sample_med": [ 7.275441760157264e-08, 4.638447681504232e-10, 4.554343846496778e-10, 4.5541673210358624e-10, 4.558452226799403e-10 ], "bp_grad_norms_F": [ 3.7814804727531737e-06, 1.6729790885960938e-08, 1.629800472358056e-08, 1.629528156854576e-08, 1.630315793477166e-08 ], "gamma_dfa": 0.11192971542368468, "acc_eval": 0.3125, "loss_eval": 1.9148613214492798, "epoch": 60 }, { "hidden_norms": [ 34741.75390625, 26574266.0, 170266464.0, 280835296.0, 289264896.0 ], "bp_grad_norms_per_sample_med": [ 7.206668328763044e-08, 4.543688481017938e-10, 4.4642781138470866e-10, 4.464762171085823e-10, 4.4638817642272954e-10 ], "bp_grad_norms_F": [ 3.800365902861813e-06, 1.6550599113429598e-08, 1.6135599523181554e-08, 1.6132924329781417e-08, 1.6140655034746487e-08 ], "gamma_dfa": 0.11263992198291817, "acc_eval": 0.328125, "loss_eval": 1.9202332496643066, "epoch": 61 }, { "hidden_norms": [ 34981.7578125, 27132752.0, 173824032.0, 286969856.0, 295549056.0 ], "bp_grad_norms_per_sample_med": [ 7.146741154429037e-08, 4.5107212409689623e-10, 4.4140177624107935e-10, 4.4141457156143815e-10, 4.4168110835407504e-10 ], "bp_grad_norms_F": [ 3.7655997857655166e-06, 1.6349241960256222e-08, 1.5922701379622595e-08, 1.5920058160645567e-08, 1.592757570278991e-08 ], "gamma_dfa": 0.11310465578208095, "acc_eval": 0.314453125, "loss_eval": 1.9224812984466553, "epoch": 62 }, { "hidden_norms": [ 35201.25, 27683016.0, 177040880.0, 292723872.0, 301473504.0 ], "bp_grad_norms_per_sample_med": [ 7.122528700165276e-08, 4.486005733550513e-10, 4.4048292791032395e-10, 4.4043477198663084e-10, 4.4109013663806707e-10 ], "bp_grad_norms_F": [ 3.748537892533932e-06, 1.6115603074240425e-08, 1.5725172275438126e-08, 1.572264451965566e-08, 1.5729948898979274e-08 ], "gamma_dfa": 0.11326105792613816, "acc_eval": 0.3095703125, "loss_eval": 1.9233062267303467, "epoch": 63 }, { "hidden_norms": [ 35399.75390625, 28156860.0, 180111792.0, 298457728.0, 307298976.0 ], "bp_grad_norms_per_sample_med": [ 7.082014974457707e-08, 4.4495629403229486e-10, 4.324987312731565e-10, 4.3260212079232474e-10, 4.3259393289751813e-10 ], "bp_grad_norms_F": [ 3.685790488816565e-06, 1.5895359695150546e-08, 1.5473323955461638e-08, 1.547100403342938e-08, 1.5478214265840506e-08 ], "gamma_dfa": 0.11222807004196511, "acc_eval": 0.3125, "loss_eval": 1.9198863506317139, "epoch": 64 }, { "hidden_norms": [ 35584.6640625, 28666806.0, 183522992.0, 303940064.0, 312955008.0 ], "bp_grad_norms_per_sample_med": [ 7.149574088316513e-08, 4.4883607941414994e-10, 4.353337967888393e-10, 4.3539158389727106e-10, 4.35594643688475e-10 ], "bp_grad_norms_F": [ 3.6930814530933276e-06, 1.5769751726679715e-08, 1.5353194271483517e-08, 1.535078197889561e-08, 1.5357914051605803e-08 ], "gamma_dfa": 0.11321029500413715, "acc_eval": 0.3095703125, "loss_eval": 1.9162211418151855, "epoch": 65 }, { "hidden_norms": [ 35768.86328125, 29145662.0, 186551392.0, 308909184.0, 318089856.0 ], "bp_grad_norms_per_sample_med": [ 6.985555245364594e-08, 4.355726057614362e-10, 4.2523776166980554e-10, 4.251851093428627e-10, 4.2568140679044575e-10 ], "bp_grad_norms_F": [ 3.7230390717013506e-06, 1.5615523096812467e-08, 1.523139303571952e-08, 1.522908021911462e-08, 1.5236116368555486e-08 ], "gamma_dfa": 0.11393742701784504, "acc_eval": 0.31640625, "loss_eval": 1.9276196956634521, "epoch": 66 }, { "hidden_norms": [ 35944.30859375, 29545796.0, 189503824.0, 313822880.0, 323180096.0 ], "bp_grad_norms_per_sample_med": [ 7.027381343505112e-08, 4.2508935260698877e-10, 4.156285593470699e-10, 4.156731903126598e-10, 4.1562600583411324e-10 ], "bp_grad_norms_F": [ 3.67820075553027e-06, 1.5450812185235918e-08, 1.5081118576176777e-08, 1.5078812864999236e-08, 1.5085870330722173e-08 ], "gamma_dfa": 0.11295431066082529, "acc_eval": 0.3251953125, "loss_eval": 1.9145984649658203, "epoch": 67 }, { "hidden_norms": [ 36107.91015625, 29963964.0, 192509232.0, 318614048.0, 328116416.0 ], "bp_grad_norms_per_sample_med": [ 6.995779955332182e-08, 4.257695862541766e-10, 4.1527120631101866e-10, 4.1522696392348735e-10, 4.1541275974665837e-10 ], "bp_grad_norms_F": [ 3.6363949220685754e-06, 1.5271682585193957e-08, 1.4899570466297973e-08, 1.4897324263074552e-08, 1.4904214751254585e-08 ], "gamma_dfa": 0.11261070579712396, "acc_eval": 0.322265625, "loss_eval": 1.9148796796798706, "epoch": 68 }, { "hidden_norms": [ 36263.38671875, 30397186.0, 195132224.0, 323205344.0, 332809856.0 ], "bp_grad_norms_per_sample_med": [ 6.94296602432587e-08, 4.221426264106043e-10, 4.1666703420872864e-10, 4.166992584320184e-10, 4.166444134146019e-10 ], "bp_grad_norms_F": [ 3.677051836348255e-06, 1.5217779036902357e-08, 1.486149248108859e-08, 1.4859250718757266e-08, 1.4866162523219373e-08 ], "gamma_dfa": 0.11349719034842565, "acc_eval": 0.3134765625, "loss_eval": 1.9238262176513672, "epoch": 69 }, { "hidden_norms": [ 36417.9921875, 30770712.0, 197719328.0, 327539232.0, 337245152.0 ], "bp_grad_norms_per_sample_med": [ 6.906716976118332e-08, 4.1953429619212557e-10, 4.080901727654407e-10, 4.080701054842706e-10, 4.0843109450072745e-10 ], "bp_grad_norms_F": [ 3.6080327845411375e-06, 1.500828084033401e-08, 1.4656276192681617e-08, 1.465407439837918e-08, 1.466091692492455e-08 ], "gamma_dfa": 0.11264980123269197, "acc_eval": 0.3115234375, "loss_eval": 1.9172749519348145, "epoch": 70 }, { "hidden_norms": [ 36554.734375, 31127202.0, 200166992.0, 331766240.0, 341638624.0 ], "bp_grad_norms_per_sample_med": [ 6.895474768953136e-08, 4.153002663986882e-10, 4.053070101761591e-10, 4.0528172484677327e-10, 4.0563402636806245e-10 ], "bp_grad_norms_F": [ 3.5790299079963006e-06, 1.4871366360580396e-08, 1.4521869928785236e-08, 1.4519704549798007e-08, 1.4526481351140319e-08 ], "gamma_dfa": 0.1125820265888251, "acc_eval": 0.3291015625, "loss_eval": 1.90960693359375, "epoch": 71 }, { "hidden_norms": [ 36685.06640625, 31478428.0, 202703456.0, 335890528.0, 345860736.0 ], "bp_grad_norms_per_sample_med": [ 6.840604527269534e-08, 4.11831152513642e-10, 4.0155134772845713e-10, 4.014005239305618e-10, 4.018080868029017e-10 ], "bp_grad_norms_F": [ 3.5732464311877266e-06, 1.4777253198872131e-08, 1.4430981742918902e-08, 1.4428859884674239e-08, 1.443555053270984e-08 ], "gamma_dfa": 0.11229235199152754, "acc_eval": 0.3095703125, "loss_eval": 1.912062644958496, "epoch": 72 }, { "hidden_norms": [ 36808.640625, 31756406.0, 205006400.0, 339625888.0, 349722048.0 ], "bp_grad_norms_per_sample_med": [ 6.845510824859957e-08, 4.056126268192628e-10, 3.9775802096464474e-10, 3.9773195847914167e-10, 3.978435358931165e-10 ], "bp_grad_norms_F": [ 3.601402113417862e-06, 1.4699119255112691e-08, 1.434870711136682e-08, 1.4346603904868971e-08, 1.4353199517813664e-08 ], "gamma_dfa": 0.11323098125649267, "acc_eval": 0.3271484375, "loss_eval": 1.9194645881652832, "epoch": 73 }, { "hidden_norms": [ 36922.67578125, 32105574.0, 207090144.0, 343260640.0, 353436544.0 ], "bp_grad_norms_per_sample_med": [ 6.8447327805643e-08, 4.050982882475296e-10, 3.977037865698918e-10, 3.9765896131527256e-10, 3.979234441953139e-10 ], "bp_grad_norms_F": [ 3.603466893764562e-06, 1.4652233204515142e-08, 1.4306199780378392e-08, 1.4304094797523703e-08, 1.4310627349800598e-08 ], "gamma_dfa": 0.11329636031587142, "acc_eval": 0.3056640625, "loss_eval": 1.922640323638916, "epoch": 74 }, { "hidden_norms": [ 37024.05859375, 32409028.0, 208845456.0, 346325312.0, 356587104.0 ], "bp_grad_norms_per_sample_med": [ 6.819700359983472e-08, 4.0326031403026263e-10, 3.9583156197231517e-10, 3.9586384170675615e-10, 3.9581374289276994e-10 ], "bp_grad_norms_F": [ 3.5432237837085268e-06, 1.4486117194678627e-08, 1.4156262828635136e-08, 1.4154186267489877e-08, 1.4160684180808403e-08 ], "gamma_dfa": 0.11267639175457589, "acc_eval": 0.31640625, "loss_eval": 1.9154051542282104, "epoch": 75 }, { "hidden_norms": [ 37125.02734375, 32663892.0, 210781344.0, 349533728.0, 359873568.0 ], "bp_grad_norms_per_sample_med": [ 6.772787486397647e-08, 3.9591485645473767e-10, 3.875866017022389e-10, 3.8754283115949306e-10, 3.8766378995802597e-10 ], "bp_grad_norms_F": [ 3.5503553590388037e-06, 1.4420066918319208e-08, 1.40893732236691e-08, 1.4087291333453322e-08, 1.4093810563053921e-08 ], "gamma_dfa": 0.11297615164312447, "acc_eval": 0.32421875, "loss_eval": 1.913941502571106, "epoch": 76 }, { "hidden_norms": [ 37216.296875, 32930840.0, 212456432.0, 352475008.0, 362884992.0 ], "bp_grad_norms_per_sample_med": [ 6.74248425980295e-08, 3.9426073517034865e-10, 3.872507869928654e-10, 3.8720734951702696e-10, 3.8765768373139053e-10 ], "bp_grad_norms_F": [ 3.55011752617429e-06, 1.4357588895563822e-08, 1.402936344874206e-08, 1.402732330291201e-08, 1.4033815887160017e-08 ], "gamma_dfa": 0.11311322844358074, "acc_eval": 0.3203125, "loss_eval": 1.914380431175232, "epoch": 77 }, { "hidden_norms": [ 37298.37890625, 33147848.0, 214118832.0, 355022880.0, 365529568.0 ], "bp_grad_norms_per_sample_med": [ 6.774458682912154e-08, 3.987353780487979e-10, 3.904769285689724e-10, 3.904657153164237e-10, 3.907260348601227e-10 ], "bp_grad_norms_F": [ 3.509487669361988e-06, 1.4249152968659473e-08, 1.3931584774695693e-08, 1.3929625453101835e-08, 1.3936028331329453e-08 ], "gamma_dfa": 0.11238172389857937, "acc_eval": 0.314453125, "loss_eval": 1.9106721878051758, "epoch": 78 }, { "hidden_norms": [ 37372.10546875, 33388374.0, 215761392.0, 357596800.0, 368190304.0 ], "bp_grad_norms_per_sample_med": [ 6.751073300392818e-08, 3.9374201121766816e-10, 3.8655822987010424e-10, 3.866116038420131e-10, 3.8653891198947576e-10 ], "bp_grad_norms_F": [ 3.537302973199985e-06, 1.4222394817409167e-08, 1.3910858243093571e-08, 1.3908881157931319e-08, 1.3915280483445258e-08 ], "gamma_dfa": 0.11306001050525083, "acc_eval": 0.322265625, "loss_eval": 1.9138463735580444, "epoch": 79 }, { "hidden_norms": [ 37442.84375, 33566284.0, 216908128.0, 359755968.0, 370379136.0 ], "bp_grad_norms_per_sample_med": [ 6.704155453007843e-08, 3.923593672183756e-10, 3.850708640840139e-10, 3.8509884170423447e-10, 3.849042473635933e-10 ], "bp_grad_norms_F": [ 3.509628641040763e-06, 1.4144676541150147e-08, 1.3834353218555862e-08, 1.3832397449675682e-08, 1.3838723056380786e-08 ], "gamma_dfa": 0.11266809623703011, "acc_eval": 0.3251953125, "loss_eval": 1.9121947288513184, "epoch": 80 }, { "hidden_norms": [ 37512.11328125, 33717608.0, 218115872.0, 361736960.0, 372400416.0 ], "bp_grad_norms_per_sample_med": [ 6.701832688804643e-08, 3.917752788851203e-10, 3.835655681960759e-10, 3.835243511662867e-10, 3.835320394607322e-10 ], "bp_grad_norms_F": [ 3.5144942103215726e-06, 1.4111047441645042e-08, 1.3798888254257236e-08, 1.3796943143518092e-08, 1.3803241216692186e-08 ], "gamma_dfa": 0.11281233225781762, "acc_eval": 0.3193359375, "loss_eval": 1.9152591228485107, "epoch": 81 }, { "hidden_norms": [ 37568.84375, 33899664.0, 219258560.0, 363709504.0, 374424128.0 ], "bp_grad_norms_per_sample_med": [ 6.695909604559347e-08, 3.8868031015937277e-10, 3.823757421805851e-10, 3.8241659838789133e-10, 3.8222841558521736e-10 ], "bp_grad_norms_F": [ 3.516150854920852e-06, 1.40706539752955e-08, 1.3756586092483758e-08, 1.375462410635464e-08, 1.3760891093284044e-08 ], "gamma_dfa": 0.11307295318874822, "acc_eval": 0.326171875, "loss_eval": 1.9149377346038818, "epoch": 82 }, { "hidden_norms": [ 37613.421875, 34060644.0, 220322080.0, 365325472.0, 376109056.0 ], "bp_grad_norms_per_sample_med": [ 6.71154296583154e-08, 3.8974332094987574e-10, 3.834943751446218e-10, 3.8340422503502225e-10, 3.8375369548759863e-10 ], "bp_grad_norms_F": [ 3.4982940633199178e-06, 1.4013506799415154e-08, 1.370163893454901e-08, 1.3699707146486162e-08, 1.3705942158992457e-08 ], "gamma_dfa": 0.1128659905607492, "acc_eval": 0.3212890625, "loss_eval": 1.912517786026001, "epoch": 83 }, { "hidden_norms": [ 37660.46875, 34177292.0, 221168784.0, 366778016.0, 377600544.0 ], "bp_grad_norms_per_sample_med": [ 6.68943869186478e-08, 3.894674860394076e-10, 3.8076572450584933e-10, 3.8073258434856427e-10, 3.8100084198688933e-10 ], "bp_grad_norms_F": [ 3.4944750950671732e-06, 1.397998961039093e-08, 1.3671985321650482e-08, 1.3670069520799188e-08, 1.3676272558882374e-08 ], "gamma_dfa": 0.11273636969053769, "acc_eval": 0.318359375, "loss_eval": 1.9171113967895508, "epoch": 84 }, { "hidden_norms": [ 37701.8671875, 34327872.0, 222020640.0, 368143552.0, 379001216.0 ], "bp_grad_norms_per_sample_med": [ 6.639802307972786e-08, 3.87883669628053e-10, 3.8044753458699176e-10, 3.804264403495239e-10, 3.8037359373355173e-10 ], "bp_grad_norms_F": [ 3.4919537483801832e-06, 1.3943878052202763e-08, 1.3639727569625393e-08, 1.3637805551525162e-08, 1.364400148418099e-08 ], "gamma_dfa": 0.11286781356830033, "acc_eval": 0.328125, "loss_eval": 1.9123945236206055, "epoch": 85 }, { "hidden_norms": [ 37739.8125, 34429904.0, 222737072.0, 369295712.0, 380185984.0 ], "bp_grad_norms_per_sample_med": [ 6.741821323430486e-08, 3.8846115213431176e-10, 3.8069486452130263e-10, 3.8060576912357647e-10, 3.809500215279371e-10 ], "bp_grad_norms_F": [ 3.500515958876349e-06, 1.3945418153582523e-08, 1.364027113481825e-08, 1.3638369544821671e-08, 1.364453350305439e-08 ], "gamma_dfa": 0.11293645015939546, "acc_eval": 0.3154296875, "loss_eval": 1.917877197265625, "epoch": 86 }, { "hidden_norms": [ 37773.1484375, 34523684.0, 223309680.0, 370332384.0, 381249280.0 ], "bp_grad_norms_per_sample_med": [ 6.685363729275196e-08, 3.8528755186284513e-10, 3.7927344598287505e-10, 3.7934516639026583e-10, 3.7926364826468273e-10 ], "bp_grad_norms_F": [ 3.4931999834952876e-06, 1.3911479967987361e-08, 1.360801249461474e-08, 1.3606110904618163e-08, 1.3612289961884017e-08 ], "gamma_dfa": 0.11282484548610228, "acc_eval": 0.322265625, "loss_eval": 1.9136494398117065, "epoch": 87 }, { "hidden_norms": [ 37800.29296875, 34600436.0, 223845264.0, 371228288.0, 382171744.0 ], "bp_grad_norms_per_sample_med": [ 6.65767956320451e-08, 3.853606878045923e-10, 3.7911099259879677e-10, 3.789283054000947e-10, 3.791919833684432e-10 ], "bp_grad_norms_F": [ 3.4772997423715424e-06, 1.3876966242776234e-08, 1.3575736979021258e-08, 1.3573847823522556e-08, 1.3580010893576855e-08 ], "gamma_dfa": 0.11266115616490424, "acc_eval": 0.318359375, "loss_eval": 1.912358045578003, "epoch": 88 }, { "hidden_norms": [ 37822.953125, 34659448.0, 224278352.0, 371994688.0, 382956800.0 ], "bp_grad_norms_per_sample_med": [ 6.695878340678973e-08, 3.8400196911148043e-10, 3.7754030457470833e-10, 3.775957047036371e-10, 3.7752789783240814e-10 ], "bp_grad_norms_F": [ 3.488719130473328e-06, 1.387363113281026e-08, 1.3571511026100325e-08, 1.3569623646958462e-08, 1.3575775170693305e-08 ], "gamma_dfa": 0.11286654848299804, "acc_eval": 0.318359375, "loss_eval": 1.9152348041534424, "epoch": 89 }, { "hidden_norms": [ 37843.71484375, 34715836.0, 224633712.0, 372602496.0, 383583840.0 ], "bp_grad_norms_per_sample_med": [ 6.682009967562408e-08, 3.831650552399424e-10, 3.7603772873318064e-10, 3.7600736413345714e-10, 3.763372669052245e-10 ], "bp_grad_norms_F": [ 3.4864976896642474e-06, 1.3852580416084948e-08, 1.355203504971314e-08, 1.3550148558749697e-08, 1.3556297417949281e-08 ], "gamma_dfa": 0.11291119743145828, "acc_eval": 0.326171875, "loss_eval": 1.914948582649231, "epoch": 90 }, { "hidden_norms": [ 37859.484375, 34761876.0, 224938096.0, 373110784.0, 384106720.0 ], "bp_grad_norms_per_sample_med": [ 6.677319674963655e-08, 3.8410433167435087e-10, 3.768680645332978e-10, 3.768474976517666e-10, 3.767945122579164e-10 ], "bp_grad_norms_F": [ 3.480063014649204e-06, 1.3833711953736838e-08, 1.3534608989118624e-08, 1.3532734044474637e-08, 1.3538858922856889e-08 ], "gamma_dfa": 0.1127637956833496, "acc_eval": 0.322265625, "loss_eval": 1.9153952598571777, "epoch": 91 }, { "hidden_norms": [ 37872.0625, 34797108.0, 225202544.0, 373570400.0, 384579200.0 ], "bp_grad_norms_per_sample_med": [ 6.67909034746117e-08, 3.821318816932262e-10, 3.753052590926842e-10, 3.7535435870594824e-10, 3.7532754681990355e-10 ], "bp_grad_norms_F": [ 3.4843556022678968e-06, 1.3827068379157481e-08, 1.352985190550271e-08, 1.3527971631788205e-08, 1.3534107168311493e-08 ], "gamma_dfa": 0.1129197701375233, "acc_eval": 0.318359375, "loss_eval": 1.9156945943832397, "epoch": 92 }, { "hidden_norms": [ 37881.54296875, 34826116.0, 225403072.0, 373889952.0, 384906848.0 ], "bp_grad_norms_per_sample_med": [ 6.663099583192889e-08, 3.844494445015556e-10, 3.765425748980533e-10, 3.7651176620911997e-10, 3.7661743168548867e-10 ], "bp_grad_norms_F": [ 3.480702616798226e-06, 1.382177039488397e-08, 1.3523890451949683e-08, 1.3522016395484115e-08, 1.3528141273866368e-08 ], "gamma_dfa": 0.11285195982236473, "acc_eval": 0.322265625, "loss_eval": 1.9148646593093872, "epoch": 93 }, { "hidden_norms": [ 37889.18359375, 34847784.0, 225551344.0, 374143840.0, 385168448.0 ], "bp_grad_norms_per_sample_med": [ 6.623226767032975e-08, 3.819731198007048e-10, 3.7512581929632915e-10, 3.752123889366743e-10, 3.7511962980296687e-10 ], "bp_grad_norms_F": [ 3.4782924558385275e-06, 1.3813751031932497e-08, 1.3516644692401769e-08, 1.3514763530508844e-08, 1.3520896402496874e-08 ], "gamma_dfa": 0.11281965267244232, "acc_eval": 0.318359375, "loss_eval": 1.9142093658447266, "epoch": 94 }, { "hidden_norms": [ 37895.046875, 34865808.0, 225670928.0, 374345440.0, 385375392.0 ], "bp_grad_norms_per_sample_med": [ 6.64825137164371e-08, 3.829765116147854e-10, 3.7528671836817296e-10, 3.7535685670775365e-10, 3.752768373832538e-10 ], "bp_grad_norms_F": [ 3.4792733458743896e-06, 1.3809607679604596e-08, 1.3512363672418815e-08, 1.3510485175061149e-08, 1.351661271797866e-08 ], "gamma_dfa": 0.11288163481003721, "acc_eval": 0.32421875, "loss_eval": 1.9146695137023926, "epoch": 95 }, { "hidden_norms": [ 37898.87109375, 34878456.0, 225750400.0, 374473248.0, 385506496.0 ], "bp_grad_norms_per_sample_med": [ 6.652722817079848e-08, 3.8302755411834255e-10, 3.759152988891401e-10, 3.7595143664859165e-10, 3.7588568368995823e-10 ], "bp_grad_norms_F": [ 3.480078930806485e-06, 1.3808159060602065e-08, 1.3511034957502943e-08, 1.3509157348323697e-08, 1.351528045034911e-08 ], "gamma_dfa": 0.1128929610213163, "acc_eval": 0.3203125, "loss_eval": 1.9147298336029053, "epoch": 96 }, { "hidden_norms": [ 37900.7109375, 34885860.0, 225787696.0, 374537472.0, 385572896.0 ], "bp_grad_norms_per_sample_med": [ 6.630104820715133e-08, 3.8308795025088216e-10, 3.7579228617801164e-10, 3.7582850720419003e-10, 3.7576297629016153e-10 ], "bp_grad_norms_F": [ 3.4770955608109944e-06, 1.3803015619373582e-08, 1.3505847995531894e-08, 1.3503973050887907e-08, 1.3510093488378061e-08 ], "gamma_dfa": 0.11285188281362935, "acc_eval": 0.3212890625, "loss_eval": 1.9143996238708496, "epoch": 97 }, { "hidden_norms": [ 37902.46875, 34890740.0, 225820192.0, 374593792.0, 385630976.0 ], "bp_grad_norms_per_sample_med": [ 6.624973991620209e-08, 3.8267702895389277e-10, 3.7545791475857015e-10, 3.7555664134103495e-10, 3.75430270205257e-10 ], "bp_grad_norms_F": [ 3.476953224890167e-06, 1.3801756182374447e-08, 1.350452816240022e-08, 1.3502653217756233e-08, 1.3508774543424806e-08 ], "gamma_dfa": 0.11284657929081732, "acc_eval": 0.3203125, "loss_eval": 1.9143402576446533, "epoch": 98 }, { "hidden_norms": [ 37903.22265625, 34893256.0, 225836736.0, 374620576.0, 385658624.0 ], "bp_grad_norms_per_sample_med": [ 6.627380599866228e-08, 3.8272779390169376e-10, 3.7550038078926207e-10, 3.7559910737172686e-10, 3.7547268072479767e-10 ], "bp_grad_norms_F": [ 3.477006657703896e-06, 1.3801344067587706e-08, 1.3504034335198867e-08, 1.350215939055488e-08, 1.3508279828045033e-08 ], "gamma_dfa": 0.11284785682073561, "acc_eval": 0.3203125, "loss_eval": 1.9143691062927246, "epoch": 99 }, { "hidden_norms": [ 37903.25, 34893376.0, 225837280.0, 374621408.0, 385659456.0 ], "bp_grad_norms_per_sample_med": [ 6.626758874972438e-08, 3.826984007471168e-10, 3.755481758904722e-10, 3.756469302285126e-10, 3.755204758260078e-10 ], "bp_grad_norms_F": [ 3.476960500847781e-06, 1.3801311204986177e-08, 1.3503997919883659e-08, 1.3502122975239672e-08, 1.3508243412729826e-08 ], "gamma_dfa": 0.11284651984533411, "acc_eval": 0.3203125, "loss_eval": 1.9143500328063965, "epoch": 100 } ] }