{ "config": { "output_dir": "results/snapshot_evolution_v2", "epochs": 100, "lr": 0.001, "wd": 0.01, "seed": 456, "depth": 4, "d_hidden": 256, "log_every": 1 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.696551322937012, 8.737784385681152, 8.813130378723145, 8.844642639160156, 8.889528274536133 ], "bp_grad_norms_per_sample_med": [ 0.0010079912608489394, 0.0010035138111561537, 0.0009970925748348236, 0.0009936393471434712, 0.000986678060144186 ], "bp_grad_norms_F": [ 0.035574451088905334, 0.035288579761981964, 0.035048045217990875, 0.0346725769340992, 0.03439188003540039 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.4863264560699463, "epoch": 0 }, { "hidden_norms": [ 79.9596176147461, 82.38219451904297, 86.97193145751953, 92.46615600585938, 99.17337799072266 ], "bp_grad_norms_per_sample_med": [ 5.704927025362849e-05, 5.414035331341438e-05, 5.3104751714272425e-05, 5.354730456019752e-05, 5.5780339607736096e-05 ], "bp_grad_norms_F": [ 0.00240120361559093, 0.0021707164123654366, 0.002052225871011615, 0.0020026240963488817, 0.002049861242994666 ], "gamma_dfa": NaN, "acc_eval": 0.400390625, "loss_eval": 1.6942739486694336, "epoch": 1 }, { "hidden_norms": [ 95.21885681152344, 97.9500732421875, 101.84932708740234, 108.15538787841797, 115.16011810302734 ], "bp_grad_norms_per_sample_med": [ 4.467168764676899e-05, 4.3202508095419034e-05, 4.3004638428101316e-05, 4.286228431737982e-05, 4.4292191887507215e-05 ], "bp_grad_norms_F": [ 0.0018949288642033935, 0.0017146588070318103, 0.0016399234300479293, 0.001598119386471808, 0.0016228299355134368 ], "gamma_dfa": NaN, "acc_eval": 0.4599609375, "loss_eval": 1.5051867961883545, "epoch": 2 }, { "hidden_norms": [ 112.65824890136719, 111.87681579589844, 114.76032257080078, 118.74363708496094, 125.05441284179688 ], "bp_grad_norms_per_sample_med": [ 4.4033156882505864e-05, 4.2794465116458014e-05, 4.2031828343169764e-05, 4.134616028750315e-05, 4.226301462040283e-05 ], "bp_grad_norms_F": [ 0.0018527565989643335, 0.0017638156423345208, 0.0016669610049575567, 0.0015881577273830771, 0.0015705813420936465 ], "gamma_dfa": NaN, "acc_eval": 0.4931640625, "loss_eval": 1.4331163167953491, "epoch": 3 }, { "hidden_norms": [ 126.20967102050781, 125.90274810791016, 128.2918243408203, 131.685302734375, 136.71499633789062 ], "bp_grad_norms_per_sample_med": [ 4.358301157481037e-05, 4.267259282642044e-05, 4.196130612399429e-05, 4.08500200137496e-05, 4.0281276596942917e-05 ], "bp_grad_norms_F": [ 0.0018887611804530025, 0.0017927174922078848, 0.0016837789444252849, 0.0015876276884227991, 0.0015263468958437443 ], "gamma_dfa": NaN, "acc_eval": 0.490234375, "loss_eval": 1.4055290222167969, "epoch": 4 }, { "hidden_norms": [ 137.673583984375, 136.8435516357422, 138.64651489257812, 141.41473388671875, 147.87835693359375 ], "bp_grad_norms_per_sample_med": [ 4.085261025466025e-05, 4.06657018174883e-05, 3.941181785194203e-05, 3.858502532239072e-05, 3.7998870539013296e-05 ], "bp_grad_norms_F": [ 0.001770049100741744, 0.0016922445502132177, 0.0016029543476179242, 0.0015241446672007442, 0.0014664788031950593 ], "gamma_dfa": NaN, "acc_eval": 0.50390625, "loss_eval": 1.3763911724090576, "epoch": 5 }, { "hidden_norms": [ 150.45315551757812, 148.60609436035156, 150.3750457763672, 152.9460906982422, 158.2902069091797 ], "bp_grad_norms_per_sample_med": [ 3.8344696804415435e-05, 3.8422465877374634e-05, 3.834897142951377e-05, 3.7070902180857956e-05, 3.6289642594056204e-05 ], "bp_grad_norms_F": [ 0.0017990845954045653, 0.001743242726661265, 0.0016358466818928719, 0.0015305348206311464, 0.0014392968732863665 ], "gamma_dfa": NaN, "acc_eval": 0.5166015625, "loss_eval": 1.373401165008545, "epoch": 6 }, { "hidden_norms": [ 162.06126403808594, 159.53811645507812, 158.62655639648438, 160.54307556152344, 165.60415649414062 ], "bp_grad_norms_per_sample_med": [ 3.797870522248559e-05, 3.766914960579015e-05, 3.7873480323469266e-05, 3.735603968380019e-05, 3.6521956644719467e-05 ], "bp_grad_norms_F": [ 0.001707478309981525, 0.0016470234841108322, 0.0015834521036595106, 0.001506388420239091, 0.001406461582519114 ], "gamma_dfa": NaN, "acc_eval": 0.5283203125, "loss_eval": 1.3223559856414795, "epoch": 7 }, { "hidden_norms": [ 169.8936309814453, 168.42221069335938, 169.54115295410156, 171.452880859375, 176.4298553466797 ], "bp_grad_norms_per_sample_med": [ 3.760562321986072e-05, 3.8139285607030615e-05, 3.7332967622205615e-05, 3.670771184260957e-05, 3.4867567592300475e-05 ], "bp_grad_norms_F": [ 0.001674071652814746, 0.0016396756982430816, 0.001556537114083767, 0.001464220928028226, 0.0013669237960129976 ], "gamma_dfa": NaN, "acc_eval": 0.529296875, "loss_eval": 1.3310301303863525, "epoch": 8 }, { "hidden_norms": [ 177.821044921875, 176.60687255859375, 177.76409912109375, 179.53733825683594, 184.176513671875 ], "bp_grad_norms_per_sample_med": [ 3.643108357209712e-05, 3.605252277338877e-05, 3.6002034903503954e-05, 3.529640525812283e-05, 3.386645403224975e-05 ], "bp_grad_norms_F": [ 0.0016080558998510242, 0.0015692447777837515, 0.0014910849276930094, 0.0014210963854566216, 0.0013221093686297536 ], "gamma_dfa": NaN, "acc_eval": 0.5390625, "loss_eval": 1.3072502613067627, "epoch": 9 }, { "hidden_norms": [ 188.1353759765625, 184.39834594726562, 184.91822814941406, 185.82460021972656, 191.45692443847656 ], "bp_grad_norms_per_sample_med": [ 3.544713035807945e-05, 3.5891316656488925e-05, 3.613864828366786e-05, 3.507022120174952e-05, 3.361281778779812e-05 ], "bp_grad_norms_F": [ 0.0015651460271328688, 0.0015296414494514465, 0.0014787326799705625, 0.0014131872449070215, 0.0013114992761984468 ], "gamma_dfa": NaN, "acc_eval": 0.5537109375, "loss_eval": 1.2935423851013184, "epoch": 10 }, { "hidden_norms": [ 193.53599548339844, 189.33700561523438, 190.08908081054688, 192.31288146972656, 198.0936737060547 ], "bp_grad_norms_per_sample_med": [ 3.3899334084708244e-05, 3.468272552709095e-05, 3.463856774033047e-05, 3.383589137229137e-05, 3.240162550355308e-05 ], "bp_grad_norms_F": [ 0.001495138043537736, 0.0014781414065510035, 0.0014301009941846132, 0.0013711795909330249, 0.0012839946430176497 ], "gamma_dfa": NaN, "acc_eval": 0.544921875, "loss_eval": 1.2766207456588745, "epoch": 11 }, { "hidden_norms": [ 199.85023498535156, 194.9699249267578, 193.4657440185547, 194.60928344726562, 199.97662353515625 ], "bp_grad_norms_per_sample_med": [ 3.289094092906453e-05, 3.539410317898728e-05, 3.491900861263275e-05, 3.4397991839796305e-05, 3.252939859521575e-05 ], "bp_grad_norms_F": [ 0.0015656249597668648, 0.0015614606672897935, 0.0015110056847333908, 0.0014306820230558515, 0.00130200176499784 ], "gamma_dfa": NaN, "acc_eval": 0.5439453125, "loss_eval": 1.2812860012054443, "epoch": 12 }, { "hidden_norms": [ 206.15440368652344, 199.86099243164062, 199.35470581054688, 201.66831970214844, 206.71054077148438 ], "bp_grad_norms_per_sample_med": [ 3.430957076488994e-05, 3.5125638532917947e-05, 3.523785198922269e-05, 3.404217568458989e-05, 3.245573316235095e-05 ], "bp_grad_norms_F": [ 0.0015102275647222996, 0.0015037795528769493, 0.001468595233745873, 0.0013989906292408705, 0.0012804438592866063 ], "gamma_dfa": NaN, "acc_eval": 0.5517578125, "loss_eval": 1.2559274435043335, "epoch": 13 }, { "hidden_norms": [ 209.39404296875, 203.8543243408203, 201.63771057128906, 202.7413787841797, 209.64585876464844 ], "bp_grad_norms_per_sample_med": [ 3.3599189919186756e-05, 3.511353497742675e-05, 3.4795291867339984e-05, 3.415898390812799e-05, 3.225719046895392e-05 ], "bp_grad_norms_F": [ 0.0015785910654813051, 0.0015854343073442578, 0.0015357385855168104, 0.00144979078322649, 0.0013052559224888682 ], "gamma_dfa": NaN, "acc_eval": 0.5478515625, "loss_eval": 1.2778449058532715, "epoch": 14 }, { "hidden_norms": [ 214.74293518066406, 208.2928924560547, 206.78591918945312, 207.79452514648438, 213.0249481201172 ], "bp_grad_norms_per_sample_med": [ 3.347836172906682e-05, 3.457088314462453e-05, 3.509481393848546e-05, 3.4477459848858416e-05, 3.169552292092703e-05 ], "bp_grad_norms_F": [ 0.0015018024714663625, 0.0015100837917998433, 0.0014814585447311401, 0.0014098759274929762, 0.0012745971325784922 ], "gamma_dfa": NaN, "acc_eval": 0.5693359375, "loss_eval": 1.2316113710403442, "epoch": 15 }, { "hidden_norms": [ 223.09906005859375, 214.6353302001953, 211.16726684570312, 210.60520935058594, 214.28952026367188 ], "bp_grad_norms_per_sample_med": [ 3.5336081054992974e-05, 3.693878170452081e-05, 3.7104789953446016e-05, 3.635902612586506e-05, 3.3355980121996254e-05 ], "bp_grad_norms_F": [ 0.0015461220173165202, 0.0015768769662827253, 0.0015498694265261292, 0.001453379518352449, 0.0013068238040432334 ], "gamma_dfa": NaN, "acc_eval": 0.55078125, "loss_eval": 1.2516858577728271, "epoch": 16 }, { "hidden_norms": [ 225.36517333984375, 217.36669921875, 214.27880859375, 215.62054443359375, 219.76197814941406 ], "bp_grad_norms_per_sample_med": [ 3.474476397968829e-05, 3.609717168728821e-05, 3.612042564782314e-05, 3.547673986759037e-05, 3.216006007278338e-05 ], "bp_grad_norms_F": [ 0.001510953065007925, 0.0015347315929830074, 0.0015160846523940563, 0.001440546941012144, 0.0012782461708411574 ], "gamma_dfa": NaN, "acc_eval": 0.583984375, "loss_eval": 1.2262325286865234, "epoch": 17 }, { "hidden_norms": [ 230.7099151611328, 222.3380889892578, 218.67819213867188, 217.3147735595703, 221.999755859375 ], "bp_grad_norms_per_sample_med": [ 3.285402272013016e-05, 3.4367294574622065e-05, 3.490627204882912e-05, 3.413260492379777e-05, 3.064925112994388e-05 ], "bp_grad_norms_F": [ 0.0015693235909566283, 0.0015950833912938833, 0.0015582602936774492, 0.001467122812755406, 0.0012723723193630576 ], "gamma_dfa": NaN, "acc_eval": 0.5751953125, "loss_eval": 1.2127145528793335, "epoch": 18 }, { "hidden_norms": [ 235.28932189941406, 226.01202392578125, 222.56756591796875, 222.25152587890625, 226.0247344970703 ], "bp_grad_norms_per_sample_med": [ 3.336059671710245e-05, 3.488900983938947e-05, 3.518831363180652e-05, 3.5047873097937554e-05, 3.1955056329024956e-05 ], "bp_grad_norms_F": [ 0.0015264152316376567, 0.0015387749299407005, 0.0015209508128464222, 0.001451890799216926, 0.00127940543461591 ], "gamma_dfa": NaN, "acc_eval": 0.5673828125, "loss_eval": 1.2340281009674072, "epoch": 19 }, { "hidden_norms": [ 239.98486328125, 230.95614624023438, 226.7176513671875, 225.3818359375, 231.0238037109375 ], "bp_grad_norms_per_sample_med": [ 3.4207379940198734e-05, 3.5167759051546454e-05, 3.5256896808277816e-05, 3.462574022705667e-05, 3.117474989267066e-05 ], "bp_grad_norms_F": [ 0.0015223841182887554, 0.0015598630998283625, 0.0015445069875568151, 0.0014689662493765354, 0.0012761331163346767 ], "gamma_dfa": NaN, "acc_eval": 0.56640625, "loss_eval": 1.2441283464431763, "epoch": 20 }, { "hidden_norms": [ 245.0663299560547, 233.2012939453125, 227.60426330566406, 226.96006774902344, 229.30145263671875 ], "bp_grad_norms_per_sample_med": [ 3.25386063195765e-05, 3.39963698934298e-05, 3.503257903503254e-05, 3.4624255931703374e-05, 3.013665264006704e-05 ], "bp_grad_norms_F": [ 0.001554132904857397, 0.0015968671068549156, 0.001575724920257926, 0.0014765377854928374, 0.0012655528262257576 ], "gamma_dfa": NaN, "acc_eval": 0.595703125, "loss_eval": 1.1905839443206787, "epoch": 21 }, { "hidden_norms": [ 246.93258666992188, 235.25485229492188, 232.71095275878906, 231.27796936035156, 235.4611358642578 ], "bp_grad_norms_per_sample_med": [ 3.248557914048433e-05, 3.448772622505203e-05, 3.525316424202174e-05, 3.4218086511828005e-05, 2.997798401338514e-05 ], "bp_grad_norms_F": [ 0.001511804643087089, 0.0015418389812111855, 0.001536028808914125, 0.0014609270729124546, 0.001262559788301587 ], "gamma_dfa": NaN, "acc_eval": 0.576171875, "loss_eval": 1.2032543420791626, "epoch": 22 }, { "hidden_norms": [ 251.2838592529297, 237.0211639404297, 234.6432342529297, 233.30433654785156, 238.11598205566406 ], "bp_grad_norms_per_sample_med": [ 3.3030770282493904e-05, 3.484229455352761e-05, 3.59142868546769e-05, 3.533583367243409e-05, 3.1214847695082426e-05 ], "bp_grad_norms_F": [ 0.0015120860189199448, 0.00155613012611866, 0.0015533699188381433, 0.001477457000873983, 0.0012758751399815083 ], "gamma_dfa": NaN, "acc_eval": 0.568359375, "loss_eval": 1.220862627029419, "epoch": 23 }, { "hidden_norms": [ 253.3640594482422, 242.6001739501953, 237.11773681640625, 237.31105041503906, 241.1314697265625 ], "bp_grad_norms_per_sample_med": [ 3.295885835541412e-05, 3.492692485451698e-05, 3.562758502084762e-05, 3.515293064992875e-05, 3.0970571970101446e-05 ], "bp_grad_norms_F": [ 0.001516172313131392, 0.0015499184373766184, 0.0015383078716695309, 0.0014658188447356224, 0.0012659834465011954 ], "gamma_dfa": NaN, "acc_eval": 0.5888671875, "loss_eval": 1.1925604343414307, "epoch": 24 }, { "hidden_norms": [ 258.6325378417969, 245.05575561523438, 239.04722595214844, 237.04385375976562, 240.51011657714844 ], "bp_grad_norms_per_sample_med": [ 3.258220021962188e-05, 3.459660729276948e-05, 3.553628994268365e-05, 3.461805317783728e-05, 3.001722870976664e-05 ], "bp_grad_norms_F": [ 0.0015354488277807832, 0.001572331297211349, 0.0015721773961558938, 0.0014915125211700797, 0.0012740870006382465 ], "gamma_dfa": NaN, "acc_eval": 0.58203125, "loss_eval": 1.1843492984771729, "epoch": 25 }, { "hidden_norms": [ 262.35577392578125, 247.456298828125, 241.52687072753906, 239.8603057861328, 242.48818969726562 ], "bp_grad_norms_per_sample_med": [ 3.335328074172139e-05, 3.581988130463287e-05, 3.6700876080431044e-05, 3.52635579474736e-05, 3.091046164627187e-05 ], "bp_grad_norms_F": [ 0.0015506797935813665, 0.0016048819525167346, 0.0016078166663646698, 0.0015189298428595066, 0.001287299208343029 ], "gamma_dfa": NaN, "acc_eval": 0.6025390625, "loss_eval": 1.2021183967590332, "epoch": 26 }, { "hidden_norms": [ 262.69769287109375, 248.58924865722656, 243.61415100097656, 242.7408905029297, 243.58761596679688 ], "bp_grad_norms_per_sample_med": [ 3.363215728313662e-05, 3.542406557244249e-05, 3.617940456024371e-05, 3.522956103552133e-05, 3.093081613769755e-05 ], "bp_grad_norms_F": [ 0.0015515872510150075, 0.0015918170101940632, 0.0015870564384385943, 0.0015067857457324862, 0.001285396981984377 ], "gamma_dfa": NaN, "acc_eval": 0.576171875, "loss_eval": 1.1753299236297607, "epoch": 27 }, { "hidden_norms": [ 264.57330322265625, 252.62904357910156, 246.43833923339844, 245.4523468017578, 247.43896484375 ], "bp_grad_norms_per_sample_med": [ 3.3458851248724386e-05, 3.510742317303084e-05, 3.596700116759166e-05, 3.530932735884562e-05, 3.0871200578985736e-05 ], "bp_grad_norms_F": [ 0.0015561054460704327, 0.0015992044936865568, 0.0016016490990296006, 0.0015203922521322966, 0.001274992828257382 ], "gamma_dfa": NaN, "acc_eval": 0.587890625, "loss_eval": 1.1872658729553223, "epoch": 28 }, { "hidden_norms": [ 268.63336181640625, 253.74609375, 247.2230224609375, 244.07066345214844, 248.91635131835938 ], "bp_grad_norms_per_sample_med": [ 3.388441837159917e-05, 3.55305674020201e-05, 3.711709723575041e-05, 3.565939550753683e-05, 3.06438232655637e-05 ], "bp_grad_norms_F": [ 0.0015880814753472805, 0.001632494037039578, 0.0016352345701307058, 0.001542495796456933, 0.001282386132515967 ], "gamma_dfa": NaN, "acc_eval": 0.59375, "loss_eval": 1.1748178005218506, "epoch": 29 }, { "hidden_norms": [ 269.5155944824219, 254.65687561035156, 249.08070373535156, 246.4084930419922, 248.03065490722656 ], "bp_grad_norms_per_sample_med": [ 3.340150215080939e-05, 3.542837657732889e-05, 3.656153057818301e-05, 3.62997452612035e-05, 3.134588405373506e-05 ], "bp_grad_norms_F": [ 0.0015988025115802884, 0.0016428054077550769, 0.0016343789175152779, 0.00154898373875767, 0.001290567102842033 ], "gamma_dfa": NaN, "acc_eval": 0.5888671875, "loss_eval": 1.184614658355713, "epoch": 30 }, { "hidden_norms": [ 273.0482482910156, 255.88157653808594, 249.6538543701172, 246.09181213378906, 250.09861755371094 ], "bp_grad_norms_per_sample_med": [ 3.485401612124406e-05, 3.613552325987257e-05, 3.727355215232819e-05, 3.6410303437151015e-05, 3.111722253379412e-05 ], "bp_grad_norms_F": [ 0.0016218513483181596, 0.001677986583672464, 0.0016929754056036472, 0.001593436230905354, 0.0013143697287887335 ], "gamma_dfa": NaN, "acc_eval": 0.5673828125, "loss_eval": 1.2012369632720947, "epoch": 31 }, { "hidden_norms": [ 274.05010986328125, 255.77792358398438, 247.96664428710938, 246.15379333496094, 248.44847106933594 ], "bp_grad_norms_per_sample_med": [ 3.431778895901516e-05, 3.609380655689165e-05, 3.7377911212388426e-05, 3.6012417695019394e-05, 3.0985673220129684e-05 ], "bp_grad_norms_F": [ 0.0016116296174004674, 0.0016683804569765925, 0.0016786488704383373, 0.0015687323175370693, 0.001289981184527278 ], "gamma_dfa": NaN, "acc_eval": 0.5986328125, "loss_eval": 1.1654620170593262, "epoch": 32 }, { "hidden_norms": [ 274.6156921386719, 257.166259765625, 251.9473876953125, 251.01661682128906, 252.84222412109375 ], "bp_grad_norms_per_sample_med": [ 3.185174864483997e-05, 3.433173696976155e-05, 3.572784407879226e-05, 3.4680619137361646e-05, 2.997389128722716e-05 ], "bp_grad_norms_F": [ 0.0015743848634883761, 0.001610185718163848, 0.0016222007106989622, 0.0015360275283455849, 0.0012806184822693467 ], "gamma_dfa": NaN, "acc_eval": 0.58984375, "loss_eval": 1.1679120063781738, "epoch": 33 }, { "hidden_norms": [ 274.3385009765625, 256.1404724121094, 249.90264892578125, 247.3904266357422, 249.5623016357422 ], "bp_grad_norms_per_sample_med": [ 3.419954009586945e-05, 3.6830995668424293e-05, 3.8464357203338295e-05, 3.64230691047851e-05, 3.0958552088122815e-05 ], "bp_grad_norms_F": [ 0.0016346886986866593, 0.0016823107143864036, 0.0016956342151388526, 0.0015958002768456936, 0.0013100137002766132 ], "gamma_dfa": NaN, "acc_eval": 0.5927734375, "loss_eval": 1.1599082946777344, "epoch": 34 }, { "hidden_norms": [ 276.65985107421875, 258.50543212890625, 251.1997833251953, 247.7036895751953, 248.07545471191406 ], "bp_grad_norms_per_sample_med": [ 3.384043520782143e-05, 3.567537714843638e-05, 3.686825220938772e-05, 3.5754670534515753e-05, 3.0301211154437624e-05 ], "bp_grad_norms_F": [ 0.0016451155534014106, 0.0016956959152594209, 0.001703266054391861, 0.0016015227884054184, 0.0013142916141077876 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.148215889930725, "epoch": 35 }, { "hidden_norms": [ 279.6298522949219, 261.1481018066406, 253.67742919921875, 250.86221313476562, 250.6768035888672 ], "bp_grad_norms_per_sample_med": [ 3.341220144648105e-05, 3.499272861517966e-05, 3.6701327189803123e-05, 3.602671858971007e-05, 3.081390605075285e-05 ], "bp_grad_norms_F": [ 0.0016287019243463874, 0.0016769150970503688, 0.0016951658762991428, 0.0015969424275681376, 0.0013187138829380274 ], "gamma_dfa": NaN, "acc_eval": 0.6015625, "loss_eval": 1.1451219320297241, "epoch": 36 }, { "hidden_norms": [ 277.2866516113281, 258.4331359863281, 251.4995880126953, 249.0448455810547, 248.5166015625 ], "bp_grad_norms_per_sample_med": [ 3.2723561162129045e-05, 3.4428499930072576e-05, 3.571901106624864e-05, 3.4436179703334346e-05, 2.9252587410155684e-05 ], "bp_grad_norms_F": [ 0.0016638770466670394, 0.0017149352934211493, 0.0017208203207701445, 0.0016291715437546372, 0.0013402353506535292 ], "gamma_dfa": NaN, "acc_eval": 0.599609375, "loss_eval": 1.145239233970642, "epoch": 37 }, { "hidden_norms": [ 279.7109680175781, 259.3131103515625, 250.73587036132812, 247.214111328125, 249.20944213867188 ], "bp_grad_norms_per_sample_med": [ 3.449835639912635e-05, 3.682902752188966e-05, 3.780073166126385e-05, 3.652105442597531e-05, 3.046718666155357e-05 ], "bp_grad_norms_F": [ 0.001753124757669866, 0.0018144651548936963, 0.0018306451383978128, 0.0017095789080485702, 0.001379602705128491 ], "gamma_dfa": NaN, "acc_eval": 0.5908203125, "loss_eval": 1.1677792072296143, "epoch": 38 }, { "hidden_norms": [ 279.9946594238281, 260.2458190917969, 252.0008087158203, 250.56716918945312, 250.73135375976562 ], "bp_grad_norms_per_sample_med": [ 3.489958180580288e-05, 3.730110984179191e-05, 3.791403287323192e-05, 3.650010330602527e-05, 3.076100256294012e-05 ], "bp_grad_norms_F": [ 0.0017145961755886674, 0.0017580300336703658, 0.001775139826349914, 0.0016669962788000703, 0.0013597821816802025 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1510668992996216, "epoch": 39 }, { "hidden_norms": [ 280.5132751464844, 260.75970458984375, 252.2814178466797, 249.84548950195312, 248.41783142089844 ], "bp_grad_norms_per_sample_med": [ 3.552919588400982e-05, 3.777973688556813e-05, 3.952483166358434e-05, 3.783141073654406e-05, 3.1490348192164674e-05 ], "bp_grad_norms_F": [ 0.0017431442392989993, 0.0017984459409490228, 0.0018199888290837407, 0.0017078405944630504, 0.0013792469399049878 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1412110328674316, "epoch": 40 }, { "hidden_norms": [ 279.3873596191406, 259.55096435546875, 251.9462432861328, 247.29443359375, 247.82852172851562 ], "bp_grad_norms_per_sample_med": [ 3.456972990534268e-05, 3.654780448414385e-05, 3.848340566037223e-05, 3.736113285413012e-05, 3.1597948691342026e-05 ], "bp_grad_norms_F": [ 0.0017544032307341695, 0.0018107325304299593, 0.0018319039372727275, 0.0017261328175663948, 0.0013868761016055942 ], "gamma_dfa": NaN, "acc_eval": 0.6083984375, "loss_eval": 1.1418483257293701, "epoch": 41 }, { "hidden_norms": [ 282.4360656738281, 261.22149658203125, 251.49090576171875, 247.5189208984375, 247.03427124023438 ], "bp_grad_norms_per_sample_med": [ 3.5179280530428514e-05, 3.728548108483665e-05, 3.779769394895993e-05, 3.6327692214399576e-05, 3.026284321094863e-05 ], "bp_grad_norms_F": [ 0.0017881252570077777, 0.0018441356951370835, 0.0018691252917051315, 0.0017487212317064404, 0.0013921407517045736 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1468144655227661, "epoch": 42 }, { "hidden_norms": [ 283.1267395019531, 261.29425048828125, 252.38563537597656, 248.00192260742188, 246.58505249023438 ], "bp_grad_norms_per_sample_med": [ 3.485176421236247e-05, 3.699021544889547e-05, 3.812833165284246e-05, 3.7145182432141155e-05, 3.1198313081404194e-05 ], "bp_grad_norms_F": [ 0.0017692983383312821, 0.0018438888946548104, 0.001876220339909196, 0.0017641744343563914, 0.0014044356066733599 ], "gamma_dfa": NaN, "acc_eval": 0.62109375, "loss_eval": 1.1329892873764038, "epoch": 43 }, { "hidden_norms": [ 281.29327392578125, 259.43359375, 249.52906799316406, 246.0892333984375, 243.162109375 ], "bp_grad_norms_per_sample_med": [ 3.586204911698587e-05, 3.787377499975264e-05, 3.9215286960825324e-05, 3.7436715501826257e-05, 3.160976120852865e-05 ], "bp_grad_norms_F": [ 0.0018376735970377922, 0.0019067999674007297, 0.0019337635021656752, 0.0017983472207561135, 0.001438757055439055 ], "gamma_dfa": NaN, "acc_eval": 0.6181640625, "loss_eval": 1.144508957862854, "epoch": 44 }, { "hidden_norms": [ 282.5230407714844, 259.55322265625, 248.72308349609375, 245.0394287109375, 243.0651092529297 ], "bp_grad_norms_per_sample_med": [ 3.6309906136011705e-05, 3.868114436045289e-05, 4.0484872442903e-05, 3.8203681469894946e-05, 3.144023139611818e-05 ], "bp_grad_norms_F": [ 0.0018340122187510133, 0.0019134157337248325, 0.0019425065256655216, 0.0018252682639285922, 0.001443033921532333 ], "gamma_dfa": NaN, "acc_eval": 0.61328125, "loss_eval": 1.1290326118469238, "epoch": 45 }, { "hidden_norms": [ 280.8598327636719, 260.14111328125, 250.84779357910156, 245.9561767578125, 243.0910186767578 ], "bp_grad_norms_per_sample_med": [ 3.4626806154847145e-05, 3.693445250974037e-05, 3.8311845855787396e-05, 3.7721722037531435e-05, 3.145459049846977e-05 ], "bp_grad_norms_F": [ 0.0018591763218864799, 0.0019209657330065966, 0.0019388735527172685, 0.001830682042054832, 0.001447839429602027 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1423537731170654, "epoch": 46 }, { "hidden_norms": [ 280.17266845703125, 259.26568603515625, 248.45452880859375, 243.45750427246094, 241.2735137939453 ], "bp_grad_norms_per_sample_med": [ 3.609486884670332e-05, 3.887504499289207e-05, 4.01619981857948e-05, 3.9294092857744545e-05, 3.1412804673891515e-05 ], "bp_grad_norms_F": [ 0.0018975000130012631, 0.0019804267212748528, 0.002001592656597495, 0.0018729616422206163, 0.0014571875799447298 ], "gamma_dfa": NaN, "acc_eval": 0.61328125, "loss_eval": 1.1366385221481323, "epoch": 47 }, { "hidden_norms": [ 281.79833984375, 259.25860595703125, 249.18551635742188, 244.24977111816406, 240.67100524902344 ], "bp_grad_norms_per_sample_med": [ 3.47710374626331e-05, 3.7153975426917896e-05, 3.885528349201195e-05, 3.792768620769493e-05, 3.113777347607538e-05 ], "bp_grad_norms_F": [ 0.0019318967824801803, 0.0019981141667813063, 0.0020311782136559486, 0.0018996316939592361, 0.0014788025291636586 ], "gamma_dfa": NaN, "acc_eval": 0.6162109375, "loss_eval": 1.138331651687622, "epoch": 48 }, { "hidden_norms": [ 282.3840637207031, 258.1807861328125, 248.13995361328125, 243.45587158203125, 239.51858520507812 ], "bp_grad_norms_per_sample_med": [ 3.68369001080282e-05, 3.935660788556561e-05, 4.189974788459949e-05, 3.9929436752572656e-05, 3.188087430316955e-05 ], "bp_grad_norms_F": [ 0.0019372758688405156, 0.0020036858040839434, 0.0020287453662604094, 0.001896715839393437, 0.0014835885958746076 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1377842426300049, "epoch": 49 }, { "hidden_norms": [ 280.9283142089844, 257.81524658203125, 248.47984313964844, 241.96157836914062, 238.4756317138672 ], "bp_grad_norms_per_sample_med": [ 3.7310775951482356e-05, 3.98769298044499e-05, 4.1753111872822046e-05, 4.021048516733572e-05, 3.21856678056065e-05 ], "bp_grad_norms_F": [ 0.0019433718407526612, 0.0020235073752701283, 0.002055324148386717, 0.0019370814552530646, 0.0015049076173454523 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.133098840713501, "epoch": 50 }, { "hidden_norms": [ 279.66400146484375, 256.7322082519531, 246.65223693847656, 241.45947265625, 236.65582275390625 ], "bp_grad_norms_per_sample_med": [ 3.620017014327459e-05, 3.800772174145095e-05, 4.072795491083525e-05, 3.888807259500027e-05, 3.182498039677739e-05 ], "bp_grad_norms_F": [ 0.0019729172345250845, 0.002036863239482045, 0.0020802877843379974, 0.0019662927370518446, 0.0015235996106639504 ], "gamma_dfa": NaN, "acc_eval": 0.619140625, "loss_eval": 1.1315571069717407, "epoch": 51 }, { "hidden_norms": [ 280.00152587890625, 258.0238037109375, 247.4223175048828, 240.8101348876953, 237.3229217529297 ], "bp_grad_norms_per_sample_med": [ 3.6401659599505365e-05, 3.855170143651776e-05, 4.065703978994861e-05, 3.844475213554688e-05, 3.1645795388612896e-05 ], "bp_grad_norms_F": [ 0.0019983802922070026, 0.0020701857283711433, 0.002107742242515087, 0.001981276087462902, 0.0015306670684367418 ], "gamma_dfa": NaN, "acc_eval": 0.6171875, "loss_eval": 1.137194037437439, "epoch": 52 }, { "hidden_norms": [ 278.19708251953125, 255.23036193847656, 245.5857696533203, 239.48196411132812, 235.09983825683594 ], "bp_grad_norms_per_sample_med": [ 3.97727417293936e-05, 4.185501529718749e-05, 4.392741175252013e-05, 4.302372326492332e-05, 3.48737376043573e-05 ], "bp_grad_norms_F": [ 0.002044696593657136, 0.00211329385638237, 0.002144050318747759, 0.0020148823969066143, 0.0015573638956993818 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1354646682739258, "epoch": 53 }, { "hidden_norms": [ 276.7043762207031, 255.62408447265625, 243.71484375, 238.2984161376953, 233.8153076171875 ], "bp_grad_norms_per_sample_med": [ 3.715257116709836e-05, 3.887641287292354e-05, 4.099323268746957e-05, 3.948296944145113e-05, 3.221148654120043e-05 ], "bp_grad_norms_F": [ 0.0020365805830806494, 0.00209893099963665, 0.0021342532709240913, 0.0020123852882534266, 0.0015702869277447462 ], "gamma_dfa": NaN, "acc_eval": 0.623046875, "loss_eval": 1.1295127868652344, "epoch": 54 }, { "hidden_norms": [ 279.308349609375, 255.30587768554688, 243.6786651611328, 237.71823120117188, 232.89991760253906 ], "bp_grad_norms_per_sample_med": [ 3.9407084841514006e-05, 4.1900668293237686e-05, 4.364689812064171e-05, 4.154618363827467e-05, 3.264051701989956e-05 ], "bp_grad_norms_F": [ 0.0021011638455092907, 0.002175872679799795, 0.002217113971710205, 0.002071501687169075, 0.0015880379360169172 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.1201554536819458, "epoch": 55 }, { "hidden_norms": [ 276.9933166503906, 253.379638671875, 244.23390197753906, 238.01930236816406, 233.3076171875 ], "bp_grad_norms_per_sample_med": [ 3.799827391048893e-05, 4.017200990347192e-05, 4.2665858927648515e-05, 4.083341627847403e-05, 3.210103386663832e-05 ], "bp_grad_norms_F": [ 0.002064710482954979, 0.0021362933330237865, 0.0021728368010371923, 0.0020478416699916124, 0.0015873984666541219 ], "gamma_dfa": NaN, "acc_eval": 0.630859375, "loss_eval": 1.1222728490829468, "epoch": 56 }, { "hidden_norms": [ 276.41168212890625, 251.91033935546875, 241.81382751464844, 234.8279266357422, 230.53956604003906 ], "bp_grad_norms_per_sample_med": [ 3.770063631236553e-05, 3.94962407881394e-05, 4.150882887188345e-05, 4.040042040287517e-05, 3.2475280022481456e-05 ], "bp_grad_norms_F": [ 0.002123177284374833, 0.0021965675987303257, 0.00223328173160553, 0.0020905195269733667, 0.0016039537731558084 ], "gamma_dfa": NaN, "acc_eval": 0.630859375, "loss_eval": 1.1091526746749878, "epoch": 57 }, { "hidden_norms": [ 274.760986328125, 250.0972442626953, 239.511474609375, 233.29798889160156, 228.16070556640625 ], "bp_grad_norms_per_sample_med": [ 3.728809315362014e-05, 4.0525967051507905e-05, 4.239326517563313e-05, 4.087138222530484e-05, 3.216422919649631e-05 ], "bp_grad_norms_F": [ 0.0021635335870087147, 0.0022461507469415665, 0.0022873859852552414, 0.002144098049029708, 0.001636566361412406 ], "gamma_dfa": NaN, "acc_eval": 0.6416015625, "loss_eval": 1.1180500984191895, "epoch": 58 }, { "hidden_norms": [ 273.91064453125, 249.49452209472656, 238.54373168945312, 232.80734252929688, 225.6833953857422 ], "bp_grad_norms_per_sample_med": [ 3.966117583331652e-05, 4.1986208088928834e-05, 4.316144259064458e-05, 4.332280877861194e-05, 3.44519030477386e-05 ], "bp_grad_norms_F": [ 0.0021825931034982204, 0.0022617392241954803, 0.0023092019837349653, 0.00216560042463243, 0.0016612708568572998 ], "gamma_dfa": NaN, "acc_eval": 0.6279296875, "loss_eval": 1.131789207458496, "epoch": 59 }, { "hidden_norms": [ 274.90008544921875, 250.0712127685547, 238.57467651367188, 231.15719604492188, 225.55587768554688 ], "bp_grad_norms_per_sample_med": [ 4.130819797865115e-05, 4.363877815194428e-05, 4.489632920012809e-05, 4.4512398744700477e-05, 3.470887531875633e-05 ], "bp_grad_norms_F": [ 0.002240521367639303, 0.002310203853994608, 0.0023576009552925825, 0.002204722724854946, 0.0016799044096842408 ], "gamma_dfa": NaN, "acc_eval": 0.6240234375, "loss_eval": 1.1323366165161133, "epoch": 60 }, { "hidden_norms": [ 275.4504699707031, 249.5341796875, 237.540283203125, 230.39208984375, 224.43321228027344 ], "bp_grad_norms_per_sample_med": [ 4.056218676851131e-05, 4.288182390155271e-05, 4.5818003854947165e-05, 4.356648423708975e-05, 3.492152245598845e-05 ], "bp_grad_norms_F": [ 0.002249655080959201, 0.0023316002916544676, 0.002382595557719469, 0.002231382764875889, 0.00168902100995183 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.1275749206542969, "epoch": 61 }, { "hidden_norms": [ 273.6263122558594, 248.43479919433594, 234.8235321044922, 228.0020751953125, 222.4278106689453 ], "bp_grad_norms_per_sample_med": [ 4.0597744373371825e-05, 4.323143730289303e-05, 4.647616151487455e-05, 4.4688425987260416e-05, 3.521826511132531e-05 ], "bp_grad_norms_F": [ 0.002307126997038722, 0.0023877634666860104, 0.0024417925160378218, 0.0022813305258750916, 0.001714664394967258 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.1252907514572144, "epoch": 62 }, { "hidden_norms": [ 271.7508239746094, 246.79209899902344, 233.84280395507812, 226.96934509277344, 220.57888793945312 ], "bp_grad_norms_per_sample_med": [ 4.177554728812538e-05, 4.393904600874521e-05, 4.635817458620295e-05, 4.428510874276981e-05, 3.396430111024529e-05 ], "bp_grad_norms_F": [ 0.002355988370254636, 0.0024527544155716896, 0.0025022663176059723, 0.0023387460969388485, 0.0017370774876326323 ], "gamma_dfa": NaN, "acc_eval": 0.62109375, "loss_eval": 1.1249933242797852, "epoch": 63 }, { "hidden_norms": [ 271.7035217285156, 246.70675659179688, 233.96661376953125, 226.53175354003906, 220.52359008789062 ], "bp_grad_norms_per_sample_med": [ 4.2499312257859856e-05, 4.503092714003287e-05, 4.670799171435647e-05, 4.5866876462241635e-05, 3.720118911587633e-05 ], "bp_grad_norms_F": [ 0.002408105880022049, 0.0024944571778178215, 0.002545328810811043, 0.002381332218647003, 0.0017641197191551328 ], "gamma_dfa": NaN, "acc_eval": 0.625, "loss_eval": 1.1418037414550781, "epoch": 64 }, { "hidden_norms": [ 271.0970153808594, 246.78770446777344, 234.2436065673828, 226.7012176513672, 219.61680603027344 ], "bp_grad_norms_per_sample_med": [ 4.040581188746728e-05, 4.3224725231993943e-05, 4.4494401663541794e-05, 4.3532105337362736e-05, 3.4612559829838574e-05 ], "bp_grad_norms_F": [ 0.0024068003986030817, 0.002485552802681923, 0.002538430504500866, 0.002368941670283675, 0.0017652952810749412 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.1279454231262207, "epoch": 65 }, { "hidden_norms": [ 270.66473388671875, 244.8525390625, 232.8356475830078, 224.2222137451172, 217.24554443359375 ], "bp_grad_norms_per_sample_med": [ 4.1549992602085695e-05, 4.493525193538517e-05, 4.7448877012357116e-05, 4.479651397559792e-05, 3.5401590139372274e-05 ], "bp_grad_norms_F": [ 0.002463088370859623, 0.002551029436290264, 0.002594881458207965, 0.0024160456378012896, 0.001803302438929677 ], "gamma_dfa": NaN, "acc_eval": 0.6376953125, "loss_eval": 1.1330325603485107, "epoch": 66 }, { "hidden_norms": [ 269.8645935058594, 243.50497436523438, 231.37692260742188, 222.27967834472656, 215.22059631347656 ], "bp_grad_norms_per_sample_med": [ 4.1519095248077065e-05, 4.487609476200305e-05, 4.708006963483058e-05, 4.4878328480990604e-05, 3.578457108233124e-05 ], "bp_grad_norms_F": [ 0.0024854058865457773, 0.0025721373967826366, 0.0026270432863384485, 0.0024401266127824783, 0.0018134783022105694 ], "gamma_dfa": NaN, "acc_eval": 0.63671875, "loss_eval": 1.123876690864563, "epoch": 67 }, { "hidden_norms": [ 269.28570556640625, 242.04359436035156, 229.53497314453125, 221.24327087402344, 215.1306610107422 ], "bp_grad_norms_per_sample_med": [ 4.279898348613642e-05, 4.6176737669156864e-05, 4.813459236174822e-05, 4.609950337908231e-05, 3.566763552953489e-05 ], "bp_grad_norms_F": [ 0.0024860126432031393, 0.002575797727331519, 0.0026342689525336027, 0.0024608916137367487, 0.0018216874450445175 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.122079849243164, "epoch": 68 }, { "hidden_norms": [ 268.3481140136719, 242.3759765625, 229.19241333007812, 220.78233337402344, 213.58587646484375 ], "bp_grad_norms_per_sample_med": [ 4.163750054431148e-05, 4.50872685178183e-05, 4.8797548515722156e-05, 4.597716542775743e-05, 3.505409767967649e-05 ], "bp_grad_norms_F": [ 0.0025033215060830116, 0.002596172271296382, 0.002654082840308547, 0.002480126451700926, 0.0018305372213944793 ], "gamma_dfa": NaN, "acc_eval": 0.6328125, "loss_eval": 1.1238645315170288, "epoch": 69 }, { "hidden_norms": [ 267.92425537109375, 239.90985107421875, 228.08212280273438, 219.12835693359375, 212.38052368164062 ], "bp_grad_norms_per_sample_med": [ 4.42373457190115e-05, 4.6515069698216394e-05, 4.823393464903347e-05, 4.762738535646349e-05, 3.6444154829951e-05 ], "bp_grad_norms_F": [ 0.0025684935972094536, 0.002675230847671628, 0.0027295781765133142, 0.0025394319090992212, 0.0018643162911757827 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.135793685913086, "epoch": 70 }, { "hidden_norms": [ 266.2279052734375, 239.37680053710938, 226.3264923095703, 218.04910278320312, 210.68836975097656 ], "bp_grad_norms_per_sample_med": [ 4.4824198994319886e-05, 4.7638000978622586e-05, 4.962517414242029e-05, 4.7396664740517735e-05, 3.5957502404926345e-05 ], "bp_grad_norms_F": [ 0.002600227715447545, 0.002714222064241767, 0.002763595897704363, 0.0025755097158253193, 0.0018772372277453542 ], "gamma_dfa": NaN, "acc_eval": 0.623046875, "loss_eval": 1.123576283454895, "epoch": 71 }, { "hidden_norms": [ 266.4837951660156, 239.67581176757812, 227.51805114746094, 218.58811950683594, 211.26596069335938 ], "bp_grad_norms_per_sample_med": [ 4.245663512847386e-05, 4.560768138617277e-05, 4.797001020051539e-05, 4.539322981145233e-05, 3.4807548217941076e-05 ], "bp_grad_norms_F": [ 0.0025984421372413635, 0.002703956561163068, 0.002762222196906805, 0.002577459439635277, 0.0018865292659029365 ], "gamma_dfa": NaN, "acc_eval": 0.61328125, "loss_eval": 1.1362444162368774, "epoch": 72 }, { "hidden_norms": [ 264.8100891113281, 237.96121215820312, 226.14822387695312, 217.3454132080078, 208.98077392578125 ], "bp_grad_norms_per_sample_med": [ 4.217765308567323e-05, 4.603620618581772e-05, 4.735886977869086e-05, 4.5346474507823586e-05, 3.594472218537703e-05 ], "bp_grad_norms_F": [ 0.0026375274173915386, 0.0027397233061492443, 0.0028012648690491915, 0.0026011927984654903, 0.0018980697495862842 ], "gamma_dfa": NaN, "acc_eval": 0.6318359375, "loss_eval": 1.1286330223083496, "epoch": 73 }, { "hidden_norms": [ 264.8172302246094, 238.0478057861328, 225.0303497314453, 217.1344757080078, 209.569580078125 ], "bp_grad_norms_per_sample_med": [ 4.242224895278923e-05, 4.6696859499206766e-05, 4.831598562304862e-05, 4.5893459173385054e-05, 3.54531584889628e-05 ], "bp_grad_norms_F": [ 0.0026500027161091566, 0.002760941395536065, 0.0028223067056387663, 0.0026202781591564417, 0.001915424014441669 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.1304678916931152, "epoch": 74 }, { "hidden_norms": [ 264.7013854980469, 237.4438018798828, 225.43527221679688, 216.18502807617188, 208.08302307128906 ], "bp_grad_norms_per_sample_med": [ 4.43761091446504e-05, 4.801220347872004e-05, 4.9817157560028136e-05, 4.829527097172104e-05, 3.73583534383215e-05 ], "bp_grad_norms_F": [ 0.002686889609321952, 0.0028029615059494972, 0.002866453491151333, 0.002669648267328739, 0.0019349679350852966 ], "gamma_dfa": NaN, "acc_eval": 0.6240234375, "loss_eval": 1.1350867748260498, "epoch": 75 }, { "hidden_norms": [ 264.3004455566406, 236.1824188232422, 223.4772186279297, 214.64682006835938, 207.52272033691406 ], "bp_grad_norms_per_sample_med": [ 4.3003376049455255e-05, 4.6196739276638255e-05, 4.8772617446957156e-05, 4.7264005843317136e-05, 3.6179160815663636e-05 ], "bp_grad_norms_F": [ 0.0027191757690161467, 0.0028310383204370737, 0.0028950762934982777, 0.002689448418095708, 0.0019433586858212948 ], "gamma_dfa": NaN, "acc_eval": 0.6259765625, "loss_eval": 1.1378443241119385, "epoch": 76 }, { "hidden_norms": [ 262.62811279296875, 235.80126953125, 222.7261199951172, 213.42430114746094, 205.99493408203125 ], "bp_grad_norms_per_sample_med": [ 4.4399519538274035e-05, 4.737091148854233e-05, 4.900431667920202e-05, 4.768445069203153e-05, 3.608842962421477e-05 ], "bp_grad_norms_F": [ 0.0027450472116470337, 0.0028562990482896566, 0.0029378861654549837, 0.0027161173056811094, 0.0019581648521125317 ], "gamma_dfa": NaN, "acc_eval": 0.6220703125, "loss_eval": 1.137312889099121, "epoch": 77 }, { "hidden_norms": [ 262.612060546875, 235.62489318847656, 222.1566925048828, 212.93875122070312, 205.24142456054688 ], "bp_grad_norms_per_sample_med": [ 4.443951911525801e-05, 4.7095887566683814e-05, 4.906025424133986e-05, 4.8352503654314205e-05, 3.6001758417114615e-05 ], "bp_grad_norms_F": [ 0.002745443256571889, 0.002859732834622264, 0.002942001214250922, 0.002725319005548954, 0.001969744684174657 ], "gamma_dfa": NaN, "acc_eval": 0.6279296875, "loss_eval": 1.126712441444397, "epoch": 78 }, { "hidden_norms": [ 262.6611633300781, 235.52174377441406, 221.89093017578125, 213.1799774169922, 204.9930877685547 ], "bp_grad_norms_per_sample_med": [ 4.5766752009512857e-05, 4.834473293158226e-05, 5.181043525226414e-05, 4.826926306122914e-05, 3.573719732230529e-05 ], "bp_grad_norms_F": [ 0.0027218428440392017, 0.002838012296706438, 0.002919211983680725, 0.0027209871914237738, 0.001970200566574931 ], "gamma_dfa": NaN, "acc_eval": 0.62109375, "loss_eval": 1.1352139711380005, "epoch": 79 }, { "hidden_norms": [ 261.58856201171875, 234.9381103515625, 221.2636260986328, 211.9308624267578, 204.54647827148438 ], "bp_grad_norms_per_sample_med": [ 4.5460306864697486e-05, 4.857210296904668e-05, 4.9856924306368455e-05, 4.823243580176495e-05, 3.731804099516012e-05 ], "bp_grad_norms_F": [ 0.002767088357359171, 0.0028805267065763474, 0.0029621378052979708, 0.00275496207177639, 0.001986011164262891 ], "gamma_dfa": NaN, "acc_eval": 0.6259765625, "loss_eval": 1.134087324142456, "epoch": 80 }, { "hidden_norms": [ 261.3812561035156, 234.79383850097656, 220.678955078125, 211.66114807128906, 203.9405517578125 ], "bp_grad_norms_per_sample_med": [ 4.64644399471581e-05, 5.052189590060152e-05, 5.2927574870409444e-05, 5.0570299208629876e-05, 3.7252495530992746e-05 ], "bp_grad_norms_F": [ 0.0027735778130590916, 0.002885127207264304, 0.0029686433263123035, 0.002763227093964815, 0.0019980284851044416 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.135728359222412, "epoch": 81 }, { "hidden_norms": [ 261.2560729980469, 233.66014099121094, 220.25682067871094, 211.13511657714844, 203.18130493164062 ], "bp_grad_norms_per_sample_med": [ 4.6268629375845194e-05, 4.9701800890034065e-05, 5.169105133973062e-05, 5.069339385954663e-05, 3.80978781322483e-05 ], "bp_grad_norms_F": [ 0.0028223153203725815, 0.0029419492930173874, 0.0030234854202717543, 0.002805375959724188, 0.002015760401263833 ], "gamma_dfa": NaN, "acc_eval": 0.619140625, "loss_eval": 1.1317980289459229, "epoch": 82 }, { "hidden_norms": [ 260.62255859375, 233.12937927246094, 219.89907836914062, 210.4191436767578, 202.494873046875 ], "bp_grad_norms_per_sample_med": [ 4.5126867917133495e-05, 4.8572586820228025e-05, 5.1520797569537535e-05, 4.971070302417502e-05, 3.838812335743569e-05 ], "bp_grad_norms_F": [ 0.0028271761257201433, 0.002944816369563341, 0.003029909450560808, 0.0028170389123260975, 0.002025141380727291 ], "gamma_dfa": NaN, "acc_eval": 0.6259765625, "loss_eval": 1.1392892599105835, "epoch": 83 }, { "hidden_norms": [ 260.0465393066406, 232.27760314941406, 218.845458984375, 209.7770233154297, 201.92831420898438 ], "bp_grad_norms_per_sample_med": [ 4.730001455754973e-05, 5.118208355270326e-05, 5.1580365834524855e-05, 4.936498589813709e-05, 3.706002826220356e-05 ], "bp_grad_norms_F": [ 0.0028656981885433197, 0.002991823712363839, 0.0030798574443906546, 0.0028517318423837423, 0.0020406947005540133 ], "gamma_dfa": NaN, "acc_eval": 0.625, "loss_eval": 1.1393200159072876, "epoch": 84 }, { "hidden_norms": [ 259.99285888671875, 232.2432403564453, 218.6685333251953, 209.5802001953125, 201.7836456298828 ], "bp_grad_norms_per_sample_med": [ 4.4883607188239694e-05, 4.9325379222864285e-05, 5.1563201850512996e-05, 4.9446705816080794e-05, 3.641278817667626e-05 ], "bp_grad_norms_F": [ 0.002843427937477827, 0.0029685739427804947, 0.0030620063189417124, 0.0028350763022899628, 0.0020346841774880886 ], "gamma_dfa": NaN, "acc_eval": 0.625, "loss_eval": 1.136763572692871, "epoch": 85 }, { "hidden_norms": [ 259.7002868652344, 232.1937713623047, 218.6339569091797, 209.42572021484375, 201.48532104492188 ], "bp_grad_norms_per_sample_med": [ 4.557083229883574e-05, 5.006462743040174e-05, 5.1964529120596126e-05, 5.040188261773437e-05, 3.70733359886799e-05 ], "bp_grad_norms_F": [ 0.002866365248337388, 0.0029951538890600204, 0.0030862949788570404, 0.0028592217713594437, 0.002047886373475194 ], "gamma_dfa": NaN, "acc_eval": 0.630859375, "loss_eval": 1.139750361442566, "epoch": 86 }, { "hidden_norms": [ 259.22808837890625, 232.3558807373047, 218.42848205566406, 209.1579132080078, 201.5212860107422 ], "bp_grad_norms_per_sample_med": [ 4.5765504182782024e-05, 4.875436570728198e-05, 5.104453521198593e-05, 5.005718412576243e-05, 3.675639891298488e-05 ], "bp_grad_norms_F": [ 0.002878013998270035, 0.003002135781571269, 0.0030916042160242796, 0.002861205255612731, 0.0020479748491197824 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.1344283819198608, "epoch": 87 }, { "hidden_norms": [ 259.1551513671875, 232.05300903320312, 218.15708923339844, 208.9161834716797, 201.6800537109375 ], "bp_grad_norms_per_sample_med": [ 4.611797339748591e-05, 4.964259278494865e-05, 5.252738264971413e-05, 5.0600574468262494e-05, 3.820879283011891e-05 ], "bp_grad_norms_F": [ 0.0028855716809630394, 0.003010405693203211, 0.0031016215216368437, 0.002874146681278944, 0.0020545709412544966 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.135157823562622, "epoch": 88 }, { "hidden_norms": [ 259.21893310546875, 231.72747802734375, 217.7665252685547, 208.59022521972656, 201.1155548095703 ], "bp_grad_norms_per_sample_med": [ 4.6835561079205945e-05, 5.060776311438531e-05, 5.325842721504159e-05, 5.128757766215131e-05, 3.774667493416928e-05 ], "bp_grad_norms_F": [ 0.002893448108807206, 0.0030188425444066525, 0.0031124993693083525, 0.002883171197026968, 0.002058332087472081 ], "gamma_dfa": NaN, "acc_eval": 0.6298828125, "loss_eval": 1.1357543468475342, "epoch": 89 }, { "hidden_norms": [ 258.88385009765625, 230.9880828857422, 217.33352661132812, 208.3406524658203, 200.54083251953125 ], "bp_grad_norms_per_sample_med": [ 4.6940938773332164e-05, 5.0942355301231146e-05, 5.368283382267691e-05, 5.184212204767391e-05, 3.746367656276561e-05 ], "bp_grad_norms_F": [ 0.0029224599711596966, 0.0030530549120157957, 0.003145798807963729, 0.0029114321805536747, 0.0020718672312796116 ], "gamma_dfa": NaN, "acc_eval": 0.6279296875, "loss_eval": 1.1398890018463135, "epoch": 90 }, { "hidden_norms": [ 258.7764587402344, 231.19357299804688, 217.22779846191406, 207.97528076171875, 199.982421875 ], "bp_grad_norms_per_sample_med": [ 4.70306295028422e-05, 5.185308327781968e-05, 5.281997437123209e-05, 5.1426530262688175e-05, 3.7254685594234616e-05 ], "bp_grad_norms_F": [ 0.002924826927483082, 0.0030514320824295282, 0.0031429482623934746, 0.0029119658283889294, 0.0020754521246999502 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.138663411140442, "epoch": 91 }, { "hidden_norms": [ 258.7837829589844, 230.58901977539062, 217.062255859375, 207.7244873046875, 199.89395141601562 ], "bp_grad_norms_per_sample_med": [ 4.688404078478925e-05, 5.141457950230688e-05, 5.3491079597733915e-05, 5.087396493763663e-05, 3.739634121302515e-05 ], "bp_grad_norms_F": [ 0.0029230716172605753, 0.0030518025159835815, 0.0031419326551258564, 0.002910938812419772, 0.00207503535784781 ], "gamma_dfa": NaN, "acc_eval": 0.626953125, "loss_eval": 1.1365739107131958, "epoch": 92 }, { "hidden_norms": [ 258.7561950683594, 230.4254913330078, 217.07546997070312, 207.6160125732422, 199.7816162109375 ], "bp_grad_norms_per_sample_med": [ 4.680828351411037e-05, 5.096250242786482e-05, 5.211709503782913e-05, 5.09246347064618e-05, 3.779645703616552e-05 ], "bp_grad_norms_F": [ 0.002931967144832015, 0.0030605625361204147, 0.00315046776086092, 0.0029180829878896475, 0.002077121753245592 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.1363377571105957, "epoch": 93 }, { "hidden_norms": [ 258.76409912109375, 230.5386505126953, 216.76475524902344, 207.16859436035156, 199.2827911376953 ], "bp_grad_norms_per_sample_med": [ 4.749056097352877e-05, 5.2020419389009476e-05, 5.3769603255204856e-05, 5.178397987037897e-05, 3.789216498262249e-05 ], "bp_grad_norms_F": [ 0.0029493479523807764, 0.0030784173868596554, 0.0031682881526649, 0.0029316784348338842, 0.002084067091345787 ], "gamma_dfa": NaN, "acc_eval": 0.6298828125, "loss_eval": 1.1382873058319092, "epoch": 94 }, { "hidden_norms": [ 258.7884826660156, 230.40945434570312, 216.70376586914062, 207.1806182861328, 199.41917419433594 ], "bp_grad_norms_per_sample_med": [ 4.741501834359951e-05, 5.169968062546104e-05, 5.352263542590663e-05, 5.053802306065336e-05, 3.758866660064086e-05 ], "bp_grad_norms_F": [ 0.002947731176391244, 0.003076745430007577, 0.0031680618412792683, 0.0029321794863790274, 0.0020845714025199413 ], "gamma_dfa": NaN, "acc_eval": 0.630859375, "loss_eval": 1.1382077932357788, "epoch": 95 }, { "hidden_norms": [ 258.766845703125, 230.38992309570312, 216.7628173828125, 207.26092529296875, 199.36366271972656 ], "bp_grad_norms_per_sample_med": [ 4.718741183751263e-05, 5.1928480388596654e-05, 5.3666040912503377e-05, 5.089692058390938e-05, 3.752821430680342e-05 ], "bp_grad_norms_F": [ 0.002943811472505331, 0.003073457395657897, 0.0031646883580833673, 0.0029298998415470123, 0.002084212377667427 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.138296365737915, "epoch": 96 }, { "hidden_norms": [ 258.8481140136719, 230.38389587402344, 216.7748260498047, 207.24560546875, 199.39401245117188 ], "bp_grad_norms_per_sample_med": [ 4.728109706775285e-05, 5.156427505426109e-05, 5.3663239668821916e-05, 5.139272616361268e-05, 3.7748181057395414e-05 ], "bp_grad_norms_F": [ 0.002947240835055709, 0.003076959168538451, 0.0031680231913924217, 0.0029323517810553312, 0.0020851469598710537 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.1388041973114014, "epoch": 97 }, { "hidden_norms": [ 258.77734375, 230.3692626953125, 216.7212677001953, 207.1890869140625, 199.34091186523438 ], "bp_grad_norms_per_sample_med": [ 4.7204313887050375e-05, 5.154019163455814e-05, 5.373918611439876e-05, 5.1062332204310223e-05, 3.7904177588643506e-05 ], "bp_grad_norms_F": [ 0.0029484080150723457, 0.0030780842062085867, 0.0031695417128503323, 0.0029333126731216908, 0.002085541607812047 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.138832688331604, "epoch": 98 }, { "hidden_norms": [ 258.7897644042969, 230.38552856445312, 216.73997497558594, 207.1963653564453, 199.38656616210938 ], "bp_grad_norms_per_sample_med": [ 4.726059705717489e-05, 5.1730185077758506e-05, 5.3854040743317455e-05, 5.0960083171958104e-05, 3.793121504713781e-05 ], "bp_grad_norms_F": [ 0.00294809159822762, 0.003077775239944458, 0.003169153118506074, 0.0029330949764698744, 0.0020853858441114426 ], "gamma_dfa": NaN, "acc_eval": 0.62890625, "loss_eval": 1.1388249397277832, "epoch": 99 }, { "hidden_norms": [ 258.7891845703125, 230.38888549804688, 216.73963928222656, 207.19769287109375, 199.4077606201172 ], "bp_grad_norms_per_sample_med": [ 4.725577309727669e-05, 5.174486432224512e-05, 5.38085114385467e-05, 5.098402107250877e-05, 3.7933263229206204e-05 ], "bp_grad_norms_F": [ 0.002948042470961809, 0.0030777468346059322, 0.003169137053191662, 0.002933081705123186, 0.0020853858441114426 ], "gamma_dfa": NaN, "acc_eval": 0.6279296875, "loss_eval": 1.1387826204299927, "epoch": 100 } ], "dfa_log": [ { "hidden_norms": [ 8.696551322937012, 8.737784385681152, 8.813130378723145, 8.844642639160156, 8.889528274536133 ], "bp_grad_norms_per_sample_med": [ 0.0010079912608489394, 0.0010035138111561537, 0.0009970925748348236, 0.0009936393471434712, 0.000986678060144186 ], "bp_grad_norms_F": [ 0.035574451088905334, 0.035288579761981964, 0.035048045217990875, 0.0346725769340992, 0.03439188003540039 ], "gamma_dfa": 0.0033523982419865206, "acc_eval": 0.0927734375, "loss_eval": 2.4863264560699463, "epoch": 0 }, { "hidden_norms": [ 900.3377685546875, 3463.92626953125, 6660.5166015625, 10478.5126953125, 13466.513671875 ], "bp_grad_norms_per_sample_med": [ 2.017142833210528e-06, 7.972002435963077e-07, 7.783806381667091e-07, 7.758338256280695e-07, 7.810436954969191e-07 ], "bp_grad_norms_F": [ 0.00013047464017290622, 7.321321754716337e-05, 7.131113670766354e-05, 7.113779429346323e-05, 7.09498199285008e-05 ], "gamma_dfa": 0.1028625147882849, "acc_eval": 0.2861328125, "loss_eval": 1.970402717590332, "epoch": 1 }, { "hidden_norms": [ 1784.805419921875, 14085.2138671875, 36523.9375, 61422.50390625, 73870.3359375 ], "bp_grad_norms_per_sample_med": [ 9.087140711017128e-07, 1.772240381114898e-07, 1.705584367073243e-07, 1.7156033038645546e-07, 1.728751612972701e-07 ], "bp_grad_norms_F": [ 4.7445286327274516e-05, 1.1973520486208145e-05, 9.698592293716501e-06, 9.335580216429662e-06, 9.154121471510734e-06 ], "gamma_dfa": 0.09588160619023256, "acc_eval": 0.298828125, "loss_eval": 1.9628738164901733, "epoch": 2 }, { "hidden_norms": [ 2670.88134765625, 35761.4921875, 99927.7890625, 170223.953125, 201448.390625 ], "bp_grad_norms_per_sample_med": [ 5.815078338855528e-07, 7.772520405069372e-08, 7.527528111950232e-08, 7.557918735301428e-08, 7.57173737042649e-08 ], "bp_grad_norms_F": [ 2.8944486984983087e-05, 3.2005805223889183e-06, 2.6765355869429186e-06, 2.639568720042007e-06, 2.6436800908413716e-06 ], "gamma_dfa": 0.09442083747126162, "acc_eval": 0.2900390625, "loss_eval": 1.9821033477783203, "epoch": 3 }, { "hidden_norms": [ 3506.001220703125, 70233.9375, 205054.078125, 348792.375, 416698.5625 ], "bp_grad_norms_per_sample_med": [ 4.5228594558466284e-07, 4.338783554658221e-08, 4.114394869247917e-08, 4.122260932604149e-08, 4.124275321260029e-08 ], "bp_grad_norms_F": [ 2.319143823115155e-05, 1.7165241388283903e-06, 1.3772670399703202e-06, 1.3777447520624264e-06, 1.3796359326079255e-06 ], "gamma_dfa": 0.09172606549691409, "acc_eval": 0.298828125, "loss_eval": 1.9661527872085571, "epoch": 4 }, { "hidden_norms": [ 4351.04052734375, 120982.0390625, 361547.03125, 633667.3125, 764198.75 ], "bp_grad_norms_per_sample_med": [ 3.632259790720127e-07, 2.6118947005215887e-08, 2.4913996199416033e-08, 2.494128636953974e-08, 2.4942012899487054e-08 ], "bp_grad_norms_F": [ 1.894752676889766e-05, 1.1090510270150844e-06, 8.424218549407669e-07, 8.403117703892349e-07, 8.407336054006009e-07 ], "gamma_dfa": 0.08992433547973633, "acc_eval": 0.2900390625, "loss_eval": 1.980475664138794, "epoch": 5 }, { "hidden_norms": [ 5174.9833984375, 189817.0625, 576763.3125, 1012734.125, 1235217.5 ], "bp_grad_norms_per_sample_med": [ 3.340334444601467e-07, 1.826493090106851e-08, 1.7263264595612782e-08, 1.730784759956805e-08, 1.7305337607353977e-08 ], "bp_grad_norms_F": [ 1.7139096598839387e-05, 7.582453918075771e-07, 5.794162802885694e-07, 5.812879635413992e-07, 5.813373604723893e-07 ], "gamma_dfa": 0.08752730302512646, "acc_eval": 0.3056640625, "loss_eval": 1.9696743488311768, "epoch": 6 }, { "hidden_norms": [ 5963.3935546875, 276686.75, 861517.375, 1555059.75, 1913322.5 ], "bp_grad_norms_per_sample_med": [ 2.834741223978199e-07, 1.3120247110975924e-08, 1.2326365705916942e-08, 1.2353129186237766e-08, 1.2349524958210623e-08 ], "bp_grad_norms_F": [ 1.4978587387304287e-05, 5.169860628484457e-07, 4.2094282548532647e-07, 4.222391680741566e-07, 4.222146685606276e-07 ], "gamma_dfa": 0.08884745300747454, "acc_eval": 0.2919921875, "loss_eval": 1.9592503309249878, "epoch": 7 }, { "hidden_norms": [ 6751.1630859375, 390990.65625, 1268157.625, 2303462.75, 2850455.0 ], "bp_grad_norms_per_sample_med": [ 2.5272595394199016e-07, 9.644952392307005e-09, 9.213153795428752e-09, 9.189856875480018e-09, 9.217835383878992e-09 ], "bp_grad_norms_F": [ 1.3214407772466075e-05, 3.7820277043465467e-07, 3.14011003865744e-07, 3.1468064776163374e-07, 3.146610936255456e-07 ], "gamma_dfa": 0.08774545323103666, "acc_eval": 0.3115234375, "loss_eval": 1.9636309146881104, "epoch": 8 }, { "hidden_norms": [ 7557.10302734375, 541741.25, 1767146.375, 3237576.25, 4005094.0 ], "bp_grad_norms_per_sample_med": [ 2.3122942138797953e-07, 7.519741274109037e-09, 7.2226606917524805e-09, 7.218183384338772e-09, 7.221534037427091e-09 ], "bp_grad_norms_F": [ 1.196970697492361e-05, 2.9184533900661336e-07, 2.4720966962377133e-07, 2.4752529270699597e-07, 2.4754368155299744e-07 ], "gamma_dfa": 0.08941872720606625, "acc_eval": 0.2900390625, "loss_eval": 1.9587393999099731, "epoch": 9 }, { "hidden_norms": [ 8353.015625, 720288.5625, 2367034.25, 4437438.5, 5500873.0 ], "bp_grad_norms_per_sample_med": [ 2.1009967099416826e-07, 6.096115612308495e-09, 5.8281148795913396e-09, 5.816529036195561e-09, 5.823292070772368e-09 ], "bp_grad_norms_F": [ 1.0853039384528529e-05, 2.2833219759377243e-07, 1.979581298883204e-07, 1.9814572738141578e-07, 1.9820384977720096e-07 ], "gamma_dfa": 0.09132041316479445, "acc_eval": 0.2978515625, "loss_eval": 1.9605882167816162, "epoch": 10 }, { "hidden_norms": [ 9134.4443359375, 924688.8125, 3108971.25, 5809310.0, 7180875.5 ], "bp_grad_norms_per_sample_med": [ 1.9402843065563502e-07, 4.977510403847418e-09, 4.8141264308299014e-09, 4.791541829973767e-09, 4.794175723077387e-09 ], "bp_grad_norms_F": [ 1.0063903573609423e-05, 1.9364638603747153e-07, 1.6622837506474752e-07, 1.6636218447274587e-07, 1.6641583044929575e-07 ], "gamma_dfa": 0.08994872949551791, "acc_eval": 0.2822265625, "loss_eval": 1.9717106819152832, "epoch": 11 }, { "hidden_norms": [ 9934.0107421875, 1171186.5, 4059807.75, 7477705.0, 9248714.0 ], "bp_grad_norms_per_sample_med": [ 1.802942222184356e-07, 4.213630333538276e-09, 4.032348677185382e-09, 4.031016409555832e-09, 4.033940292913485e-09 ], "bp_grad_norms_F": [ 9.375374247611035e-06, 1.60658984782458e-07, 1.398711617639492e-07, 1.399746452079853e-07, 1.4004145043600147e-07 ], "gamma_dfa": 0.09168496390338987, "acc_eval": 0.2998046875, "loss_eval": 1.9513648748397827, "epoch": 12 }, { "hidden_norms": [ 10690.2216796875, 1474348.375, 5210694.5, 9539616.0, 11795722.0 ], "bp_grad_norms_per_sample_med": [ 1.7011585384807404e-07, 3.5948770626959003e-09, 3.444458496204561e-09, 3.439692752849055e-09, 3.4398179860062328e-09 ], "bp_grad_norms_F": [ 8.913790225051343e-06, 1.346561759874021e-07, 1.1880944583708697e-07, 1.1887690476442003e-07, 1.1894194784645151e-07 ], "gamma_dfa": 0.0931803259300068, "acc_eval": 0.3134765625, "loss_eval": 1.959463357925415, "epoch": 13 }, { "hidden_norms": [ 11428.3076171875, 1789460.25, 6431273.0, 11810251.0, 14610525.0 ], "bp_grad_norms_per_sample_med": [ 1.5823535193248972e-07, 3.1298097447063356e-09, 3.012203153573978e-09, 3.010908633527265e-09, 3.010648619294898e-09 ], "bp_grad_norms_F": [ 8.233506378019229e-06, 1.1668681310084139e-07, 1.0298786889961775e-07, 1.0303519104581937e-07, 1.0309597797686365e-07 ], "gamma_dfa": 0.09336384548805654, "acc_eval": 0.2861328125, "loss_eval": 1.9515889883041382, "epoch": 14 }, { "hidden_norms": [ 12175.4384765625, 2177908.0, 7886216.5, 14475684.0, 17927020.0 ], "bp_grad_norms_per_sample_med": [ 1.5137742082060868e-07, 2.705691448667835e-09, 2.5981530260565933e-09, 2.5995214869567462e-09, 2.6000293029682098e-09 ], "bp_grad_norms_F": [ 7.800716048222966e-06, 1.0053086896277819e-07, 8.984200405848242e-08, 8.987952071493055e-08, 8.993622913067156e-08 ], "gamma_dfa": 0.09357930033002049, "acc_eval": 0.2978515625, "loss_eval": 1.9580912590026855, "epoch": 15 }, { "hidden_norms": [ 12918.6787109375, 2622644.5, 9573671.0, 17460572.0, 21682046.0 ], "bp_grad_norms_per_sample_med": [ 1.432233602827182e-07, 2.359643591631766e-09, 2.2714441438864696e-09, 2.2688442236074025e-09, 2.2694950363444377e-09 ], "bp_grad_norms_F": [ 7.43454029361601e-06, 8.846858889910436e-08, 7.942762891843813e-08, 7.945371294226788e-08, 7.950914238108453e-08 ], "gamma_dfa": 0.09332277777139097, "acc_eval": 0.30859375, "loss_eval": 1.9656270742416382, "epoch": 16 }, { "hidden_norms": [ 13676.931640625, 3144179.5, 11421599.0, 20832254.0, 25907438.0 ], "bp_grad_norms_per_sample_med": [ 1.3402345189206244e-07, 2.1064472388587774e-09, 2.0263852817947736e-09, 2.0199610872850826e-09, 2.0222397090208233e-09 ], "bp_grad_norms_F": [ 6.909830062795663e-06, 7.773559929091789e-08, 7.076827301943922e-08, 7.077783692466255e-08, 7.082799413637986e-08 ], "gamma_dfa": 0.0945073509356007, "acc_eval": 0.296875, "loss_eval": 1.9510960578918457, "epoch": 17 }, { "hidden_norms": [ 14410.64453125, 3691622.0, 13302875.0, 24659928.0, 30700242.0 ], "bp_grad_norms_per_sample_med": [ 1.2569752527724631e-07, 1.8540845525549798e-09, 1.8018908587436044e-09, 1.8003264434796051e-09, 1.802896276714705e-09 ], "bp_grad_norms_F": [ 6.58303315503872e-06, 6.894391191281102e-08, 6.3350469758916e-08, 6.336826174901944e-08, 6.340740554833246e-08 ], "gamma_dfa": 0.09388192358892411, "acc_eval": 0.30859375, "loss_eval": 1.9456725120544434, "epoch": 18 }, { "hidden_norms": [ 15102.634765625, 4270070.0, 15687016.0, 28858048.0, 35882240.0 ], "bp_grad_norms_per_sample_med": [ 1.2314617947595252e-07, 1.6925943979728686e-09, 1.6383979728473719e-09, 1.6367472932543592e-09, 1.6394127166918793e-09 ], "bp_grad_norms_F": [ 6.343140285025584e-06, 6.240136940505181e-08, 5.757489418556361e-08, 5.7587019597349354e-08, 5.7624333749117795e-08 ], "gamma_dfa": 0.09518493304494768, "acc_eval": 0.302734375, "loss_eval": 1.9497833251953125, "epoch": 19 }, { "hidden_norms": [ 15809.6728515625, 4913181.0, 18109688.0, 33281892.0, 41436228.0 ], "bp_grad_norms_per_sample_med": [ 1.1704661773137559e-07, 1.533212445892218e-09, 1.483607681151966e-09, 1.4837684414459318e-09, 1.4838255069093975e-09 ], "bp_grad_norms_F": [ 6.079233116906835e-06, 5.7217945936827164e-08, 5.270470992968512e-08, 5.2718213794378244e-08, 5.2752689327917324e-08 ], "gamma_dfa": 0.09407007653499022, "acc_eval": 0.2958984375, "loss_eval": 1.961036205291748, "epoch": 20 }, { "hidden_norms": [ 16522.783203125, 5620503.0, 20819020.0, 38391960.0, 47723272.0 ], "bp_grad_norms_per_sample_med": [ 1.1146808986950418e-07, 1.4118024527220996e-09, 1.3678460586419305e-09, 1.3669514409286876e-09, 1.3668450815629285e-09 ], "bp_grad_norms_F": [ 5.778397280664649e-06, 5.162353389209784e-08, 4.8153967924235985e-08, 4.816252285877454e-08, 4.8193449231348495e-08 ], "gamma_dfa": 0.09494083630852401, "acc_eval": 0.2958984375, "loss_eval": 1.9576481580734253, "epoch": 21 }, { "hidden_norms": [ 17230.27734375, 6437730.5, 23789486.0, 43960328.0, 54569096.0 ], "bp_grad_norms_per_sample_med": [ 1.0952022932997352e-07, 1.2858689668604484e-09, 1.246260317167014e-09, 1.2462959553261044e-09, 1.2484926426026277e-09 ], "bp_grad_norms_F": [ 5.637425147142494e-06, 4.732414282671016e-08, 4.430494371376881e-08, 4.431280586913999e-08, 4.434128086927558e-08 ], "gamma_dfa": 0.09481688600499183, "acc_eval": 0.2900390625, "loss_eval": 1.9625442028045654, "epoch": 22 }, { "hidden_norms": [ 17916.12890625, 7217473.5, 26969020.0, 49888804.0, 62010184.0 ], "bp_grad_norms_per_sample_med": [ 1.043977349013403e-07, 1.1912204556097095e-09, 1.159051632448893e-09, 1.1590449711107453e-09, 1.159014662022173e-09 ], "bp_grad_norms_F": [ 5.385433269111672e-06, 4.3334623001101136e-08, 4.083162963297582e-08, 4.0836408032873805e-08, 4.0863898931320364e-08 ], "gamma_dfa": 0.0946647283853963, "acc_eval": 0.2939453125, "loss_eval": 1.9656811952590942, "epoch": 23 }, { "hidden_norms": [ 18617.46875, 8095365.0, 30241864.0, 56059896.0, 69702984.0 ], "bp_grad_norms_per_sample_med": [ 1.001103129283365e-07, 1.1034658742303805e-09, 1.0674757744411068e-09, 1.0666105776380164e-09, 1.0677670969627684e-09 ], "bp_grad_norms_F": [ 5.150916877028067e-06, 3.999087283546032e-08, 3.779740609388682e-08, 3.780221291549424e-08, 3.782682256314729e-08 ], "gamma_dfa": 0.09509630355751142, "acc_eval": 0.296875, "loss_eval": 1.9476948976516724, "epoch": 24 }, { "hidden_norms": [ 19248.7890625, 9047595.0, 33634812.0, 62495088.0, 77796536.0 ], "bp_grad_norms_per_sample_med": [ 9.749370377676314e-08, 1.0280801765460978e-09, 9.980430926148642e-10, 9.978470272287154e-10, 9.990493987643845e-10 ], "bp_grad_norms_F": [ 5.017087005398935e-06, 3.7442834610601494e-08, 3.536156611971819e-08, 3.536548476290591e-08, 3.538822213045023e-08 ], "gamma_dfa": 0.09479212731821463, "acc_eval": 0.2861328125, "loss_eval": 1.9604804515838623, "epoch": 25 }, { "hidden_norms": [ 19902.470703125, 10030725.0, 37252656.0, 69351704.0, 86270768.0 ], "bp_grad_norms_per_sample_med": [ 9.411947843318558e-08, 9.563448921667828e-10, 9.361866837309663e-10, 9.359075736625755e-10, 9.361766917237446e-10 ], "bp_grad_norms_F": [ 4.873440502706217e-06, 3.4947159832654506e-08, 3.313299146157078e-08, 3.3137865784738096e-08, 3.315915364510147e-08 ], "gamma_dfa": 0.09510701123508625, "acc_eval": 0.2978515625, "loss_eval": 1.9498941898345947, "epoch": 26 }, { "hidden_norms": [ 20513.66796875, 11086393.0, 41223968.0, 76828584.0, 95694480.0 ], "bp_grad_norms_per_sample_med": [ 9.249640697817085e-08, 9.003223166992314e-10, 8.743661350507637e-10, 8.736535939135592e-10, 8.752278901624777e-10 ], "bp_grad_norms_F": [ 4.75014485346037e-06, 3.290759664764664e-08, 3.1125043875590563e-08, 3.1127818544973707e-08, 3.11488683735206e-08 ], "gamma_dfa": 0.09552363055991009, "acc_eval": 0.2841796875, "loss_eval": 1.9527215957641602, "epoch": 27 }, { "hidden_norms": [ 21161.345703125, 12263719.0, 45533684.0, 84877296.0, 105753224.0 ], "bp_grad_norms_per_sample_med": [ 8.900443049242313e-08, 8.457264888406257e-10, 8.261510919815862e-10, 8.261567541190118e-10, 8.276057061884501e-10 ], "bp_grad_norms_F": [ 4.624974280886818e-06, 3.0792985938887796e-08, 2.9227694042788244e-08, 2.9232776199705768e-08, 2.9251353339532216e-08 ], "gamma_dfa": 0.09527035459177569, "acc_eval": 0.2890625, "loss_eval": 1.950648307800293, "epoch": 28 }, { "hidden_norms": [ 21787.568359375, 13358760.0, 49723396.0, 92840264.0, 115901424.0 ], "bp_grad_norms_per_sample_med": [ 8.79872459336184e-08, 8.034463094830357e-10, 7.846168159630906e-10, 7.837334670135476e-10, 7.841179927581265e-10 ], "bp_grad_norms_F": [ 4.530191290541552e-06, 2.9184068495169413e-08, 2.7723606521590227e-08, 2.7726789753046432e-08, 2.7744931685447227e-08 ], "gamma_dfa": 0.09598725114483386, "acc_eval": 0.2919921875, "loss_eval": 1.9504928588867188, "epoch": 29 }, { "hidden_norms": [ 22378.34765625, 14611837.0, 54335560.0, 101350864.0, 126710488.0 ], "bp_grad_norms_per_sample_med": [ 8.497670478391228e-08, 7.560595483013799e-10, 7.353461728420996e-10, 7.342743080229752e-10, 7.348425756781296e-10 ], "bp_grad_norms_F": [ 4.383283339848276e-06, 2.7485034692631416e-08, 2.6182895851434296e-08, 2.618475392068831e-08, 2.620201833281044e-08 ], "gamma_dfa": 0.09509110247017816, "acc_eval": 0.2958984375, "loss_eval": 1.9564056396484375, "epoch": 30 }, { "hidden_norms": [ 22972.798828125, 15931348.0, 59291124.0, 110237776.0, 138020368.0 ], "bp_grad_norms_per_sample_med": [ 8.252197858382715e-08, 7.193445838993284e-10, 6.977300404109599e-10, 6.966639487515636e-10, 6.977723399081981e-10 ], "bp_grad_norms_F": [ 4.255563453625655e-06, 2.5971447215056287e-08, 2.4833044065530885e-08, 2.4835205891804435e-08, 2.4851219748711628e-08 ], "gamma_dfa": 0.0951943755208049, "acc_eval": 0.30859375, "loss_eval": 1.9508299827575684, "epoch": 31 }, { "hidden_norms": [ 23525.689453125, 17283022.0, 64234984.0, 119317480.0, 149347744.0 ], "bp_grad_norms_per_sample_med": [ 8.036072784989301e-08, 6.884249836858203e-10, 6.666004415123439e-10, 6.656397100179845e-10, 6.674217845059616e-10 ], "bp_grad_norms_F": [ 4.212505245959619e-06, 2.4864668546342727e-08, 2.375563212808629e-08, 2.3757841915994504e-08, 2.3773273127858374e-08 ], "gamma_dfa": 0.09534151147818193, "acc_eval": 0.294921875, "loss_eval": 1.95639967918396, "epoch": 32 }, { "hidden_norms": [ 24102.95703125, 18811968.0, 69193392.0, 128823560.0, 161700704.0 ], "bp_grad_norms_per_sample_med": [ 7.921565980950618e-08, 6.526117424243694e-10, 6.390621365426341e-10, 6.381262185328751e-10, 6.384171524764781e-10 ], "bp_grad_norms_F": [ 4.09630820286111e-06, 2.3687046990517047e-08, 2.2686869272092736e-08, 2.2687553169475905e-08, 2.2702355551018627e-08 ], "gamma_dfa": 0.0947199320216896, "acc_eval": 0.2880859375, "loss_eval": 1.960526943206787, "epoch": 33 }, { "hidden_norms": [ 24687.955078125, 20313542.0, 74389296.0, 138258576.0, 173791248.0 ], "bp_grad_norms_per_sample_med": [ 7.937118340350935e-08, 6.360312831965587e-10, 6.205357339084117e-10, 6.196035906569364e-10, 6.196675395031548e-10 ], "bp_grad_norms_F": [ 4.070574505021796e-06, 2.2864428572688666e-08, 2.1894738466698982e-08, 2.1895061763643753e-08, 2.1909569269951135e-08 ], "gamma_dfa": 0.09556430295924656, "acc_eval": 0.2822265625, "loss_eval": 1.97263765335083, "epoch": 34 }, { "hidden_norms": [ 25226.55078125, 21851366.0, 80000824.0, 148574480.0, 186595952.0 ], "bp_grad_norms_per_sample_med": [ 7.592127104771862e-08, 6.044152955908544e-10, 5.892630272619215e-10, 5.896260146798227e-10, 5.900769872724254e-10 ], "bp_grad_norms_F": [ 3.966818894696189e-06, 2.1824051898988728e-08, 2.093374718015184e-08, 2.093443285389185e-08, 2.0947767964685227e-08 ], "gamma_dfa": 0.09587649442255497, "acc_eval": 0.298828125, "loss_eval": 1.9495991468429565, "epoch": 35 }, { "hidden_norms": [ 25759.50390625, 23391128.0, 85561480.0, 158667136.0, 198961760.0 ], "bp_grad_norms_per_sample_med": [ 7.493858333873504e-08, 5.860726903783586e-10, 5.731417562770957e-10, 5.733850616529423e-10, 5.73569580719635e-10 ], "bp_grad_norms_F": [ 3.896147973136976e-06, 2.099926454945944e-08, 2.0218029916918567e-08, 2.0218159590967844e-08, 2.0230830344303286e-08 ], "gamma_dfa": 0.09563440945930779, "acc_eval": 0.294921875, "loss_eval": 1.954901099205017, "epoch": 36 }, { "hidden_norms": [ 26267.0859375, 25111884.0, 91593392.0, 169479968.0, 212491408.0 ], "bp_grad_norms_per_sample_med": [ 7.387680511783401e-08, 5.612941222921108e-10, 5.475105369079358e-10, 5.468157038279742e-10, 5.479569020749864e-10 ], "bp_grad_norms_F": [ 3.838411430479027e-06, 2.0261547106770195e-08, 1.9493551661753372e-08, 1.949278782831243e-08, 1.9505332460312275e-08 ], "gamma_dfa": 0.09528586096712388, "acc_eval": 0.302734375, "loss_eval": 1.9556396007537842, "epoch": 37 }, { "hidden_norms": [ 26761.587890625, 26706742.0, 97554944.0, 180407616.0, 226265728.0 ], "bp_grad_norms_per_sample_med": [ 7.260722156843258e-08, 5.407673198121188e-10, 5.32608401826451e-10, 5.31698407524317e-10, 5.328552044048251e-10 ], "bp_grad_norms_F": [ 3.7372303722804645e-06, 1.9519287519642603e-08, 1.8807236656925852e-08, 1.8806394663783976e-08, 1.8818212765836506e-08 ], "gamma_dfa": 0.09491665422683582, "acc_eval": 0.2890625, "loss_eval": 1.963973879814148, "epoch": 38 }, { "hidden_norms": [ 27302.328125, 28336562.0, 103781320.0, 191401696.0, 240130064.0 ], "bp_grad_norms_per_sample_med": [ 7.187927053564636e-08, 5.305865746763061e-10, 5.205576525391109e-10, 5.20661624925367e-10, 5.217564713611011e-10 ], "bp_grad_norms_F": [ 3.734877054739627e-06, 1.88775892695503e-08, 1.8220953634795478e-08, 1.8220212893993448e-08, 1.8231482101782603e-08 ], "gamma_dfa": 0.0957885464449646, "acc_eval": 0.302734375, "loss_eval": 1.9604723453521729, "epoch": 39 }, { "hidden_norms": [ 27801.44140625, 30051226.0, 109945288.0, 203002704.0, 254881776.0 ], "bp_grad_norms_per_sample_med": [ 6.894305215610075e-08, 5.044222262107212e-10, 4.932855790507062e-10, 4.934126440758746e-10, 4.940316489232544e-10 ], "bp_grad_norms_F": [ 3.610647127061384e-06, 1.8150354108570355e-08, 1.753623024569606e-08, 1.7534704355171016e-08, 1.7545806585417267e-08 ], "gamma_dfa": 0.09517717303242534, "acc_eval": 0.2958984375, "loss_eval": 1.9589688777923584, "epoch": 40 }, { "hidden_norms": [ 28266.703125, 31897594.0, 116263888.0, 215162448.0, 270215296.0 ], "bp_grad_norms_per_sample_med": [ 6.807566421684896e-08, 4.835814526593651e-10, 4.775287942848649e-10, 4.773109685274335e-10, 4.784843632421598e-10 ], "bp_grad_norms_F": [ 3.590413371057366e-06, 1.7596850199197434e-08, 1.705259222717359e-08, 1.7050926004458233e-08, 1.7061644541627174e-08 ], "gamma_dfa": 0.0961545761092566, "acc_eval": 0.30859375, "loss_eval": 1.9595096111297607, "epoch": 41 }, { "hidden_norms": [ 28755.66015625, 33582328.0, 122605680.0, 226378480.0, 284438688.0 ], "bp_grad_norms_per_sample_med": [ 6.689399612014313e-08, 4.746543713629592e-10, 4.678599174745557e-10, 4.68083238835959e-10, 4.683119447790318e-10 ], "bp_grad_norms_F": [ 3.5121436212648405e-06, 1.7124380136124273e-08, 1.6555107507087996e-08, 1.655343240258844e-08, 1.656368908697914e-08 ], "gamma_dfa": 0.09569378412561491, "acc_eval": 0.287109375, "loss_eval": 1.9612011909484863, "epoch": 42 }, { "hidden_norms": [ 29227.5703125, 35443612.0, 129229904.0, 238040368.0, 299000064.0 ], "bp_grad_norms_per_sample_med": [ 6.582912703834154e-08, 4.575871348500016e-10, 4.493441174702184e-10, 4.48520082185766e-10, 4.485415650012925e-10 ], "bp_grad_norms_F": [ 3.4321058137720684e-06, 1.6602150765265833e-08, 1.6083028242519504e-08, 1.6080972997656318e-08, 1.609118882583971e-08 ], "gamma_dfa": 0.09606127908773487, "acc_eval": 0.306640625, "loss_eval": 1.9551353454589844, "epoch": 43 }, { "hidden_norms": [ 29665.798828125, 37243032.0, 135839760.0, 250377328.0, 314433920.0 ], "bp_grad_norms_per_sample_med": [ 6.588776813032382e-08, 4.4936304677278827e-10, 4.4115311403913893e-10, 4.406963405312325e-10, 4.4055534220710513e-10 ], "bp_grad_norms_F": [ 3.3984799756581197e-06, 1.6157997606569552e-08, 1.564128204734061e-08, 1.5638891071034777e-08, 1.564865925729464e-08 ], "gamma_dfa": 0.09547593681054423, "acc_eval": 0.2900390625, "loss_eval": 1.9503705501556396, "epoch": 44 }, { "hidden_norms": [ 30096.123046875, 39014544.0, 141817168.0, 261217760.0, 328197248.0 ], "bp_grad_norms_per_sample_med": [ 6.549055342475185e-08, 4.3991607578952596e-10, 4.348142956800416e-10, 4.3428130536149467e-10, 4.349899329625373e-10 ], "bp_grad_norms_F": [ 3.382166596566094e-06, 1.5776649320287106e-08, 1.5299850275596327e-08, 1.5297549893489304e-08, 1.5307026757227504e-08 ], "gamma_dfa": 0.09610002994304523, "acc_eval": 0.2998046875, "loss_eval": 1.952854037284851, "epoch": 45 }, { "hidden_norms": [ 30554.974609375, 40873780.0, 148087312.0, 272436128.0, 342258336.0 ], "bp_grad_norms_per_sample_med": [ 6.514299855098216e-08, 4.291983157767021e-10, 4.228755678958862e-10, 4.2251957488304015e-10, 4.227345695717588e-10 ], "bp_grad_norms_F": [ 3.3793355669331504e-06, 1.5485536408732514e-08, 1.4993654318118388e-08, 1.499121538017789e-08, 1.5000590991576246e-08 ], "gamma_dfa": 0.09557013235462364, "acc_eval": 0.3017578125, "loss_eval": 1.9633105993270874, "epoch": 46 }, { "hidden_norms": [ 30981.4765625, 42548124.0, 153904848.0, 283882112.0, 356627616.0 ], "bp_grad_norms_per_sample_med": [ 6.343542224840348e-08, 4.1842326825580756e-10, 4.139384113255318e-10, 4.141494092113618e-10, 4.1477912771092917e-10 ], "bp_grad_norms_F": [ 3.3046233056666097e-06, 1.508391989091251e-08, 1.4620022525946297e-08, 1.4617588028897899e-08, 1.462664656060042e-08 ], "gamma_dfa": 0.09567815247282851, "acc_eval": 0.296875, "loss_eval": 1.958325982093811, "epoch": 47 }, { "hidden_norms": [ 31383.2578125, 44333160.0, 160058736.0, 295685184.0, 371288096.0 ], "bp_grad_norms_per_sample_med": [ 6.18988522660402e-08, 4.057836289206307e-10, 4.0004452528386025e-10, 3.9987613220660023e-10, 4.004964138104583e-10 ], "bp_grad_norms_F": [ 3.2255043151963037e-06, 1.4663311453944061e-08, 1.4252069746589768e-08, 1.424969386931707e-08, 1.4258660918642363e-08 ], "gamma_dfa": 0.09609431066201068, "acc_eval": 0.302734375, "loss_eval": 1.9508600234985352, "epoch": 48 }, { "hidden_norms": [ 31750.03125, 46204072.0, 166757840.0, 307620864.0, 385856832.0 ], "bp_grad_norms_per_sample_med": [ 6.133605978675405e-08, 3.9670436380312424e-10, 3.904292722456404e-10, 3.9002356899686674e-10, 3.9039230181892037e-10 ], "bp_grad_norms_F": [ 3.2063508115243167e-06, 1.4354414545891814e-08, 1.3938280751801813e-08, 1.3935605558401676e-08, 1.394456727865645e-08 ], "gamma_dfa": 0.09565898558139452, "acc_eval": 0.310546875, "loss_eval": 1.9467211961746216, "epoch": 49 }, { "hidden_norms": [ 32133.1484375, 47907484.0, 173083168.0, 319475424.0, 400677984.0 ], "bp_grad_norms_per_sample_med": [ 6.030914079246941e-08, 3.8645733835274143e-10, 3.81215115030642e-10, 3.812981042017327e-10, 3.811861937208505e-10 ], "bp_grad_norms_F": [ 3.177025973855052e-06, 1.4072985443647212e-08, 1.368274382684831e-08, 1.3679918531295243e-08, 1.368857649453048e-08 ], "gamma_dfa": 0.09606298332801089, "acc_eval": 0.30078125, "loss_eval": 1.9524433612823486, "epoch": 50 }, { "hidden_norms": [ 32483.716796875, 49794588.0, 179046160.0, 330962240.0, 414954912.0 ], "bp_grad_norms_per_sample_med": [ 6.051003254015086e-08, 3.794887737385011e-10, 3.751928767670165e-10, 3.752734789586043e-10, 3.7574471312140645e-10 ], "bp_grad_norms_F": [ 3.154751766487607e-06, 1.3766489281863414e-08, 1.339402011524271e-08, 1.3391274755747418e-08, 1.3399712450734569e-08 ], "gamma_dfa": 0.09573800596626825, "acc_eval": 0.3046875, "loss_eval": 1.952356219291687, "epoch": 51 }, { "hidden_norms": [ 32825.296875, 51662352.0, 185889568.0, 343223360.0, 430225696.0 ], "bp_grad_norms_per_sample_med": [ 5.9168662858155585e-08, 3.7636679883767954e-10, 3.7184264001233203e-10, 3.7154498921943e-10, 3.7157116272723556e-10 ], "bp_grad_norms_F": [ 3.0909043289284455e-06, 1.346105005239906e-08, 1.3102917861829155e-08, 1.3100156515122308e-08, 1.3108366836434016e-08 ], "gamma_dfa": 0.09539097778178984, "acc_eval": 0.291015625, "loss_eval": 1.9585516452789307, "epoch": 52 }, { "hidden_norms": [ 33148.9453125, 53487464.0, 192413680.0, 354830112.0, 444651488.0 ], "bp_grad_norms_per_sample_med": [ 5.949418024897568e-08, 3.692673389288359e-10, 3.6510769407804844e-10, 3.6480282683548637e-10, 3.65057900575394e-10 ], "bp_grad_norms_F": [ 3.0807416351308348e-06, 1.3205962545725924e-08, 1.2856014031115137e-08, 1.2853148767533185e-08, 1.2861222309368259e-08 ], "gamma_dfa": 0.09566472223013989, "acc_eval": 0.2880859375, "loss_eval": 1.9538320302963257, "epoch": 53 }, { "hidden_norms": [ 33465.359375, 55258308.0, 198680688.0, 365875680.0, 458634560.0 ], "bp_grad_norms_per_sample_med": [ 5.9228732141036744e-08, 3.640579226971141e-10, 3.6045816331764513e-10, 3.6029040861862427e-10, 3.6025293859154317e-10 ], "bp_grad_norms_F": [ 3.058711854464491e-06, 1.294814744312589e-08, 1.2619584488504643e-08, 1.2616848898971966e-08, 1.2624772338654111e-08 ], "gamma_dfa": 0.09607254836737411, "acc_eval": 0.2998046875, "loss_eval": 1.9489495754241943, "epoch": 54 }, { "hidden_norms": [ 33763.53125, 56920656.0, 204554208.0, 376681216.0, 472155680.0 ], "bp_grad_norms_per_sample_med": [ 5.756867338391203e-08, 3.4894195866108646e-10, 3.4671995829960167e-10, 3.464649955819965e-10, 3.4666045034548176e-10 ], "bp_grad_norms_F": [ 3.092292217843351e-06, 1.2733584853208413e-08, 1.2427238793577544e-08, 1.2424394846277664e-08, 1.2432122886707475e-08 ], "gamma_dfa": 0.09629741777825984, "acc_eval": 0.3017578125, "loss_eval": 1.9477816820144653, "epoch": 55 }, { "hidden_norms": [ 34061.03125, 58650568.0, 210577584.0, 387585472.0, 485747168.0 ], "bp_grad_norms_per_sample_med": [ 5.70959208801014e-08, 3.4928168690662176e-10, 3.46003392603933e-10, 3.4562114281655454e-10, 3.4606426058125805e-10 ], "bp_grad_norms_F": [ 3.178826091243536e-06, 1.2512856528701377e-08, 1.2208544397651622e-08, 1.2205639166040783e-08, 1.2213387634574246e-08 ], "gamma_dfa": 0.09542209599749185, "acc_eval": 0.3046875, "loss_eval": 1.9549853801727295, "epoch": 56 }, { "hidden_norms": [ 34344.76171875, 60294200.0, 216821792.0, 398493824.0, 499371840.0 ], "bp_grad_norms_per_sample_med": [ 5.7367511629990986e-08, 3.416208427253764e-10, 3.378898272288211e-10, 3.377436663676292e-10, 3.386138314187548e-10 ], "bp_grad_norms_F": [ 3.2603361432848033e-06, 1.2295201301526504e-08, 1.2022674411582557e-08, 1.2019833128817936e-08, 1.2027326690144946e-08 ], "gamma_dfa": 0.09621504079404986, "acc_eval": 0.294921875, "loss_eval": 1.9597327709197998, "epoch": 57 }, { "hidden_norms": [ 34621.87109375, 62004936.0, 222707536.0, 409299680.0, 512662208.0 ], "bp_grad_norms_per_sample_med": [ 5.6534943837505125e-08, 3.356194766546139e-10, 3.3068575655548216e-10, 3.3087257933495096e-10, 3.3104252672444545e-10 ], "bp_grad_norms_F": [ 3.325955731270369e-06, 1.2073825494951507e-08, 1.1812358202689666e-08, 1.1809524025352403e-08, 1.1816909228912209e-08 ], "gamma_dfa": 0.09621665377926547, "acc_eval": 0.3017578125, "loss_eval": 1.9411261081695557, "epoch": 58 }, { "hidden_norms": [ 34892.69921875, 63619864.0, 228332912.0, 419524224.0, 525474048.0 ], "bp_grad_norms_per_sample_med": [ 5.6131870707076814e-08, 3.3116545616884707e-10, 3.281262206389357e-10, 3.2806185545908306e-10, 3.281940552657403e-10 ], "bp_grad_norms_F": [ 3.306513235656894e-06, 1.1909767394513437e-08, 1.165356344756674e-08, 1.1650684861308491e-08, 1.1658000786951561e-08 ], "gamma_dfa": 0.09604647590094828, "acc_eval": 0.30078125, "loss_eval": 1.9494699239730835, "epoch": 59 }, { "hidden_norms": [ 35134.12890625, 65285940.0, 233831760.0, 429654048.0, 537931904.0 ], "bp_grad_norms_per_sample_med": [ 5.542536740676951e-08, 3.2549649087165733e-10, 3.224807365587168e-10, 3.2198288479889925e-10, 3.2189514942437825e-10 ], "bp_grad_norms_F": [ 3.2077998639579164e-06, 1.1713971126425804e-08, 1.1479991179896842e-08, 1.147721562233528e-08, 1.1484392992144876e-08 ], "gamma_dfa": 0.09610223810159368, "acc_eval": 0.298828125, "loss_eval": 1.947687029838562, "epoch": 60 }, { "hidden_norms": [ 35383.89453125, 66896316.0, 239557328.0, 439032672.0, 549329344.0 ], "bp_grad_norms_per_sample_med": [ 5.55890657949476e-08, 3.2204855449080583e-10, 3.1836161484832814e-10, 3.185524344306856e-10, 3.1883792828146795e-10 ], "bp_grad_norms_F": [ 3.19811397275771e-06, 1.1587792059231106e-08, 1.1364262419988336e-08, 1.1361324325775968e-08, 1.1368459951199839e-08 ], "gamma_dfa": 0.09620415412791772, "acc_eval": 0.3046875, "loss_eval": 1.9550621509552002, "epoch": 61 }, { "hidden_norms": [ 35603.75390625, 68393976.0, 244906672.0, 448738336.0, 561222784.0 ], "bp_grad_norms_per_sample_med": [ 5.4847117070266904e-08, 3.208481536010055e-10, 3.1700905789300293e-10, 3.1679742162893376e-10, 3.169834394967097e-10 ], "bp_grad_norms_F": [ 3.1413667329616146e-06, 1.1423910706298557e-08, 1.1206890526693769e-08, 1.1204000394116065e-08, 1.1211046313519546e-08 ], "gamma_dfa": 0.09554143912100699, "acc_eval": 0.302734375, "loss_eval": 1.9572508335113525, "epoch": 62 }, { "hidden_norms": [ 35840.75, 69909448.0, 249732624.0, 457790144.0, 572499584.0 ], "bp_grad_norms_per_sample_med": [ 5.482150200464275e-08, 3.132541726014182e-10, 3.1085201079861235e-10, 3.1094149477439714e-10, 3.1132280087220465e-10 ], "bp_grad_norms_F": [ 3.1111580938159022e-06, 1.1274166489272375e-08, 1.1068144623038734e-08, 1.1065306892987792e-08, 1.1072265770906142e-08 ], "gamma_dfa": 0.09598036286843126, "acc_eval": 0.2939453125, "loss_eval": 1.9514048099517822, "epoch": 63 }, { "hidden_norms": [ 36044.14453125, 71301840.0, 254043168.0, 466339968.0, 583323328.0 ], "bp_grad_norms_per_sample_med": [ 5.41697069422753e-08, 3.088812261520246e-10, 3.0549318630335165e-10, 3.051613683968668e-10, 3.050981411956144e-10 ], "bp_grad_norms_F": [ 3.063583790208213e-06, 1.1131353616633533e-08, 1.0936378025405702e-08, 1.0933466576545925e-08, 1.0940373940115933e-08 ], "gamma_dfa": 0.09560732997124433, "acc_eval": 0.3076171875, "loss_eval": 1.9496949911117554, "epoch": 64 }, { "hidden_norms": [ 36240.3046875, 72753064.0, 259111488.0, 475471840.0, 594591872.0 ], "bp_grad_norms_per_sample_med": [ 5.367900612895937e-08, 3.0714322751812517e-10, 3.043856555695612e-10, 3.04040070897571e-10, 3.043043039774318e-10 ], "bp_grad_norms_F": [ 3.096502268817858e-06, 1.1002981636920595e-08, 1.0808172135057248e-08, 1.0805252692591694e-08, 1.0812099660029162e-08 ], "gamma_dfa": 0.09588889799488243, "acc_eval": 0.2978515625, "loss_eval": 1.951111078262329, "epoch": 65 }, { "hidden_norms": [ 36427.96484375, 74044192.0, 263715872.0, 483414560.0, 604480512.0 ], "bp_grad_norms_per_sample_med": [ 5.3715726977543454e-08, 3.022930794571721e-10, 2.992986969374556e-10, 2.9908994725325044e-10, 2.9924074329557016e-10 ], "bp_grad_norms_F": [ 3.0333421818795614e-06, 1.0890616408687492e-08, 1.0706762587631147e-08, 1.0703858244198727e-08, 1.071066169089363e-08 ], "gamma_dfa": 0.09630945282333414, "acc_eval": 0.30078125, "loss_eval": 1.949332594871521, "epoch": 66 }, { "hidden_norms": [ 36613.015625, 75303768.0, 267802576.0, 490809920.0, 613719616.0 ], "bp_grad_norms_per_sample_med": [ 5.348211473688025e-08, 3.012197435925401e-10, 2.9878169383046327e-10, 2.9841951132425493e-10, 2.984068825373498e-10 ], "bp_grad_norms_F": [ 3.008998646691907e-06, 1.0781116444036343e-08, 1.0603616651394532e-08, 1.0600682998074262e-08, 1.0607434930420823e-08 ], "gamma_dfa": 0.0960872639734589, "acc_eval": 0.310546875, "loss_eval": 1.9464266300201416, "epoch": 67 }, { "hidden_norms": [ 36784.2265625, 76478576.0, 271792224.0, 498011968.0, 622710336.0 ], "bp_grad_norms_per_sample_med": [ 5.403291680750044e-08, 3.0129157502223336e-10, 2.977850743768329e-10, 2.975975854635493e-10, 2.9797145306709183e-10 ], "bp_grad_norms_F": [ 2.9997727324371226e-06, 1.0701310948491027e-08, 1.052768094922385e-08, 1.0524773941256171e-08, 1.0531463701113353e-08 ], "gamma_dfa": 0.09624087948759552, "acc_eval": 0.2939453125, "loss_eval": 1.9560136795043945, "epoch": 68 }, { "hidden_norms": [ 36953.8671875, 77622176.0, 275419712.0, 504592704.0, 630923392.0 ], "bp_grad_norms_per_sample_med": [ 5.3204310290766443e-08, 2.9739929963135125e-10, 2.9424951364376284e-10, 2.9405439194718497e-10, 2.94715835069681e-10 ], "bp_grad_norms_F": [ 2.95851918963308e-06, 1.0595774924127e-08, 1.0427880781094245e-08, 1.042505370918434e-08, 1.0431726593651547e-08 ], "gamma_dfa": 0.09637677710998105, "acc_eval": 0.2978515625, "loss_eval": 1.950129747390747, "epoch": 69 }, { "hidden_norms": [ 37103.0546875, 78713944.0, 279082240.0, 511376384.0, 639270976.0 ], "bp_grad_norms_per_sample_med": [ 5.3287564583115454e-08, 2.9558042125010786e-10, 2.94046592630437e-10, 2.936023091315576e-10, 2.9353278141464045e-10 ], "bp_grad_norms_F": [ 2.9398986498563318e-06, 1.0504810354916572e-08, 1.034081797968156e-08, 1.0337980249630618e-08, 1.0344593626143705e-08 ], "gamma_dfa": 0.09638382289995207, "acc_eval": 0.29296875, "loss_eval": 1.9502758979797363, "epoch": 70 }, { "hidden_norms": [ 37248.1015625, 79737480.0, 282511072.0, 517720224.0, 647238976.0 ], "bp_grad_norms_per_sample_med": [ 5.260229585246634e-08, 2.899096518405031e-10, 2.8717414557455356e-10, 2.8704966181791747e-10, 2.871551885164081e-10 ], "bp_grad_norms_F": [ 2.9307011573109776e-06, 1.0423523377767197e-08, 1.0264206373733487e-08, 1.0261346439222052e-08, 1.0267889649639983e-08 ], "gamma_dfa": 0.0963258501906239, "acc_eval": 0.3017578125, "loss_eval": 1.949232816696167, "epoch": 71 }, { "hidden_norms": [ 37381.0390625, 80657776.0, 285833920.0, 523738208.0, 654706368.0 ], "bp_grad_norms_per_sample_med": [ 5.2669339112298985e-08, 2.929272380214343e-10, 2.8994415202099333e-10, 2.898675188767186e-10, 2.900694684448979e-10 ], "bp_grad_norms_F": [ 2.912831860157894e-06, 1.0341300260563457e-08, 1.018425699328418e-08, 1.0181377518847512e-08, 1.0187909182945987e-08 ], "gamma_dfa": 0.09613002402329585, "acc_eval": 0.2958984375, "loss_eval": 1.9482614994049072, "epoch": 72 }, { "hidden_norms": [ 37505.28515625, 81612512.0, 289044000.0, 529475296.0, 661837376.0 ], "bp_grad_norms_per_sample_med": [ 5.200942965188915e-08, 2.875680804592662e-10, 2.8434027354862224e-10, 2.8415880759524725e-10, 2.840882251664567e-10 ], "bp_grad_norms_F": [ 2.9117632038833108e-06, 1.0266585803719863e-08, 1.0111568471415922e-08, 1.0108765380323348e-08, 1.0115227766505086e-08 ], "gamma_dfa": 0.09620579873444512, "acc_eval": 0.2958984375, "loss_eval": 1.949747085571289, "epoch": 73 }, { "hidden_norms": [ 37622.05078125, 82508960.0, 292035424.0, 534928544.0, 668760064.0 ], "bp_grad_norms_per_sample_med": [ 5.211632014834322e-08, 2.8521121575586506e-10, 2.8250474182200946e-10, 2.822122813217476e-10, 2.8265498275281686e-10 ], "bp_grad_norms_F": [ 2.9012180675636046e-06, 1.0211213208322079e-08, 1.0059093114023199e-08, 1.0056256272150677e-08, 1.0062689348444565e-08 ], "gamma_dfa": 0.09616703895881074, "acc_eval": 0.2998046875, "loss_eval": 1.9510722160339355, "epoch": 74 }, { "hidden_norms": [ 37739.125, 83378024.0, 294890528.0, 540384832.0, 675452224.0 ], "bp_grad_norms_per_sample_med": [ 5.20015284166675e-08, 2.812508559379978e-10, 2.7935267987722057e-10, 2.7908611532900807e-10, 2.792987507937994e-10 ], "bp_grad_norms_F": [ 2.858193283827859e-06, 1.0136964156970407e-08, 9.987989102455685e-09, 9.985158477832101e-09, 9.991581784163373e-09 ], "gamma_dfa": 0.09625962336212979, "acc_eval": 0.306640625, "loss_eval": 1.949669599533081, "epoch": 75 }, { "hidden_norms": [ 37841.23828125, 84099792.0, 297324992.0, 545087552.0, 681202944.0 ], "bp_grad_norms_per_sample_med": [ 5.180555717743118e-08, 2.81841883165157e-10, 2.790032094246442e-10, 2.7877883335136744e-10, 2.790592201762365e-10 ], "bp_grad_norms_F": [ 2.8341921733954223e-06, 1.0072185752107998e-08, 9.925220645357058e-09, 9.922425547870262e-09, 9.928815103421584e-09 ], "gamma_dfa": 0.09619013674819143, "acc_eval": 0.2958984375, "loss_eval": 1.947105884552002, "epoch": 76 }, { "hidden_norms": [ 37933.76953125, 84846568.0, 299677280.0, 549384448.0, 686714688.0 ], "bp_grad_norms_per_sample_med": [ 5.136923775239666e-08, 2.810240096184913e-10, 2.7924595968897847e-10, 2.7894245246962157e-10, 2.789228015220857e-10 ], "bp_grad_norms_F": [ 2.822413307512761e-06, 1.0021487639733095e-08, 9.876163886701761e-09, 9.873332373899757e-09, 9.879697948633748e-09 ], "gamma_dfa": 0.09583658421615837, "acc_eval": 0.306640625, "loss_eval": 1.9495177268981934, "epoch": 77 }, { "hidden_norms": [ 38020.0, 85562224.0, 301864096.0, 553597760.0, 691941760.0 ], "bp_grad_norms_per_sample_med": [ 5.160018545780076e-08, 2.8198060553208393e-10, 2.797063691772905e-10, 2.7946911451692813e-10, 2.796869680299352e-10 ], "bp_grad_norms_F": [ 2.7969890652457252e-06, 9.96650406648314e-09, 9.82430670148915e-09, 9.821477853222405e-09, 9.827816782603804e-09 ], "gamma_dfa": 0.09604255547674256, "acc_eval": 0.298828125, "loss_eval": 1.9492969512939453, "epoch": 78 }, { "hidden_norms": [ 38095.6171875, 86194680.0, 304047168.0, 557639872.0, 696924224.0 ], "bp_grad_norms_per_sample_med": [ 5.120950063997043e-08, 2.782411523405415e-10, 2.750368821580196e-10, 2.7475391406461824e-10, 2.748750949077561e-10 ], "bp_grad_norms_F": [ 2.7781038625107612e-06, 9.913026843832995e-09, 9.771905951083681e-09, 9.769114406310564e-09, 9.775444453907767e-09 ], "gamma_dfa": 0.09590470486728009, "acc_eval": 0.3037109375, "loss_eval": 1.9471888542175293, "epoch": 79 }, { "hidden_norms": [ 38161.02734375, 86761784.0, 305935040.0, 560989248.0, 701039488.0 ], "bp_grad_norms_per_sample_med": [ 5.1234330555871566e-08, 2.762826911695271e-10, 2.737765292248895e-10, 2.7344454478495095e-10, 2.735327242486818e-10 ], "bp_grad_norms_F": [ 2.7851888262375724e-06, 9.883654783493512e-09, 9.742406881230181e-09, 9.73962688277652e-09, 9.74590719238222e-09 ], "gamma_dfa": 0.0961023918025603, "acc_eval": 0.306640625, "loss_eval": 1.9466722011566162, "epoch": 80 }, { "hidden_norms": [ 38225.30859375, 87283448.0, 307635232.0, 564114432.0, 704943360.0 ], "bp_grad_norms_per_sample_med": [ 5.112997669698416e-08, 2.7494201360056536e-10, 2.7230390164945106e-10, 2.724628855865774e-10, 2.7264715485308955e-10 ], "bp_grad_norms_F": [ 2.775808070509811e-06, 9.851329529908526e-09, 9.711465409623088e-09, 9.708682746634167e-09, 9.714950621741991e-09 ], "gamma_dfa": 0.09609865310994792, "acc_eval": 0.30078125, "loss_eval": 1.9487848281860352, "epoch": 81 }, { "hidden_norms": [ 38286.74609375, 87760048.0, 309161312.0, 566976960.0, 708521920.0 ], "bp_grad_norms_per_sample_med": [ 5.100326561091606e-08, 2.750530914141791e-10, 2.7221699894219853e-10, 2.720162428637707e-10, 2.72086408958927e-10 ], "bp_grad_norms_F": [ 2.76197988569038e-06, 9.813816426174071e-09, 9.67496749382235e-09, 9.672206147115503e-09, 9.678448265049155e-09 ], "gamma_dfa": 0.09604053818475222, "acc_eval": 0.3017578125, "loss_eval": 1.946324110031128, "epoch": 82 }, { "hidden_norms": [ 38345.609375, 88198008.0, 310597792.0, 569628928.0, 711849600.0 ], "bp_grad_norms_per_sample_med": [ 5.150431903189201e-08, 2.739733162560043e-10, 2.706747326275405e-10, 2.703801071923806e-10, 2.703643420254309e-10 ], "bp_grad_norms_F": [ 2.754284651018679e-06, 9.79015535307326e-09, 9.652834087603424e-09, 9.650069188182897e-09, 9.656329069684944e-09 ], "gamma_dfa": 0.09618356187274912, "acc_eval": 0.3017578125, "loss_eval": 1.952025294303894, "epoch": 83 }, { "hidden_norms": [ 38393.00390625, 88631992.0, 311868064.0, 571956672.0, 714769600.0 ], "bp_grad_norms_per_sample_med": [ 5.135545677603659e-08, 2.741361304625656e-10, 2.7016161530113436e-10, 2.7007868164119486e-10, 2.702876256144293e-10 ], "bp_grad_norms_F": [ 2.7439270979812136e-06, 9.758214680744004e-09, 9.621899721423688e-09, 9.619145480144198e-09, 9.625373387223135e-09 ], "gamma_dfa": 0.09624775896372739, "acc_eval": 0.302734375, "loss_eval": 1.9458943605422974, "epoch": 84 }, { "hidden_norms": [ 38432.8515625, 89003520.0, 313081504.0, 574038272.0, 717387392.0 ], "bp_grad_norms_per_sample_med": [ 5.1023032909824906e-08, 2.709044100157598e-10, 2.6825267007701825e-10, 2.6804419794856926e-10, 2.6862953528272726e-10 ], "bp_grad_norms_F": [ 2.7511816824699054e-06, 9.751657259471358e-09, 9.615223284242802e-09, 9.612453943930177e-09, 9.618667640154399e-09 ], "gamma_dfa": 0.09613665863071219, "acc_eval": 0.3095703125, "loss_eval": 1.9508092403411865, "epoch": 85 }, { "hidden_norms": [ 38471.12890625, 89306096.0, 314023616.0, 575863488.0, 719706496.0 ], "bp_grad_norms_per_sample_med": [ 5.104102740460803e-08, 2.722161940305057e-10, 2.698590240157728e-10, 2.697040091259595e-10, 2.698894441266475e-10 ], "bp_grad_norms_F": [ 2.731306722125737e-06, 9.717195048608573e-09, 9.582218574166745e-09, 9.579466997422514e-09, 9.585680693646736e-09 ], "gamma_dfa": 0.09615167022275273, "acc_eval": 0.296875, "loss_eval": 1.9497017860412598, "epoch": 86 }, { "hidden_norms": [ 38506.49609375, 89593104.0, 314968672.0, 577511168.0, 721761728.0 ], "bp_grad_norms_per_sample_med": [ 5.099763100702148e-08, 2.7151769721456276e-10, 2.698610224172171e-10, 2.6943663966605413e-10, 2.6953861365086595e-10 ], "bp_grad_norms_F": [ 2.73057457889081e-06, 9.698882585951196e-09, 9.564125491579034e-09, 9.561379243905321e-09, 9.567577841096409e-09 ], "gamma_dfa": 0.09604650201799814, "acc_eval": 0.2998046875, "loss_eval": 1.948227882385254, "epoch": 87 }, { "hidden_norms": [ 38536.46875, 89827632.0, 315715328.0, 578913664.0, 723505408.0 ], "bp_grad_norms_per_sample_med": [ 5.074277709127273e-08, 2.7221166987168033e-10, 2.7026783588901537e-10, 2.700663026544703e-10, 2.7004307123768e-10 ], "bp_grad_norms_F": [ 2.727413175307447e-06, 9.684548274435656e-09, 9.549998125635284e-09, 9.547248325247892e-09, 9.553437152476363e-09 ], "gamma_dfa": 0.09602321147394832, "acc_eval": 0.2978515625, "loss_eval": 1.9482835531234741, "epoch": 88 }, { "hidden_norms": [ 38560.86328125, 90036944.0, 316345728.0, 580143808.0, 725043392.0 ], "bp_grad_norms_per_sample_med": [ 5.10075821580358e-08, 2.70407807256845e-10, 2.6787719265009e-10, 2.677959520802631e-10, 2.679190480581184e-10 ], "bp_grad_norms_F": [ 2.7208343453821726e-06, 9.672045386821537e-09, 9.538242196072133e-09, 9.535500389290519e-09, 9.541698986481606e-09 ], "gamma_dfa": 0.09616725159867201, "acc_eval": 0.3017578125, "loss_eval": 1.9490463733673096, "epoch": 89 }, { "hidden_norms": [ 38581.62890625, 90197056.0, 316901888.0, 581085248.0, 726214080.0 ], "bp_grad_norms_per_sample_med": [ 5.062888064344406e-08, 2.7050772732906125e-10, 2.680498045748436e-10, 2.6770730077174676e-10, 2.6768456895531756e-10 ], "bp_grad_norms_F": [ 2.7148839762958232e-06, 9.659022026653474e-09, 9.525311206459719e-09, 9.522568511499685e-09, 9.528759115084995e-09 ], "gamma_dfa": 0.09604255046724575, "acc_eval": 0.2998046875, "loss_eval": 1.9472681283950806, "epoch": 90 }, { "hidden_norms": [ 38598.60546875, 90331488.0, 317399072.0, 581959360.0, 727306816.0 ], "bp_grad_norms_per_sample_med": [ 5.070089059699967e-08, 2.706254109696715e-10, 2.6912555517455417e-10, 2.687201572371123e-10, 2.686441624710767e-10 ], "bp_grad_norms_F": [ 2.7157270778843667e-06, 9.650602983413137e-09, 9.516874399650987e-09, 9.514130816512534e-09, 9.520310761956807e-09 ], "gamma_dfa": 0.09604466614109697, "acc_eval": 0.296875, "loss_eval": 1.9475460052490234, "epoch": 91 }, { "hidden_norms": [ 38612.046875, 90438432.0, 317761152.0, 582634240.0, 728132928.0 ], "bp_grad_norms_per_sample_med": [ 5.071476039120171e-08, 2.693741063541921e-10, 2.670912935265335e-10, 2.670463572496118e-10, 2.6704632949403617e-10 ], "bp_grad_norms_F": [ 2.7161215712112607e-06, 9.646365484172748e-09, 9.512908683007026e-09, 9.51017486983119e-09, 9.516351262561784e-09 ], "gamma_dfa": 0.09614986698579742, "acc_eval": 0.3017578125, "loss_eval": 1.947176218032837, "epoch": 92 }, { "hidden_norms": [ 38622.60546875, 90514344.0, 318023872.0, 583138880.0, 728758976.0 ], "bp_grad_norms_per_sample_med": [ 5.0669719087181875e-08, 2.7007937553058525e-10, 2.6770055616687216e-10, 2.676309729388038e-10, 2.678066102212995e-10 ], "bp_grad_norms_F": [ 2.715124537644442e-06, 9.639773423941733e-09, 9.506337939058085e-09, 9.503595244098051e-09, 9.509768084114967e-09 ], "gamma_dfa": 0.09608547511743382, "acc_eval": 0.30078125, "loss_eval": 1.9474897384643555, "epoch": 93 }, { "hidden_norms": [ 38631.16796875, 90589928.0, 318254208.0, 583549632.0, 729273152.0 ], "bp_grad_norms_per_sample_med": [ 5.0695071251993795e-08, 2.704435009270867e-10, 2.6853075318911124e-10, 2.682237765228024e-10, 2.6814858666845964e-10 ], "bp_grad_norms_F": [ 2.7134594802191714e-06, 9.634878672670766e-09, 9.501549769197482e-09, 9.498809738772707e-09, 9.504978137897524e-09 ], "gamma_dfa": 0.0960953844114556, "acc_eval": 0.2978515625, "loss_eval": 1.9472770690917969, "epoch": 94 }, { "hidden_norms": [ 38638.31640625, 90643280.0, 318415136.0, 583858560.0, 729656640.0 ], "bp_grad_norms_per_sample_med": [ 5.078240761235975e-08, 2.6967122979115743e-10, 2.669718335290838e-10, 2.6691132637424175e-10, 2.6697202781811313e-10 ], "bp_grad_norms_F": [ 2.711297611313057e-06, 9.631804687160184e-09, 9.498727138179675e-09, 9.495988884111739e-09, 9.502159947771815e-09 ], "gamma_dfa": 0.09613717825050117, "acc_eval": 0.2998046875, "loss_eval": 1.94759202003479, "epoch": 95 }, { "hidden_norms": [ 38642.26171875, 90677816.0, 318520992.0, 584046976.0, 729889984.0 ], "bp_grad_norms_per_sample_med": [ 5.069002995128358e-08, 2.6985705336990407e-10, 2.6735619274020905e-10, 2.671637633344659e-10, 2.6708837919109385e-10 ], "bp_grad_norms_F": [ 2.7110704650112893e-06, 9.629748554118578e-09, 9.496692321420142e-09, 9.493953179173786e-09, 9.500122466477023e-09 ], "gamma_dfa": 0.09612438916155952, "acc_eval": 0.2998046875, "loss_eval": 1.9474642276763916, "epoch": 96 }, { "hidden_norms": [ 38644.16015625, 90695256.0, 318576288.0, 584137856.0, 730003328.0 ], "bp_grad_norms_per_sample_med": [ 5.070784681038276e-08, 2.6936791686082984e-10, 2.671484977678773e-10, 2.668835430430505e-10, 2.671484977678773e-10 ], "bp_grad_norms_F": [ 2.710563421715051e-06, 9.628578823139833e-09, 9.495578545681838e-09, 9.492838515257063e-09, 9.499009578917139e-09 ], "gamma_dfa": 0.09612188487153617, "acc_eval": 0.298828125, "loss_eval": 1.9476267099380493, "epoch": 97 }, { "hidden_norms": [ 38646.0625, 90710400.0, 318627968.0, 584229760.0, 730119232.0 ], "bp_grad_norms_per_sample_med": [ 5.075278863841959e-08, 2.692224221334527e-10, 2.671664001141494e-10, 2.669355292361786e-10, 2.6700280875147087e-10 ], "bp_grad_norms_F": [ 2.7103426418761956e-06, 9.62763913037179e-09, 9.494667274623225e-09, 9.49192813237687e-09, 9.498098307858527e-09 ], "gamma_dfa": 0.09612667236069683, "acc_eval": 0.2998046875, "loss_eval": 1.9476723670959473, "epoch": 98 }, { "hidden_norms": [ 38646.953125, 90717408.0, 318651872.0, 584275776.0, 730176960.0 ], "bp_grad_norms_per_sample_med": [ 5.076975639894954e-08, 2.691815659261465e-10, 2.671429466527542e-10, 2.669321430559535e-10, 2.669318377446217e-10 ], "bp_grad_norms_F": [ 2.7102296371595003e-06, 9.62716750763093e-09, 9.494214303629178e-09, 9.491475161382823e-09, 9.4976462250429e-09 ], "gamma_dfa": 0.09612801273397054, "acc_eval": 0.2998046875, "loss_eval": 1.9476864337921143, "epoch": 99 }, { "hidden_norms": [ 38646.98046875, 90717592.0, 318652416.0, 584276736.0, 730178112.0 ], "bp_grad_norms_per_sample_med": [ 5.076372033840926e-08, 2.692036038531853e-10, 2.6715371581609304e-10, 2.669119369969053e-10, 2.6695023969125486e-10 ], "bp_grad_norms_F": [ 2.710211447265465e-06, 9.627171060344608e-09, 9.494216968164437e-09, 9.491476937739662e-09, 9.497648001399739e-09 ], "gamma_dfa": 0.09612751441454748, "acc_eval": 0.2998046875, "loss_eval": 1.947685956954956, "epoch": 100 } ] }