diff options
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_evolution_s456.json')
| -rw-r--r-- | results/snapshot_evolution_v2/snapshot_evolution_s456.json | 5473 |
1 files changed, 5473 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s456.json b/results/snapshot_evolution_v2/snapshot_evolution_s456.json new file mode 100644 index 0000000..f78065f --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_evolution_s456.json @@ -0,0 +1,5473 @@ +{ + "config": { + "output_dir": "results/snapshot_evolution_v2", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 456, + "depth": 4, + "d_hidden": 256, + "log_every": 1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010079912608489394, + 0.0010035138111561537, + 0.0009970925748348236, + 0.0009936393471434712, + 0.000986678060144186 + ], + "bp_grad_norms_F": [ + 0.035574451088905334, + 0.035288579761981964, + 0.035048045217990875, + 0.0346725769340992, + 0.03439188003540039 + ], + "gamma_dfa": NaN, + "acc_eval": 0.0927734375, + "loss_eval": 2.4863264560699463, + "epoch": 0 + }, + { + "hidden_norms": [ + 79.9596176147461, + 82.38219451904297, + 86.97193145751953, + 92.46615600585938, + 99.17337799072266 + ], + "bp_grad_norms_per_sample_med": [ + 5.704927025362849e-05, + 5.414035331341438e-05, + 5.3104751714272425e-05, + 5.354730456019752e-05, + 5.5780339607736096e-05 + ], + "bp_grad_norms_F": [ + 0.00240120361559093, + 0.0021707164123654366, + 0.002052225871011615, + 0.0020026240963488817, + 0.002049861242994666 + ], + "gamma_dfa": NaN, + "acc_eval": 0.400390625, + "loss_eval": 1.6942739486694336, + "epoch": 1 + }, + { + "hidden_norms": [ + 95.21885681152344, + 97.9500732421875, + 101.84932708740234, + 108.15538787841797, + 115.16011810302734 + ], + "bp_grad_norms_per_sample_med": [ + 4.467168764676899e-05, + 4.3202508095419034e-05, + 4.3004638428101316e-05, + 4.286228431737982e-05, + 4.4292191887507215e-05 + ], + "bp_grad_norms_F": [ + 0.0018949288642033935, + 0.0017146588070318103, + 0.0016399234300479293, + 0.001598119386471808, + 0.0016228299355134368 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4599609375, + "loss_eval": 1.5051867961883545, + "epoch": 2 + }, + { + "hidden_norms": [ + 112.65824890136719, + 111.87681579589844, + 114.76032257080078, + 118.74363708496094, + 125.05441284179688 + ], + "bp_grad_norms_per_sample_med": [ + 4.4033156882505864e-05, + 4.2794465116458014e-05, + 4.2031828343169764e-05, + 4.134616028750315e-05, + 4.226301462040283e-05 + ], + "bp_grad_norms_F": [ + 0.0018527565989643335, + 0.0017638156423345208, + 0.0016669610049575567, + 0.0015881577273830771, + 0.0015705813420936465 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4931640625, + "loss_eval": 1.4331163167953491, + "epoch": 3 + }, + { + "hidden_norms": [ + 126.20967102050781, + 125.90274810791016, + 128.2918243408203, + 131.685302734375, + 136.71499633789062 + ], + "bp_grad_norms_per_sample_med": [ + 4.358301157481037e-05, + 4.267259282642044e-05, + 4.196130612399429e-05, + 4.08500200137496e-05, + 4.0281276596942917e-05 + ], + "bp_grad_norms_F": [ + 0.0018887611804530025, + 0.0017927174922078848, + 0.0016837789444252849, + 0.0015876276884227991, + 0.0015263468958437443 + ], + "gamma_dfa": NaN, + "acc_eval": 0.490234375, + "loss_eval": 1.4055290222167969, + "epoch": 4 + }, + { + "hidden_norms": [ + 137.673583984375, + 136.8435516357422, + 138.64651489257812, + 141.41473388671875, + 147.87835693359375 + ], + "bp_grad_norms_per_sample_med": [ + 4.085261025466025e-05, + 4.06657018174883e-05, + 3.941181785194203e-05, + 3.858502532239072e-05, + 3.7998870539013296e-05 + ], + "bp_grad_norms_F": [ + 0.001770049100741744, + 0.0016922445502132177, + 0.0016029543476179242, + 0.0015241446672007442, + 0.0014664788031950593 + ], + "gamma_dfa": NaN, + "acc_eval": 0.50390625, + "loss_eval": 1.3763911724090576, + "epoch": 5 + }, + { + "hidden_norms": [ + 150.45315551757812, + 148.60609436035156, + 150.3750457763672, + 152.9460906982422, + 158.2902069091797 + ], + "bp_grad_norms_per_sample_med": [ + 3.8344696804415435e-05, + 3.8422465877374634e-05, + 3.834897142951377e-05, + 3.7070902180857956e-05, + 3.6289642594056204e-05 + ], + "bp_grad_norms_F": [ + 0.0017990845954045653, + 0.001743242726661265, + 0.0016358466818928719, + 0.0015305348206311464, + 0.0014392968732863665 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5166015625, + "loss_eval": 1.373401165008545, + "epoch": 6 + }, + { + "hidden_norms": [ + 162.06126403808594, + 159.53811645507812, + 158.62655639648438, + 160.54307556152344, + 165.60415649414062 + ], + "bp_grad_norms_per_sample_med": [ + 3.797870522248559e-05, + 3.766914960579015e-05, + 3.7873480323469266e-05, + 3.735603968380019e-05, + 3.6521956644719467e-05 + ], + "bp_grad_norms_F": [ + 0.001707478309981525, + 0.0016470234841108322, + 0.0015834521036595106, + 0.001506388420239091, + 0.001406461582519114 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5283203125, + "loss_eval": 1.3223559856414795, + "epoch": 7 + }, + { + "hidden_norms": [ + 169.8936309814453, + 168.42221069335938, + 169.54115295410156, + 171.452880859375, + 176.4298553466797 + ], + "bp_grad_norms_per_sample_med": [ + 3.760562321986072e-05, + 3.8139285607030615e-05, + 3.7332967622205615e-05, + 3.670771184260957e-05, + 3.4867567592300475e-05 + ], + "bp_grad_norms_F": [ + 0.001674071652814746, + 0.0016396756982430816, + 0.001556537114083767, + 0.001464220928028226, + 0.0013669237960129976 + ], + "gamma_dfa": NaN, + "acc_eval": 0.529296875, + "loss_eval": 1.3310301303863525, + "epoch": 8 + }, + { + "hidden_norms": [ + 177.821044921875, + 176.60687255859375, + 177.76409912109375, + 179.53733825683594, + 184.176513671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.643108357209712e-05, + 3.605252277338877e-05, + 3.6002034903503954e-05, + 3.529640525812283e-05, + 3.386645403224975e-05 + ], + "bp_grad_norms_F": [ + 0.0016080558998510242, + 0.0015692447777837515, + 0.0014910849276930094, + 0.0014210963854566216, + 0.0013221093686297536 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5390625, + "loss_eval": 1.3072502613067627, + "epoch": 9 + }, + { + "hidden_norms": [ + 188.1353759765625, + 184.39834594726562, + 184.91822814941406, + 185.82460021972656, + 191.45692443847656 + ], + "bp_grad_norms_per_sample_med": [ + 3.544713035807945e-05, + 3.5891316656488925e-05, + 3.613864828366786e-05, + 3.507022120174952e-05, + 3.361281778779812e-05 + ], + "bp_grad_norms_F": [ + 0.0015651460271328688, + 0.0015296414494514465, + 0.0014787326799705625, + 0.0014131872449070215, + 0.0013114992761984468 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5537109375, + "loss_eval": 1.2935423851013184, + "epoch": 10 + }, + { + "hidden_norms": [ + 193.53599548339844, + 189.33700561523438, + 190.08908081054688, + 192.31288146972656, + 198.0936737060547 + ], + "bp_grad_norms_per_sample_med": [ + 3.3899334084708244e-05, + 3.468272552709095e-05, + 3.463856774033047e-05, + 3.383589137229137e-05, + 3.240162550355308e-05 + ], + "bp_grad_norms_F": [ + 0.001495138043537736, + 0.0014781414065510035, + 0.0014301009941846132, + 0.0013711795909330249, + 0.0012839946430176497 + ], + "gamma_dfa": NaN, + "acc_eval": 0.544921875, + "loss_eval": 1.2766207456588745, + "epoch": 11 + }, + { + "hidden_norms": [ + 199.85023498535156, + 194.9699249267578, + 193.4657440185547, + 194.60928344726562, + 199.97662353515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.289094092906453e-05, + 3.539410317898728e-05, + 3.491900861263275e-05, + 3.4397991839796305e-05, + 3.252939859521575e-05 + ], + "bp_grad_norms_F": [ + 0.0015656249597668648, + 0.0015614606672897935, + 0.0015110056847333908, + 0.0014306820230558515, + 0.00130200176499784 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5439453125, + "loss_eval": 1.2812860012054443, + "epoch": 12 + }, + { + "hidden_norms": [ + 206.15440368652344, + 199.86099243164062, + 199.35470581054688, + 201.66831970214844, + 206.71054077148438 + ], + "bp_grad_norms_per_sample_med": [ + 3.430957076488994e-05, + 3.5125638532917947e-05, + 3.523785198922269e-05, + 3.404217568458989e-05, + 3.245573316235095e-05 + ], + "bp_grad_norms_F": [ + 0.0015102275647222996, + 0.0015037795528769493, + 0.001468595233745873, + 0.0013989906292408705, + 0.0012804438592866063 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5517578125, + "loss_eval": 1.2559274435043335, + "epoch": 13 + }, + { + "hidden_norms": [ + 209.39404296875, + 203.8543243408203, + 201.63771057128906, + 202.7413787841797, + 209.64585876464844 + ], + "bp_grad_norms_per_sample_med": [ + 3.3599189919186756e-05, + 3.511353497742675e-05, + 3.4795291867339984e-05, + 3.415898390812799e-05, + 3.225719046895392e-05 + ], + "bp_grad_norms_F": [ + 0.0015785910654813051, + 0.0015854343073442578, + 0.0015357385855168104, + 0.00144979078322649, + 0.0013052559224888682 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5478515625, + "loss_eval": 1.2778449058532715, + "epoch": 14 + }, + { + "hidden_norms": [ + 214.74293518066406, + 208.2928924560547, + 206.78591918945312, + 207.79452514648438, + 213.0249481201172 + ], + "bp_grad_norms_per_sample_med": [ + 3.347836172906682e-05, + 3.457088314462453e-05, + 3.509481393848546e-05, + 3.4477459848858416e-05, + 3.169552292092703e-05 + ], + "bp_grad_norms_F": [ + 0.0015018024714663625, + 0.0015100837917998433, + 0.0014814585447311401, + 0.0014098759274929762, + 0.0012745971325784922 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5693359375, + "loss_eval": 1.2316113710403442, + "epoch": 15 + }, + { + "hidden_norms": [ + 223.09906005859375, + 214.6353302001953, + 211.16726684570312, + 210.60520935058594, + 214.28952026367188 + ], + "bp_grad_norms_per_sample_med": [ + 3.5336081054992974e-05, + 3.693878170452081e-05, + 3.7104789953446016e-05, + 3.635902612586506e-05, + 3.3355980121996254e-05 + ], + "bp_grad_norms_F": [ + 0.0015461220173165202, + 0.0015768769662827253, + 0.0015498694265261292, + 0.001453379518352449, + 0.0013068238040432334 + ], + "gamma_dfa": NaN, + "acc_eval": 0.55078125, + "loss_eval": 1.2516858577728271, + "epoch": 16 + }, + { + "hidden_norms": [ + 225.36517333984375, + 217.36669921875, + 214.27880859375, + 215.62054443359375, + 219.76197814941406 + ], + "bp_grad_norms_per_sample_med": [ + 3.474476397968829e-05, + 3.609717168728821e-05, + 3.612042564782314e-05, + 3.547673986759037e-05, + 3.216006007278338e-05 + ], + "bp_grad_norms_F": [ + 0.001510953065007925, + 0.0015347315929830074, + 0.0015160846523940563, + 0.001440546941012144, + 0.0012782461708411574 + ], + "gamma_dfa": NaN, + "acc_eval": 0.583984375, + "loss_eval": 1.2262325286865234, + "epoch": 17 + }, + { + "hidden_norms": [ + 230.7099151611328, + 222.3380889892578, + 218.67819213867188, + 217.3147735595703, + 221.999755859375 + ], + "bp_grad_norms_per_sample_med": [ + 3.285402272013016e-05, + 3.4367294574622065e-05, + 3.490627204882912e-05, + 3.413260492379777e-05, + 3.064925112994388e-05 + ], + "bp_grad_norms_F": [ + 0.0015693235909566283, + 0.0015950833912938833, + 0.0015582602936774492, + 0.001467122812755406, + 0.0012723723193630576 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5751953125, + "loss_eval": 1.2127145528793335, + "epoch": 18 + }, + { + "hidden_norms": [ + 235.28932189941406, + 226.01202392578125, + 222.56756591796875, + 222.25152587890625, + 226.0247344970703 + ], + "bp_grad_norms_per_sample_med": [ + 3.336059671710245e-05, + 3.488900983938947e-05, + 3.518831363180652e-05, + 3.5047873097937554e-05, + 3.1955056329024956e-05 + ], + "bp_grad_norms_F": [ + 0.0015264152316376567, + 0.0015387749299407005, + 0.0015209508128464222, + 0.001451890799216926, + 0.00127940543461591 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5673828125, + "loss_eval": 1.2340281009674072, + "epoch": 19 + }, + { + "hidden_norms": [ + 239.98486328125, + 230.95614624023438, + 226.7176513671875, + 225.3818359375, + 231.0238037109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.4207379940198734e-05, + 3.5167759051546454e-05, + 3.5256896808277816e-05, + 3.462574022705667e-05, + 3.117474989267066e-05 + ], + "bp_grad_norms_F": [ + 0.0015223841182887554, + 0.0015598630998283625, + 0.0015445069875568151, + 0.0014689662493765354, + 0.0012761331163346767 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2441283464431763, + "epoch": 20 + }, + { + "hidden_norms": [ + 245.0663299560547, + 233.2012939453125, + 227.60426330566406, + 226.96006774902344, + 229.30145263671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.25386063195765e-05, + 3.39963698934298e-05, + 3.503257903503254e-05, + 3.4624255931703374e-05, + 3.013665264006704e-05 + ], + "bp_grad_norms_F": [ + 0.001554132904857397, + 0.0015968671068549156, + 0.001575724920257926, + 0.0014765377854928374, + 0.0012655528262257576 + ], + "gamma_dfa": NaN, + "acc_eval": 0.595703125, + "loss_eval": 1.1905839443206787, + "epoch": 21 + }, + { + "hidden_norms": [ + 246.93258666992188, + 235.25485229492188, + 232.71095275878906, + 231.27796936035156, + 235.4611358642578 + ], + "bp_grad_norms_per_sample_med": [ + 3.248557914048433e-05, + 3.448772622505203e-05, + 3.525316424202174e-05, + 3.4218086511828005e-05, + 2.997798401338514e-05 + ], + "bp_grad_norms_F": [ + 0.001511804643087089, + 0.0015418389812111855, + 0.001536028808914125, + 0.0014609270729124546, + 0.001262559788301587 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.2032543420791626, + "epoch": 22 + }, + { + "hidden_norms": [ + 251.2838592529297, + 237.0211639404297, + 234.6432342529297, + 233.30433654785156, + 238.11598205566406 + ], + "bp_grad_norms_per_sample_med": [ + 3.3030770282493904e-05, + 3.484229455352761e-05, + 3.59142868546769e-05, + 3.533583367243409e-05, + 3.1214847695082426e-05 + ], + "bp_grad_norms_F": [ + 0.0015120860189199448, + 0.00155613012611866, + 0.0015533699188381433, + 0.001477457000873983, + 0.0012758751399815083 + ], + "gamma_dfa": NaN, + "acc_eval": 0.568359375, + "loss_eval": 1.220862627029419, + "epoch": 23 + }, + { + "hidden_norms": [ + 253.3640594482422, + 242.6001739501953, + 237.11773681640625, + 237.31105041503906, + 241.1314697265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.295885835541412e-05, + 3.492692485451698e-05, + 3.562758502084762e-05, + 3.515293064992875e-05, + 3.0970571970101446e-05 + ], + "bp_grad_norms_F": [ + 0.001516172313131392, + 0.0015499184373766184, + 0.0015383078716695309, + 0.0014658188447356224, + 0.0012659834465011954 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.1925604343414307, + "epoch": 24 + }, + { + "hidden_norms": [ + 258.6325378417969, + 245.05575561523438, + 239.04722595214844, + 237.04385375976562, + 240.51011657714844 + ], + "bp_grad_norms_per_sample_med": [ + 3.258220021962188e-05, + 3.459660729276948e-05, + 3.553628994268365e-05, + 3.461805317783728e-05, + 3.001722870976664e-05 + ], + "bp_grad_norms_F": [ + 0.0015354488277807832, + 0.001572331297211349, + 0.0015721773961558938, + 0.0014915125211700797, + 0.0012740870006382465 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58203125, + "loss_eval": 1.1843492984771729, + "epoch": 25 + }, + { + "hidden_norms": [ + 262.35577392578125, + 247.456298828125, + 241.52687072753906, + 239.8603057861328, + 242.48818969726562 + ], + "bp_grad_norms_per_sample_med": [ + 3.335328074172139e-05, + 3.581988130463287e-05, + 3.6700876080431044e-05, + 3.52635579474736e-05, + 3.091046164627187e-05 + ], + "bp_grad_norms_F": [ + 0.0015506797935813665, + 0.0016048819525167346, + 0.0016078166663646698, + 0.0015189298428595066, + 0.001287299208343029 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.2021183967590332, + "epoch": 26 + }, + { + "hidden_norms": [ + 262.69769287109375, + 248.58924865722656, + 243.61415100097656, + 242.7408905029297, + 243.58761596679688 + ], + "bp_grad_norms_per_sample_med": [ + 3.363215728313662e-05, + 3.542406557244249e-05, + 3.617940456024371e-05, + 3.522956103552133e-05, + 3.093081613769755e-05 + ], + "bp_grad_norms_F": [ + 0.0015515872510150075, + 0.0015918170101940632, + 0.0015870564384385943, + 0.0015067857457324862, + 0.001285396981984377 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.1753299236297607, + "epoch": 27 + }, + { + "hidden_norms": [ + 264.57330322265625, + 252.62904357910156, + 246.43833923339844, + 245.4523468017578, + 247.43896484375 + ], + "bp_grad_norms_per_sample_med": [ + 3.3458851248724386e-05, + 3.510742317303084e-05, + 3.596700116759166e-05, + 3.530932735884562e-05, + 3.0871200578985736e-05 + ], + "bp_grad_norms_F": [ + 0.0015561054460704327, + 0.0015992044936865568, + 0.0016016490990296006, + 0.0015203922521322966, + 0.001274992828257382 + ], + "gamma_dfa": NaN, + "acc_eval": 0.587890625, + "loss_eval": 1.1872658729553223, + "epoch": 28 + }, + { + "hidden_norms": [ + 268.63336181640625, + 253.74609375, + 247.2230224609375, + 244.07066345214844, + 248.91635131835938 + ], + "bp_grad_norms_per_sample_med": [ + 3.388441837159917e-05, + 3.55305674020201e-05, + 3.711709723575041e-05, + 3.565939550753683e-05, + 3.06438232655637e-05 + ], + "bp_grad_norms_F": [ + 0.0015880814753472805, + 0.001632494037039578, + 0.0016352345701307058, + 0.001542495796456933, + 0.001282386132515967 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1748178005218506, + "epoch": 29 + }, + { + "hidden_norms": [ + 269.5155944824219, + 254.65687561035156, + 249.08070373535156, + 246.4084930419922, + 248.03065490722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.340150215080939e-05, + 3.542837657732889e-05, + 3.656153057818301e-05, + 3.62997452612035e-05, + 3.134588405373506e-05 + ], + "bp_grad_norms_F": [ + 0.0015988025115802884, + 0.0016428054077550769, + 0.0016343789175152779, + 0.00154898373875767, + 0.001290567102842033 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.184614658355713, + "epoch": 30 + }, + { + "hidden_norms": [ + 273.0482482910156, + 255.88157653808594, + 249.6538543701172, + 246.09181213378906, + 250.09861755371094 + ], + "bp_grad_norms_per_sample_med": [ + 3.485401612124406e-05, + 3.613552325987257e-05, + 3.727355215232819e-05, + 3.6410303437151015e-05, + 3.111722253379412e-05 + ], + "bp_grad_norms_F": [ + 0.0016218513483181596, + 0.001677986583672464, + 0.0016929754056036472, + 0.001593436230905354, + 0.0013143697287887335 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5673828125, + "loss_eval": 1.2012369632720947, + "epoch": 31 + }, + { + "hidden_norms": [ + 274.05010986328125, + 255.77792358398438, + 247.96664428710938, + 246.15379333496094, + 248.44847106933594 + ], + "bp_grad_norms_per_sample_med": [ + 3.431778895901516e-05, + 3.609380655689165e-05, + 3.7377911212388426e-05, + 3.6012417695019394e-05, + 3.0985673220129684e-05 + ], + "bp_grad_norms_F": [ + 0.0016116296174004674, + 0.0016683804569765925, + 0.0016786488704383373, + 0.0015687323175370693, + 0.001289981184527278 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1654620170593262, + "epoch": 32 + }, + { + "hidden_norms": [ + 274.6156921386719, + 257.166259765625, + 251.9473876953125, + 251.01661682128906, + 252.84222412109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.185174864483997e-05, + 3.433173696976155e-05, + 3.572784407879226e-05, + 3.4680619137361646e-05, + 2.997389128722716e-05 + ], + "bp_grad_norms_F": [ + 0.0015743848634883761, + 0.001610185718163848, + 0.0016222007106989622, + 0.0015360275283455849, + 0.0012806184822693467 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.1679120063781738, + "epoch": 33 + }, + { + "hidden_norms": [ + 274.3385009765625, + 256.1404724121094, + 249.90264892578125, + 247.3904266357422, + 249.5623016357422 + ], + "bp_grad_norms_per_sample_med": [ + 3.419954009586945e-05, + 3.6830995668424293e-05, + 3.8464357203338295e-05, + 3.64230691047851e-05, + 3.0958552088122815e-05 + ], + "bp_grad_norms_F": [ + 0.0016346886986866593, + 0.0016823107143864036, + 0.0016956342151388526, + 0.0015958002768456936, + 0.0013100137002766132 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5927734375, + "loss_eval": 1.1599082946777344, + "epoch": 34 + }, + { + "hidden_norms": [ + 276.65985107421875, + 258.50543212890625, + 251.1997833251953, + 247.7036895751953, + 248.07545471191406 + ], + "bp_grad_norms_per_sample_med": [ + 3.384043520782143e-05, + 3.567537714843638e-05, + 3.686825220938772e-05, + 3.5754670534515753e-05, + 3.0301211154437624e-05 + ], + "bp_grad_norms_F": [ + 0.0016451155534014106, + 0.0016956959152594209, + 0.001703266054391861, + 0.0016015227884054184, + 0.0013142916141077876 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.148215889930725, + "epoch": 35 + }, + { + "hidden_norms": [ + 279.6298522949219, + 261.1481018066406, + 253.67742919921875, + 250.86221313476562, + 250.6768035888672 + ], + "bp_grad_norms_per_sample_med": [ + 3.341220144648105e-05, + 3.499272861517966e-05, + 3.6701327189803123e-05, + 3.602671858971007e-05, + 3.081390605075285e-05 + ], + "bp_grad_norms_F": [ + 0.0016287019243463874, + 0.0016769150970503688, + 0.0016951658762991428, + 0.0015969424275681376, + 0.0013187138829380274 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.1451219320297241, + "epoch": 36 + }, + { + "hidden_norms": [ + 277.2866516113281, + 258.4331359863281, + 251.4995880126953, + 249.0448455810547, + 248.5166015625 + ], + "bp_grad_norms_per_sample_med": [ + 3.2723561162129045e-05, + 3.4428499930072576e-05, + 3.571901106624864e-05, + 3.4436179703334346e-05, + 2.9252587410155684e-05 + ], + "bp_grad_norms_F": [ + 0.0016638770466670394, + 0.0017149352934211493, + 0.0017208203207701445, + 0.0016291715437546372, + 0.0013402353506535292 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.145239233970642, + "epoch": 37 + }, + { + "hidden_norms": [ + 279.7109680175781, + 259.3131103515625, + 250.73587036132812, + 247.214111328125, + 249.20944213867188 + ], + "bp_grad_norms_per_sample_med": [ + 3.449835639912635e-05, + 3.682902752188966e-05, + 3.780073166126385e-05, + 3.652105442597531e-05, + 3.046718666155357e-05 + ], + "bp_grad_norms_F": [ + 0.001753124757669866, + 0.0018144651548936963, + 0.0018306451383978128, + 0.0017095789080485702, + 0.001379602705128491 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5908203125, + "loss_eval": 1.1677792072296143, + "epoch": 38 + }, + { + "hidden_norms": [ + 279.9946594238281, + 260.2458190917969, + 252.0008087158203, + 250.56716918945312, + 250.73135375976562 + ], + "bp_grad_norms_per_sample_med": [ + 3.489958180580288e-05, + 3.730110984179191e-05, + 3.791403287323192e-05, + 3.650010330602527e-05, + 3.076100256294012e-05 + ], + "bp_grad_norms_F": [ + 0.0017145961755886674, + 0.0017580300336703658, + 0.001775139826349914, + 0.0016669962788000703, + 0.0013597821816802025 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1510668992996216, + "epoch": 39 + }, + { + "hidden_norms": [ + 280.5132751464844, + 260.75970458984375, + 252.2814178466797, + 249.84548950195312, + 248.41783142089844 + ], + "bp_grad_norms_per_sample_med": [ + 3.552919588400982e-05, + 3.777973688556813e-05, + 3.952483166358434e-05, + 3.783141073654406e-05, + 3.1490348192164674e-05 + ], + "bp_grad_norms_F": [ + 0.0017431442392989993, + 0.0017984459409490228, + 0.0018199888290837407, + 0.0017078405944630504, + 0.0013792469399049878 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1412110328674316, + "epoch": 40 + }, + { + "hidden_norms": [ + 279.3873596191406, + 259.55096435546875, + 251.9462432861328, + 247.29443359375, + 247.82852172851562 + ], + "bp_grad_norms_per_sample_med": [ + 3.456972990534268e-05, + 3.654780448414385e-05, + 3.848340566037223e-05, + 3.736113285413012e-05, + 3.1597948691342026e-05 + ], + "bp_grad_norms_F": [ + 0.0017544032307341695, + 0.0018107325304299593, + 0.0018319039372727275, + 0.0017261328175663948, + 0.0013868761016055942 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1418483257293701, + "epoch": 41 + }, + { + "hidden_norms": [ + 282.4360656738281, + 261.22149658203125, + 251.49090576171875, + 247.5189208984375, + 247.03427124023438 + ], + "bp_grad_norms_per_sample_med": [ + 3.5179280530428514e-05, + 3.728548108483665e-05, + 3.779769394895993e-05, + 3.6327692214399576e-05, + 3.026284321094863e-05 + ], + "bp_grad_norms_F": [ + 0.0017881252570077777, + 0.0018441356951370835, + 0.0018691252917051315, + 0.0017487212317064404, + 0.0013921407517045736 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1468144655227661, + "epoch": 42 + }, + { + "hidden_norms": [ + 283.1267395019531, + 261.29425048828125, + 252.38563537597656, + 248.00192260742188, + 246.58505249023438 + ], + "bp_grad_norms_per_sample_med": [ + 3.485176421236247e-05, + 3.699021544889547e-05, + 3.812833165284246e-05, + 3.7145182432141155e-05, + 3.1198313081404194e-05 + ], + "bp_grad_norms_F": [ + 0.0017692983383312821, + 0.0018438888946548104, + 0.001876220339909196, + 0.0017641744343563914, + 0.0014044356066733599 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1329892873764038, + "epoch": 43 + }, + { + "hidden_norms": [ + 281.29327392578125, + 259.43359375, + 249.52906799316406, + 246.0892333984375, + 243.162109375 + ], + "bp_grad_norms_per_sample_med": [ + 3.586204911698587e-05, + 3.787377499975264e-05, + 3.9215286960825324e-05, + 3.7436715501826257e-05, + 3.160976120852865e-05 + ], + "bp_grad_norms_F": [ + 0.0018376735970377922, + 0.0019067999674007297, + 0.0019337635021656752, + 0.0017983472207561135, + 0.001438757055439055 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6181640625, + "loss_eval": 1.144508957862854, + "epoch": 44 + }, + { + "hidden_norms": [ + 282.5230407714844, + 259.55322265625, + 248.72308349609375, + 245.0394287109375, + 243.0651092529297 + ], + "bp_grad_norms_per_sample_med": [ + 3.6309906136011705e-05, + 3.868114436045289e-05, + 4.0484872442903e-05, + 3.8203681469894946e-05, + 3.144023139611818e-05 + ], + "bp_grad_norms_F": [ + 0.0018340122187510133, + 0.0019134157337248325, + 0.0019425065256655216, + 0.0018252682639285922, + 0.001443033921532333 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.1290326118469238, + "epoch": 45 + }, + { + "hidden_norms": [ + 280.8598327636719, + 260.14111328125, + 250.84779357910156, + 245.9561767578125, + 243.0910186767578 + ], + "bp_grad_norms_per_sample_med": [ + 3.4626806154847145e-05, + 3.693445250974037e-05, + 3.8311845855787396e-05, + 3.7721722037531435e-05, + 3.145459049846977e-05 + ], + "bp_grad_norms_F": [ + 0.0018591763218864799, + 0.0019209657330065966, + 0.0019388735527172685, + 0.001830682042054832, + 0.001447839429602027 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1423537731170654, + "epoch": 46 + }, + { + "hidden_norms": [ + 280.17266845703125, + 259.26568603515625, + 248.45452880859375, + 243.45750427246094, + 241.2735137939453 + ], + "bp_grad_norms_per_sample_med": [ + 3.609486884670332e-05, + 3.887504499289207e-05, + 4.01619981857948e-05, + 3.9294092857744545e-05, + 3.1412804673891515e-05 + ], + "bp_grad_norms_F": [ + 0.0018975000130012631, + 0.0019804267212748528, + 0.002001592656597495, + 0.0018729616422206163, + 0.0014571875799447298 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.1366385221481323, + "epoch": 47 + }, + { + "hidden_norms": [ + 281.79833984375, + 259.25860595703125, + 249.18551635742188, + 244.24977111816406, + 240.67100524902344 + ], + "bp_grad_norms_per_sample_med": [ + 3.47710374626331e-05, + 3.7153975426917896e-05, + 3.885528349201195e-05, + 3.792768620769493e-05, + 3.113777347607538e-05 + ], + "bp_grad_norms_F": [ + 0.0019318967824801803, + 0.0019981141667813063, + 0.0020311782136559486, + 0.0018996316939592361, + 0.0014788025291636586 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6162109375, + "loss_eval": 1.138331651687622, + "epoch": 48 + }, + { + "hidden_norms": [ + 282.3840637207031, + 258.1807861328125, + 248.13995361328125, + 243.45587158203125, + 239.51858520507812 + ], + "bp_grad_norms_per_sample_med": [ + 3.68369001080282e-05, + 3.935660788556561e-05, + 4.189974788459949e-05, + 3.9929436752572656e-05, + 3.188087430316955e-05 + ], + "bp_grad_norms_F": [ + 0.0019372758688405156, + 0.0020036858040839434, + 0.0020287453662604094, + 0.001896715839393437, + 0.0014835885958746076 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1377842426300049, + "epoch": 49 + }, + { + "hidden_norms": [ + 280.9283142089844, + 257.81524658203125, + 248.47984313964844, + 241.96157836914062, + 238.4756317138672 + ], + "bp_grad_norms_per_sample_med": [ + 3.7310775951482356e-05, + 3.98769298044499e-05, + 4.1753111872822046e-05, + 4.021048516733572e-05, + 3.21856678056065e-05 + ], + "bp_grad_norms_F": [ + 0.0019433718407526612, + 0.0020235073752701283, + 0.002055324148386717, + 0.0019370814552530646, + 0.0015049076173454523 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.133098840713501, + "epoch": 50 + }, + { + "hidden_norms": [ + 279.66400146484375, + 256.7322082519531, + 246.65223693847656, + 241.45947265625, + 236.65582275390625 + ], + "bp_grad_norms_per_sample_med": [ + 3.620017014327459e-05, + 3.800772174145095e-05, + 4.072795491083525e-05, + 3.888807259500027e-05, + 3.182498039677739e-05 + ], + "bp_grad_norms_F": [ + 0.0019729172345250845, + 0.002036863239482045, + 0.0020802877843379974, + 0.0019662927370518446, + 0.0015235996106639504 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1315571069717407, + "epoch": 51 + }, + { + "hidden_norms": [ + 280.00152587890625, + 258.0238037109375, + 247.4223175048828, + 240.8101348876953, + 237.3229217529297 + ], + "bp_grad_norms_per_sample_med": [ + 3.6401659599505365e-05, + 3.855170143651776e-05, + 4.065703978994861e-05, + 3.844475213554688e-05, + 3.1645795388612896e-05 + ], + "bp_grad_norms_F": [ + 0.0019983802922070026, + 0.0020701857283711433, + 0.002107742242515087, + 0.001981276087462902, + 0.0015306670684367418 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.137194037437439, + "epoch": 52 + }, + { + "hidden_norms": [ + 278.19708251953125, + 255.23036193847656, + 245.5857696533203, + 239.48196411132812, + 235.09983825683594 + ], + "bp_grad_norms_per_sample_med": [ + 3.97727417293936e-05, + 4.185501529718749e-05, + 4.392741175252013e-05, + 4.302372326492332e-05, + 3.48737376043573e-05 + ], + "bp_grad_norms_F": [ + 0.002044696593657136, + 0.00211329385638237, + 0.002144050318747759, + 0.0020148823969066143, + 0.0015573638956993818 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1354646682739258, + "epoch": 53 + }, + { + "hidden_norms": [ + 276.7043762207031, + 255.62408447265625, + 243.71484375, + 238.2984161376953, + 233.8153076171875 + ], + "bp_grad_norms_per_sample_med": [ + 3.715257116709836e-05, + 3.887641287292354e-05, + 4.099323268746957e-05, + 3.948296944145113e-05, + 3.221148654120043e-05 + ], + "bp_grad_norms_F": [ + 0.0020365805830806494, + 0.00209893099963665, + 0.0021342532709240913, + 0.0020123852882534266, + 0.0015702869277447462 + ], + "gamma_dfa": NaN, + "acc_eval": 0.623046875, + "loss_eval": 1.1295127868652344, + "epoch": 54 + }, + { + "hidden_norms": [ + 279.308349609375, + 255.30587768554688, + 243.6786651611328, + 237.71823120117188, + 232.89991760253906 + ], + "bp_grad_norms_per_sample_med": [ + 3.9407084841514006e-05, + 4.1900668293237686e-05, + 4.364689812064171e-05, + 4.154618363827467e-05, + 3.264051701989956e-05 + ], + "bp_grad_norms_F": [ + 0.0021011638455092907, + 0.002175872679799795, + 0.002217113971710205, + 0.002071501687169075, + 0.0015880379360169172 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1201554536819458, + "epoch": 55 + }, + { + "hidden_norms": [ + 276.9933166503906, + 253.379638671875, + 244.23390197753906, + 238.01930236816406, + 233.3076171875 + ], + "bp_grad_norms_per_sample_med": [ + 3.799827391048893e-05, + 4.017200990347192e-05, + 4.2665858927648515e-05, + 4.083341627847403e-05, + 3.210103386663832e-05 + ], + "bp_grad_norms_F": [ + 0.002064710482954979, + 0.0021362933330237865, + 0.0021728368010371923, + 0.0020478416699916124, + 0.0015873984666541219 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.1222728490829468, + "epoch": 56 + }, + { + "hidden_norms": [ + 276.41168212890625, + 251.91033935546875, + 241.81382751464844, + 234.8279266357422, + 230.53956604003906 + ], + "bp_grad_norms_per_sample_med": [ + 3.770063631236553e-05, + 3.94962407881394e-05, + 4.150882887188345e-05, + 4.040042040287517e-05, + 3.2475280022481456e-05 + ], + "bp_grad_norms_F": [ + 0.002123177284374833, + 0.0021965675987303257, + 0.00223328173160553, + 0.0020905195269733667, + 0.0016039537731558084 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.1091526746749878, + "epoch": 57 + }, + { + "hidden_norms": [ + 274.760986328125, + 250.0972442626953, + 239.511474609375, + 233.29798889160156, + 228.16070556640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.728809315362014e-05, + 4.0525967051507905e-05, + 4.239326517563313e-05, + 4.087138222530484e-05, + 3.216422919649631e-05 + ], + "bp_grad_norms_F": [ + 0.0021635335870087147, + 0.0022461507469415665, + 0.0022873859852552414, + 0.002144098049029708, + 0.001636566361412406 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6416015625, + "loss_eval": 1.1180500984191895, + "epoch": 58 + }, + { + "hidden_norms": [ + 273.91064453125, + 249.49452209472656, + 238.54373168945312, + 232.80734252929688, + 225.6833953857422 + ], + "bp_grad_norms_per_sample_med": [ + 3.966117583331652e-05, + 4.1986208088928834e-05, + 4.316144259064458e-05, + 4.332280877861194e-05, + 3.44519030477386e-05 + ], + "bp_grad_norms_F": [ + 0.0021825931034982204, + 0.0022617392241954803, + 0.0023092019837349653, + 0.00216560042463243, + 0.0016612708568572998 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.131789207458496, + "epoch": 59 + }, + { + "hidden_norms": [ + 274.90008544921875, + 250.0712127685547, + 238.57467651367188, + 231.15719604492188, + 225.55587768554688 + ], + "bp_grad_norms_per_sample_med": [ + 4.130819797865115e-05, + 4.363877815194428e-05, + 4.489632920012809e-05, + 4.4512398744700477e-05, + 3.470887531875633e-05 + ], + "bp_grad_norms_F": [ + 0.002240521367639303, + 0.002310203853994608, + 0.0023576009552925825, + 0.002204722724854946, + 0.0016799044096842408 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.1323366165161133, + "epoch": 60 + }, + { + "hidden_norms": [ + 275.4504699707031, + 249.5341796875, + 237.540283203125, + 230.39208984375, + 224.43321228027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.056218676851131e-05, + 4.288182390155271e-05, + 4.5818003854947165e-05, + 4.356648423708975e-05, + 3.492152245598845e-05 + ], + "bp_grad_norms_F": [ + 0.002249655080959201, + 0.0023316002916544676, + 0.002382595557719469, + 0.002231382764875889, + 0.00168902100995183 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1275749206542969, + "epoch": 61 + }, + { + "hidden_norms": [ + 273.6263122558594, + 248.43479919433594, + 234.8235321044922, + 228.0020751953125, + 222.4278106689453 + ], + "bp_grad_norms_per_sample_med": [ + 4.0597744373371825e-05, + 4.323143730289303e-05, + 4.647616151487455e-05, + 4.4688425987260416e-05, + 3.521826511132531e-05 + ], + "bp_grad_norms_F": [ + 0.002307126997038722, + 0.0023877634666860104, + 0.0024417925160378218, + 0.0022813305258750916, + 0.001714664394967258 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1252907514572144, + "epoch": 62 + }, + { + "hidden_norms": [ + 271.7508239746094, + 246.79209899902344, + 233.84280395507812, + 226.96934509277344, + 220.57888793945312 + ], + "bp_grad_norms_per_sample_med": [ + 4.177554728812538e-05, + 4.393904600874521e-05, + 4.635817458620295e-05, + 4.428510874276981e-05, + 3.396430111024529e-05 + ], + "bp_grad_norms_F": [ + 0.002355988370254636, + 0.0024527544155716896, + 0.0025022663176059723, + 0.0023387460969388485, + 0.0017370774876326323 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1249933242797852, + "epoch": 63 + }, + { + "hidden_norms": [ + 271.7035217285156, + 246.70675659179688, + 233.96661376953125, + 226.53175354003906, + 220.52359008789062 + ], + "bp_grad_norms_per_sample_med": [ + 4.2499312257859856e-05, + 4.503092714003287e-05, + 4.670799171435647e-05, + 4.5866876462241635e-05, + 3.720118911587633e-05 + ], + "bp_grad_norms_F": [ + 0.002408105880022049, + 0.0024944571778178215, + 0.002545328810811043, + 0.002381332218647003, + 0.0017641197191551328 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1418037414550781, + "epoch": 64 + }, + { + "hidden_norms": [ + 271.0970153808594, + 246.78770446777344, + 234.2436065673828, + 226.7012176513672, + 219.61680603027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.040581188746728e-05, + 4.3224725231993943e-05, + 4.4494401663541794e-05, + 4.3532105337362736e-05, + 3.4612559829838574e-05 + ], + "bp_grad_norms_F": [ + 0.0024068003986030817, + 0.002485552802681923, + 0.002538430504500866, + 0.002368941670283675, + 0.0017652952810749412 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1279454231262207, + "epoch": 65 + }, + { + "hidden_norms": [ + 270.66473388671875, + 244.8525390625, + 232.8356475830078, + 224.2222137451172, + 217.24554443359375 + ], + "bp_grad_norms_per_sample_med": [ + 4.1549992602085695e-05, + 4.493525193538517e-05, + 4.7448877012357116e-05, + 4.479651397559792e-05, + 3.5401590139372274e-05 + ], + "bp_grad_norms_F": [ + 0.002463088370859623, + 0.002551029436290264, + 0.002594881458207965, + 0.0024160456378012896, + 0.001803302438929677 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6376953125, + "loss_eval": 1.1330325603485107, + "epoch": 66 + }, + { + "hidden_norms": [ + 269.8645935058594, + 243.50497436523438, + 231.37692260742188, + 222.27967834472656, + 215.22059631347656 + ], + "bp_grad_norms_per_sample_med": [ + 4.1519095248077065e-05, + 4.487609476200305e-05, + 4.708006963483058e-05, + 4.4878328480990604e-05, + 3.578457108233124e-05 + ], + "bp_grad_norms_F": [ + 0.0024854058865457773, + 0.0025721373967826366, + 0.0026270432863384485, + 0.0024401266127824783, + 0.0018134783022105694 + ], + "gamma_dfa": NaN, + "acc_eval": 0.63671875, + "loss_eval": 1.123876690864563, + "epoch": 67 + }, + { + "hidden_norms": [ + 269.28570556640625, + 242.04359436035156, + 229.53497314453125, + 221.24327087402344, + 215.1306610107422 + ], + "bp_grad_norms_per_sample_med": [ + 4.279898348613642e-05, + 4.6176737669156864e-05, + 4.813459236174822e-05, + 4.609950337908231e-05, + 3.566763552953489e-05 + ], + "bp_grad_norms_F": [ + 0.0024860126432031393, + 0.002575797727331519, + 0.0026342689525336027, + 0.0024608916137367487, + 0.0018216874450445175 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.122079849243164, + "epoch": 68 + }, + { + "hidden_norms": [ + 268.3481140136719, + 242.3759765625, + 229.19241333007812, + 220.78233337402344, + 213.58587646484375 + ], + "bp_grad_norms_per_sample_med": [ + 4.163750054431148e-05, + 4.50872685178183e-05, + 4.8797548515722156e-05, + 4.597716542775743e-05, + 3.505409767967649e-05 + ], + "bp_grad_norms_F": [ + 0.0025033215060830116, + 0.002596172271296382, + 0.002654082840308547, + 0.002480126451700926, + 0.0018305372213944793 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6328125, + "loss_eval": 1.1238645315170288, + "epoch": 69 + }, + { + "hidden_norms": [ + 267.92425537109375, + 239.90985107421875, + 228.08212280273438, + 219.12835693359375, + 212.38052368164062 + ], + "bp_grad_norms_per_sample_med": [ + 4.42373457190115e-05, + 4.6515069698216394e-05, + 4.823393464903347e-05, + 4.762738535646349e-05, + 3.6444154829951e-05 + ], + "bp_grad_norms_F": [ + 0.0025684935972094536, + 0.002675230847671628, + 0.0027295781765133142, + 0.0025394319090992212, + 0.0018643162911757827 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.135793685913086, + "epoch": 70 + }, + { + "hidden_norms": [ + 266.2279052734375, + 239.37680053710938, + 226.3264923095703, + 218.04910278320312, + 210.68836975097656 + ], + "bp_grad_norms_per_sample_med": [ + 4.4824198994319886e-05, + 4.7638000978622586e-05, + 4.962517414242029e-05, + 4.7396664740517735e-05, + 3.5957502404926345e-05 + ], + "bp_grad_norms_F": [ + 0.002600227715447545, + 0.002714222064241767, + 0.002763595897704363, + 0.0025755097158253193, + 0.0018772372277453542 + ], + "gamma_dfa": NaN, + "acc_eval": 0.623046875, + "loss_eval": 1.123576283454895, + "epoch": 71 + }, + { + "hidden_norms": [ + 266.4837951660156, + 239.67581176757812, + 227.51805114746094, + 218.58811950683594, + 211.26596069335938 + ], + "bp_grad_norms_per_sample_med": [ + 4.245663512847386e-05, + 4.560768138617277e-05, + 4.797001020051539e-05, + 4.539322981145233e-05, + 3.4807548217941076e-05 + ], + "bp_grad_norms_F": [ + 0.0025984421372413635, + 0.002703956561163068, + 0.002762222196906805, + 0.002577459439635277, + 0.0018865292659029365 + ], + "gamma_dfa": NaN, + "acc_eval": 0.61328125, + "loss_eval": 1.1362444162368774, + "epoch": 72 + }, + { + "hidden_norms": [ + 264.8100891113281, + 237.96121215820312, + 226.14822387695312, + 217.3454132080078, + 208.98077392578125 + ], + "bp_grad_norms_per_sample_med": [ + 4.217765308567323e-05, + 4.603620618581772e-05, + 4.735886977869086e-05, + 4.5346474507823586e-05, + 3.594472218537703e-05 + ], + "bp_grad_norms_F": [ + 0.0026375274173915386, + 0.0027397233061492443, + 0.0028012648690491915, + 0.0026011927984654903, + 0.0018980697495862842 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6318359375, + "loss_eval": 1.1286330223083496, + "epoch": 73 + }, + { + "hidden_norms": [ + 264.8172302246094, + 238.0478057861328, + 225.0303497314453, + 217.1344757080078, + 209.569580078125 + ], + "bp_grad_norms_per_sample_med": [ + 4.242224895278923e-05, + 4.6696859499206766e-05, + 4.831598562304862e-05, + 4.5893459173385054e-05, + 3.54531584889628e-05 + ], + "bp_grad_norms_F": [ + 0.0026500027161091566, + 0.002760941395536065, + 0.0028223067056387663, + 0.0026202781591564417, + 0.001915424014441669 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1304678916931152, + "epoch": 74 + }, + { + "hidden_norms": [ + 264.7013854980469, + 237.4438018798828, + 225.43527221679688, + 216.18502807617188, + 208.08302307128906 + ], + "bp_grad_norms_per_sample_med": [ + 4.43761091446504e-05, + 4.801220347872004e-05, + 4.9817157560028136e-05, + 4.829527097172104e-05, + 3.73583534383215e-05 + ], + "bp_grad_norms_F": [ + 0.002686889609321952, + 0.0028029615059494972, + 0.002866453491151333, + 0.002669648267328739, + 0.0019349679350852966 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6240234375, + "loss_eval": 1.1350867748260498, + "epoch": 75 + }, + { + "hidden_norms": [ + 264.3004455566406, + 236.1824188232422, + 223.4772186279297, + 214.64682006835938, + 207.52272033691406 + ], + "bp_grad_norms_per_sample_med": [ + 4.3003376049455255e-05, + 4.6196739276638255e-05, + 4.8772617446957156e-05, + 4.7264005843317136e-05, + 3.6179160815663636e-05 + ], + "bp_grad_norms_F": [ + 0.0027191757690161467, + 0.0028310383204370737, + 0.0028950762934982777, + 0.002689448418095708, + 0.0019433586858212948 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.1378443241119385, + "epoch": 76 + }, + { + "hidden_norms": [ + 262.62811279296875, + 235.80126953125, + 222.7261199951172, + 213.42430114746094, + 205.99493408203125 + ], + "bp_grad_norms_per_sample_med": [ + 4.4399519538274035e-05, + 4.737091148854233e-05, + 4.900431667920202e-05, + 4.768445069203153e-05, + 3.608842962421477e-05 + ], + "bp_grad_norms_F": [ + 0.0027450472116470337, + 0.0028562990482896566, + 0.0029378861654549837, + 0.0027161173056811094, + 0.0019581648521125317 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6220703125, + "loss_eval": 1.137312889099121, + "epoch": 77 + }, + { + "hidden_norms": [ + 262.612060546875, + 235.62489318847656, + 222.1566925048828, + 212.93875122070312, + 205.24142456054688 + ], + "bp_grad_norms_per_sample_med": [ + 4.443951911525801e-05, + 4.7095887566683814e-05, + 4.906025424133986e-05, + 4.8352503654314205e-05, + 3.6001758417114615e-05 + ], + "bp_grad_norms_F": [ + 0.002745443256571889, + 0.002859732834622264, + 0.002942001214250922, + 0.002725319005548954, + 0.001969744684174657 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.126712441444397, + "epoch": 78 + }, + { + "hidden_norms": [ + 262.6611633300781, + 235.52174377441406, + 221.89093017578125, + 213.1799774169922, + 204.9930877685547 + ], + "bp_grad_norms_per_sample_med": [ + 4.5766752009512857e-05, + 4.834473293158226e-05, + 5.181043525226414e-05, + 4.826926306122914e-05, + 3.573719732230529e-05 + ], + "bp_grad_norms_F": [ + 0.0027218428440392017, + 0.002838012296706438, + 0.002919211983680725, + 0.0027209871914237738, + 0.001970200566574931 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62109375, + "loss_eval": 1.1352139711380005, + "epoch": 79 + }, + { + "hidden_norms": [ + 261.58856201171875, + 234.9381103515625, + 221.2636260986328, + 211.9308624267578, + 204.54647827148438 + ], + "bp_grad_norms_per_sample_med": [ + 4.5460306864697486e-05, + 4.857210296904668e-05, + 4.9856924306368455e-05, + 4.823243580176495e-05, + 3.731804099516012e-05 + ], + "bp_grad_norms_F": [ + 0.002767088357359171, + 0.0028805267065763474, + 0.0029621378052979708, + 0.00275496207177639, + 0.001986011164262891 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.134087324142456, + "epoch": 80 + }, + { + "hidden_norms": [ + 261.3812561035156, + 234.79383850097656, + 220.678955078125, + 211.66114807128906, + 203.9405517578125 + ], + "bp_grad_norms_per_sample_med": [ + 4.64644399471581e-05, + 5.052189590060152e-05, + 5.2927574870409444e-05, + 5.0570299208629876e-05, + 3.7252495530992746e-05 + ], + "bp_grad_norms_F": [ + 0.0027735778130590916, + 0.002885127207264304, + 0.0029686433263123035, + 0.002763227093964815, + 0.0019980284851044416 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.135728359222412, + "epoch": 81 + }, + { + "hidden_norms": [ + 261.2560729980469, + 233.66014099121094, + 220.25682067871094, + 211.13511657714844, + 203.18130493164062 + ], + "bp_grad_norms_per_sample_med": [ + 4.6268629375845194e-05, + 4.9701800890034065e-05, + 5.169105133973062e-05, + 5.069339385954663e-05, + 3.80978781322483e-05 + ], + "bp_grad_norms_F": [ + 0.0028223153203725815, + 0.0029419492930173874, + 0.0030234854202717543, + 0.002805375959724188, + 0.002015760401263833 + ], + "gamma_dfa": NaN, + "acc_eval": 0.619140625, + "loss_eval": 1.1317980289459229, + "epoch": 82 + }, + { + "hidden_norms": [ + 260.62255859375, + 233.12937927246094, + 219.89907836914062, + 210.4191436767578, + 202.494873046875 + ], + "bp_grad_norms_per_sample_med": [ + 4.5126867917133495e-05, + 4.8572586820228025e-05, + 5.1520797569537535e-05, + 4.971070302417502e-05, + 3.838812335743569e-05 + ], + "bp_grad_norms_F": [ + 0.0028271761257201433, + 0.002944816369563341, + 0.003029909450560808, + 0.0028170389123260975, + 0.002025141380727291 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6259765625, + "loss_eval": 1.1392892599105835, + "epoch": 83 + }, + { + "hidden_norms": [ + 260.0465393066406, + 232.27760314941406, + 218.845458984375, + 209.7770233154297, + 201.92831420898438 + ], + "bp_grad_norms_per_sample_med": [ + 4.730001455754973e-05, + 5.118208355270326e-05, + 5.1580365834524855e-05, + 4.936498589813709e-05, + 3.706002826220356e-05 + ], + "bp_grad_norms_F": [ + 0.0028656981885433197, + 0.002991823712363839, + 0.0030798574443906546, + 0.0028517318423837423, + 0.0020406947005540133 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.1393200159072876, + "epoch": 84 + }, + { + "hidden_norms": [ + 259.99285888671875, + 232.2432403564453, + 218.6685333251953, + 209.5802001953125, + 201.7836456298828 + ], + "bp_grad_norms_per_sample_med": [ + 4.4883607188239694e-05, + 4.9325379222864285e-05, + 5.1563201850512996e-05, + 4.9446705816080794e-05, + 3.641278817667626e-05 + ], + "bp_grad_norms_F": [ + 0.002843427937477827, + 0.0029685739427804947, + 0.0030620063189417124, + 0.0028350763022899628, + 0.0020346841774880886 + ], + "gamma_dfa": NaN, + "acc_eval": 0.625, + "loss_eval": 1.136763572692871, + "epoch": 85 + }, + { + "hidden_norms": [ + 259.7002868652344, + 232.1937713623047, + 218.6339569091797, + 209.42572021484375, + 201.48532104492188 + ], + "bp_grad_norms_per_sample_med": [ + 4.557083229883574e-05, + 5.006462743040174e-05, + 5.1964529120596126e-05, + 5.040188261773437e-05, + 3.70733359886799e-05 + ], + "bp_grad_norms_F": [ + 0.002866365248337388, + 0.0029951538890600204, + 0.0030862949788570404, + 0.0028592217713594437, + 0.002047886373475194 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.139750361442566, + "epoch": 86 + }, + { + "hidden_norms": [ + 259.22808837890625, + 232.3558807373047, + 218.42848205566406, + 209.1579132080078, + 201.5212860107422 + ], + "bp_grad_norms_per_sample_med": [ + 4.5765504182782024e-05, + 4.875436570728198e-05, + 5.104453521198593e-05, + 5.005718412576243e-05, + 3.675639891298488e-05 + ], + "bp_grad_norms_F": [ + 0.002878013998270035, + 0.003002135781571269, + 0.0030916042160242796, + 0.002861205255612731, + 0.0020479748491197824 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1344283819198608, + "epoch": 87 + }, + { + "hidden_norms": [ + 259.1551513671875, + 232.05300903320312, + 218.15708923339844, + 208.9161834716797, + 201.6800537109375 + ], + "bp_grad_norms_per_sample_med": [ + 4.611797339748591e-05, + 4.964259278494865e-05, + 5.252738264971413e-05, + 5.0600574468262494e-05, + 3.820879283011891e-05 + ], + "bp_grad_norms_F": [ + 0.0028855716809630394, + 0.003010405693203211, + 0.0031016215216368437, + 0.002874146681278944, + 0.0020545709412544966 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.135157823562622, + "epoch": 88 + }, + { + "hidden_norms": [ + 259.21893310546875, + 231.72747802734375, + 217.7665252685547, + 208.59022521972656, + 201.1155548095703 + ], + "bp_grad_norms_per_sample_med": [ + 4.6835561079205945e-05, + 5.060776311438531e-05, + 5.325842721504159e-05, + 5.128757766215131e-05, + 3.774667493416928e-05 + ], + "bp_grad_norms_F": [ + 0.002893448108807206, + 0.0030188425444066525, + 0.0031124993693083525, + 0.002883171197026968, + 0.002058332087472081 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6298828125, + "loss_eval": 1.1357543468475342, + "epoch": 89 + }, + { + "hidden_norms": [ + 258.88385009765625, + 230.9880828857422, + 217.33352661132812, + 208.3406524658203, + 200.54083251953125 + ], + "bp_grad_norms_per_sample_med": [ + 4.6940938773332164e-05, + 5.0942355301231146e-05, + 5.368283382267691e-05, + 5.184212204767391e-05, + 3.746367656276561e-05 + ], + "bp_grad_norms_F": [ + 0.0029224599711596966, + 0.0030530549120157957, + 0.003145798807963729, + 0.0029114321805536747, + 0.0020718672312796116 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.1398890018463135, + "epoch": 90 + }, + { + "hidden_norms": [ + 258.7764587402344, + 231.19357299804688, + 217.22779846191406, + 207.97528076171875, + 199.982421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.70306295028422e-05, + 5.185308327781968e-05, + 5.281997437123209e-05, + 5.1426530262688175e-05, + 3.7254685594234616e-05 + ], + "bp_grad_norms_F": [ + 0.002924826927483082, + 0.0030514320824295282, + 0.0031429482623934746, + 0.0029119658283889294, + 0.0020754521246999502 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.138663411140442, + "epoch": 91 + }, + { + "hidden_norms": [ + 258.7837829589844, + 230.58901977539062, + 217.062255859375, + 207.7244873046875, + 199.89395141601562 + ], + "bp_grad_norms_per_sample_med": [ + 4.688404078478925e-05, + 5.141457950230688e-05, + 5.3491079597733915e-05, + 5.087396493763663e-05, + 3.739634121302515e-05 + ], + "bp_grad_norms_F": [ + 0.0029230716172605753, + 0.0030518025159835815, + 0.0031419326551258564, + 0.002910938812419772, + 0.00207503535784781 + ], + "gamma_dfa": NaN, + "acc_eval": 0.626953125, + "loss_eval": 1.1365739107131958, + "epoch": 92 + }, + { + "hidden_norms": [ + 258.7561950683594, + 230.4254913330078, + 217.07546997070312, + 207.6160125732422, + 199.7816162109375 + ], + "bp_grad_norms_per_sample_med": [ + 4.680828351411037e-05, + 5.096250242786482e-05, + 5.211709503782913e-05, + 5.09246347064618e-05, + 3.779645703616552e-05 + ], + "bp_grad_norms_F": [ + 0.002931967144832015, + 0.0030605625361204147, + 0.00315046776086092, + 0.0029180829878896475, + 0.002077121753245592 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1363377571105957, + "epoch": 93 + }, + { + "hidden_norms": [ + 258.76409912109375, + 230.5386505126953, + 216.76475524902344, + 207.16859436035156, + 199.2827911376953 + ], + "bp_grad_norms_per_sample_med": [ + 4.749056097352877e-05, + 5.2020419389009476e-05, + 5.3769603255204856e-05, + 5.178397987037897e-05, + 3.789216498262249e-05 + ], + "bp_grad_norms_F": [ + 0.0029493479523807764, + 0.0030784173868596554, + 0.0031682881526649, + 0.0029316784348338842, + 0.002084067091345787 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6298828125, + "loss_eval": 1.1382873058319092, + "epoch": 94 + }, + { + "hidden_norms": [ + 258.7884826660156, + 230.40945434570312, + 216.70376586914062, + 207.1806182861328, + 199.41917419433594 + ], + "bp_grad_norms_per_sample_med": [ + 4.741501834359951e-05, + 5.169968062546104e-05, + 5.352263542590663e-05, + 5.053802306065336e-05, + 3.758866660064086e-05 + ], + "bp_grad_norms_F": [ + 0.002947731176391244, + 0.003076745430007577, + 0.0031680618412792683, + 0.0029321794863790274, + 0.0020845714025199413 + ], + "gamma_dfa": NaN, + "acc_eval": 0.630859375, + "loss_eval": 1.1382077932357788, + "epoch": 95 + }, + { + "hidden_norms": [ + 258.766845703125, + 230.38992309570312, + 216.7628173828125, + 207.26092529296875, + 199.36366271972656 + ], + "bp_grad_norms_per_sample_med": [ + 4.718741183751263e-05, + 5.1928480388596654e-05, + 5.3666040912503377e-05, + 5.089692058390938e-05, + 3.752821430680342e-05 + ], + "bp_grad_norms_F": [ + 0.002943811472505331, + 0.003073457395657897, + 0.0031646883580833673, + 0.0029298998415470123, + 0.002084212377667427 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.138296365737915, + "epoch": 96 + }, + { + "hidden_norms": [ + 258.8481140136719, + 230.38389587402344, + 216.7748260498047, + 207.24560546875, + 199.39401245117188 + ], + "bp_grad_norms_per_sample_med": [ + 4.728109706775285e-05, + 5.156427505426109e-05, + 5.3663239668821916e-05, + 5.139272616361268e-05, + 3.7748181057395414e-05 + ], + "bp_grad_norms_F": [ + 0.002947240835055709, + 0.003076959168538451, + 0.0031680231913924217, + 0.0029323517810553312, + 0.0020851469598710537 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1388041973114014, + "epoch": 97 + }, + { + "hidden_norms": [ + 258.77734375, + 230.3692626953125, + 216.7212677001953, + 207.1890869140625, + 199.34091186523438 + ], + "bp_grad_norms_per_sample_med": [ + 4.7204313887050375e-05, + 5.154019163455814e-05, + 5.373918611439876e-05, + 5.1062332204310223e-05, + 3.7904177588643506e-05 + ], + "bp_grad_norms_F": [ + 0.0029484080150723457, + 0.0030780842062085867, + 0.0031695417128503323, + 0.0029333126731216908, + 0.002085541607812047 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.138832688331604, + "epoch": 98 + }, + { + "hidden_norms": [ + 258.7897644042969, + 230.38552856445312, + 216.73997497558594, + 207.1963653564453, + 199.38656616210938 + ], + "bp_grad_norms_per_sample_med": [ + 4.726059705717489e-05, + 5.1730185077758506e-05, + 5.3854040743317455e-05, + 5.0960083171958104e-05, + 3.793121504713781e-05 + ], + "bp_grad_norms_F": [ + 0.00294809159822762, + 0.003077775239944458, + 0.003169153118506074, + 0.0029330949764698744, + 0.0020853858441114426 + ], + "gamma_dfa": NaN, + "acc_eval": 0.62890625, + "loss_eval": 1.1388249397277832, + "epoch": 99 + }, + { + "hidden_norms": [ + 258.7891845703125, + 230.38888549804688, + 216.73963928222656, + 207.19769287109375, + 199.4077606201172 + ], + "bp_grad_norms_per_sample_med": [ + 4.725577309727669e-05, + 5.174486432224512e-05, + 5.38085114385467e-05, + 5.098402107250877e-05, + 3.7933263229206204e-05 + ], + "bp_grad_norms_F": [ + 0.002948042470961809, + 0.0030777468346059322, + 0.003169137053191662, + 0.002933081705123186, + 0.0020853858441114426 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6279296875, + "loss_eval": 1.1387826204299927, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 8.737784385681152, + 8.813130378723145, + 8.844642639160156, + 8.889528274536133 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010079912608489394, + 0.0010035138111561537, + 0.0009970925748348236, + 0.0009936393471434712, + 0.000986678060144186 + ], + "bp_grad_norms_F": [ + 0.035574451088905334, + 0.035288579761981964, + 0.035048045217990875, + 0.0346725769340992, + 0.03439188003540039 + ], + "gamma_dfa": 0.0033523982419865206, + "acc_eval": 0.0927734375, + "loss_eval": 2.4863264560699463, + "epoch": 0 + }, + { + "hidden_norms": [ + 900.3377685546875, + 3463.92626953125, + 6660.5166015625, + 10478.5126953125, + 13466.513671875 + ], + "bp_grad_norms_per_sample_med": [ + 2.017142833210528e-06, + 7.972002435963077e-07, + 7.783806381667091e-07, + 7.758338256280695e-07, + 7.810436954969191e-07 + ], + "bp_grad_norms_F": [ + 0.00013047464017290622, + 7.321321754716337e-05, + 7.131113670766354e-05, + 7.113779429346323e-05, + 7.09498199285008e-05 + ], + "gamma_dfa": 0.1028625147882849, + "acc_eval": 0.2861328125, + "loss_eval": 1.970402717590332, + "epoch": 1 + }, + { + "hidden_norms": [ + 1784.805419921875, + 14085.2138671875, + 36523.9375, + 61422.50390625, + 73870.3359375 + ], + "bp_grad_norms_per_sample_med": [ + 9.087140711017128e-07, + 1.772240381114898e-07, + 1.705584367073243e-07, + 1.7156033038645546e-07, + 1.728751612972701e-07 + ], + "bp_grad_norms_F": [ + 4.7445286327274516e-05, + 1.1973520486208145e-05, + 9.698592293716501e-06, + 9.335580216429662e-06, + 9.154121471510734e-06 + ], + "gamma_dfa": 0.09588160619023256, + "acc_eval": 0.298828125, + "loss_eval": 1.9628738164901733, + "epoch": 2 + }, + { + "hidden_norms": [ + 2670.88134765625, + 35761.4921875, + 99927.7890625, + 170223.953125, + 201448.390625 + ], + "bp_grad_norms_per_sample_med": [ + 5.815078338855528e-07, + 7.772520405069372e-08, + 7.527528111950232e-08, + 7.557918735301428e-08, + 7.57173737042649e-08 + ], + "bp_grad_norms_F": [ + 2.8944486984983087e-05, + 3.2005805223889183e-06, + 2.6765355869429186e-06, + 2.639568720042007e-06, + 2.6436800908413716e-06 + ], + "gamma_dfa": 0.09442083747126162, + "acc_eval": 0.2900390625, + "loss_eval": 1.9821033477783203, + "epoch": 3 + }, + { + "hidden_norms": [ + 3506.001220703125, + 70233.9375, + 205054.078125, + 348792.375, + 416698.5625 + ], + "bp_grad_norms_per_sample_med": [ + 4.5228594558466284e-07, + 4.338783554658221e-08, + 4.114394869247917e-08, + 4.122260932604149e-08, + 4.124275321260029e-08 + ], + "bp_grad_norms_F": [ + 2.319143823115155e-05, + 1.7165241388283903e-06, + 1.3772670399703202e-06, + 1.3777447520624264e-06, + 1.3796359326079255e-06 + ], + "gamma_dfa": 0.09172606549691409, + "acc_eval": 0.298828125, + "loss_eval": 1.9661527872085571, + "epoch": 4 + }, + { + "hidden_norms": [ + 4351.04052734375, + 120982.0390625, + 361547.03125, + 633667.3125, + 764198.75 + ], + "bp_grad_norms_per_sample_med": [ + 3.632259790720127e-07, + 2.6118947005215887e-08, + 2.4913996199416033e-08, + 2.494128636953974e-08, + 2.4942012899487054e-08 + ], + "bp_grad_norms_F": [ + 1.894752676889766e-05, + 1.1090510270150844e-06, + 8.424218549407669e-07, + 8.403117703892349e-07, + 8.407336054006009e-07 + ], + "gamma_dfa": 0.08992433547973633, + "acc_eval": 0.2900390625, + "loss_eval": 1.980475664138794, + "epoch": 5 + }, + { + "hidden_norms": [ + 5174.9833984375, + 189817.0625, + 576763.3125, + 1012734.125, + 1235217.5 + ], + "bp_grad_norms_per_sample_med": [ + 3.340334444601467e-07, + 1.826493090106851e-08, + 1.7263264595612782e-08, + 1.730784759956805e-08, + 1.7305337607353977e-08 + ], + "bp_grad_norms_F": [ + 1.7139096598839387e-05, + 7.582453918075771e-07, + 5.794162802885694e-07, + 5.812879635413992e-07, + 5.813373604723893e-07 + ], + "gamma_dfa": 0.08752730302512646, + "acc_eval": 0.3056640625, + "loss_eval": 1.9696743488311768, + "epoch": 6 + }, + { + "hidden_norms": [ + 5963.3935546875, + 276686.75, + 861517.375, + 1555059.75, + 1913322.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.834741223978199e-07, + 1.3120247110975924e-08, + 1.2326365705916942e-08, + 1.2353129186237766e-08, + 1.2349524958210623e-08 + ], + "bp_grad_norms_F": [ + 1.4978587387304287e-05, + 5.169860628484457e-07, + 4.2094282548532647e-07, + 4.222391680741566e-07, + 4.222146685606276e-07 + ], + "gamma_dfa": 0.08884745300747454, + "acc_eval": 0.2919921875, + "loss_eval": 1.9592503309249878, + "epoch": 7 + }, + { + "hidden_norms": [ + 6751.1630859375, + 390990.65625, + 1268157.625, + 2303462.75, + 2850455.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.5272595394199016e-07, + 9.644952392307005e-09, + 9.213153795428752e-09, + 9.189856875480018e-09, + 9.217835383878992e-09 + ], + "bp_grad_norms_F": [ + 1.3214407772466075e-05, + 3.7820277043465467e-07, + 3.14011003865744e-07, + 3.1468064776163374e-07, + 3.146610936255456e-07 + ], + "gamma_dfa": 0.08774545323103666, + "acc_eval": 0.3115234375, + "loss_eval": 1.9636309146881104, + "epoch": 8 + }, + { + "hidden_norms": [ + 7557.10302734375, + 541741.25, + 1767146.375, + 3237576.25, + 4005094.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.3122942138797953e-07, + 7.519741274109037e-09, + 7.2226606917524805e-09, + 7.218183384338772e-09, + 7.221534037427091e-09 + ], + "bp_grad_norms_F": [ + 1.196970697492361e-05, + 2.9184533900661336e-07, + 2.4720966962377133e-07, + 2.4752529270699597e-07, + 2.4754368155299744e-07 + ], + "gamma_dfa": 0.08941872720606625, + "acc_eval": 0.2900390625, + "loss_eval": 1.9587393999099731, + "epoch": 9 + }, + { + "hidden_norms": [ + 8353.015625, + 720288.5625, + 2367034.25, + 4437438.5, + 5500873.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.1009967099416826e-07, + 6.096115612308495e-09, + 5.8281148795913396e-09, + 5.816529036195561e-09, + 5.823292070772368e-09 + ], + "bp_grad_norms_F": [ + 1.0853039384528529e-05, + 2.2833219759377243e-07, + 1.979581298883204e-07, + 1.9814572738141578e-07, + 1.9820384977720096e-07 + ], + "gamma_dfa": 0.09132041316479445, + "acc_eval": 0.2978515625, + "loss_eval": 1.9605882167816162, + "epoch": 10 + }, + { + "hidden_norms": [ + 9134.4443359375, + 924688.8125, + 3108971.25, + 5809310.0, + 7180875.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.9402843065563502e-07, + 4.977510403847418e-09, + 4.8141264308299014e-09, + 4.791541829973767e-09, + 4.794175723077387e-09 + ], + "bp_grad_norms_F": [ + 1.0063903573609423e-05, + 1.9364638603747153e-07, + 1.6622837506474752e-07, + 1.6636218447274587e-07, + 1.6641583044929575e-07 + ], + "gamma_dfa": 0.08994872949551791, + "acc_eval": 0.2822265625, + "loss_eval": 1.9717106819152832, + "epoch": 11 + }, + { + "hidden_norms": [ + 9934.0107421875, + 1171186.5, + 4059807.75, + 7477705.0, + 9248714.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.802942222184356e-07, + 4.213630333538276e-09, + 4.032348677185382e-09, + 4.031016409555832e-09, + 4.033940292913485e-09 + ], + "bp_grad_norms_F": [ + 9.375374247611035e-06, + 1.60658984782458e-07, + 1.398711617639492e-07, + 1.399746452079853e-07, + 1.4004145043600147e-07 + ], + "gamma_dfa": 0.09168496390338987, + "acc_eval": 0.2998046875, + "loss_eval": 1.9513648748397827, + "epoch": 12 + }, + { + "hidden_norms": [ + 10690.2216796875, + 1474348.375, + 5210694.5, + 9539616.0, + 11795722.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7011585384807404e-07, + 3.5948770626959003e-09, + 3.444458496204561e-09, + 3.439692752849055e-09, + 3.4398179860062328e-09 + ], + "bp_grad_norms_F": [ + 8.913790225051343e-06, + 1.346561759874021e-07, + 1.1880944583708697e-07, + 1.1887690476442003e-07, + 1.1894194784645151e-07 + ], + "gamma_dfa": 0.0931803259300068, + "acc_eval": 0.3134765625, + "loss_eval": 1.959463357925415, + "epoch": 13 + }, + { + "hidden_norms": [ + 11428.3076171875, + 1789460.25, + 6431273.0, + 11810251.0, + 14610525.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5823535193248972e-07, + 3.1298097447063356e-09, + 3.012203153573978e-09, + 3.010908633527265e-09, + 3.010648619294898e-09 + ], + "bp_grad_norms_F": [ + 8.233506378019229e-06, + 1.1668681310084139e-07, + 1.0298786889961775e-07, + 1.0303519104581937e-07, + 1.0309597797686365e-07 + ], + "gamma_dfa": 0.09336384548805654, + "acc_eval": 0.2861328125, + "loss_eval": 1.9515889883041382, + "epoch": 14 + }, + { + "hidden_norms": [ + 12175.4384765625, + 2177908.0, + 7886216.5, + 14475684.0, + 17927020.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5137742082060868e-07, + 2.705691448667835e-09, + 2.5981530260565933e-09, + 2.5995214869567462e-09, + 2.6000293029682098e-09 + ], + "bp_grad_norms_F": [ + 7.800716048222966e-06, + 1.0053086896277819e-07, + 8.984200405848242e-08, + 8.987952071493055e-08, + 8.993622913067156e-08 + ], + "gamma_dfa": 0.09357930033002049, + "acc_eval": 0.2978515625, + "loss_eval": 1.9580912590026855, + "epoch": 15 + }, + { + "hidden_norms": [ + 12918.6787109375, + 2622644.5, + 9573671.0, + 17460572.0, + 21682046.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.432233602827182e-07, + 2.359643591631766e-09, + 2.2714441438864696e-09, + 2.2688442236074025e-09, + 2.2694950363444377e-09 + ], + "bp_grad_norms_F": [ + 7.43454029361601e-06, + 8.846858889910436e-08, + 7.942762891843813e-08, + 7.945371294226788e-08, + 7.950914238108453e-08 + ], + "gamma_dfa": 0.09332277777139097, + "acc_eval": 0.30859375, + "loss_eval": 1.9656270742416382, + "epoch": 16 + }, + { + "hidden_norms": [ + 13676.931640625, + 3144179.5, + 11421599.0, + 20832254.0, + 25907438.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3402345189206244e-07, + 2.1064472388587774e-09, + 2.0263852817947736e-09, + 2.0199610872850826e-09, + 2.0222397090208233e-09 + ], + "bp_grad_norms_F": [ + 6.909830062795663e-06, + 7.773559929091789e-08, + 7.076827301943922e-08, + 7.077783692466255e-08, + 7.082799413637986e-08 + ], + "gamma_dfa": 0.0945073509356007, + "acc_eval": 0.296875, + "loss_eval": 1.9510960578918457, + "epoch": 17 + }, + { + "hidden_norms": [ + 14410.64453125, + 3691622.0, + 13302875.0, + 24659928.0, + 30700242.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2569752527724631e-07, + 1.8540845525549798e-09, + 1.8018908587436044e-09, + 1.8003264434796051e-09, + 1.802896276714705e-09 + ], + "bp_grad_norms_F": [ + 6.58303315503872e-06, + 6.894391191281102e-08, + 6.3350469758916e-08, + 6.336826174901944e-08, + 6.340740554833246e-08 + ], + "gamma_dfa": 0.09388192358892411, + "acc_eval": 0.30859375, + "loss_eval": 1.9456725120544434, + "epoch": 18 + }, + { + "hidden_norms": [ + 15102.634765625, + 4270070.0, + 15687016.0, + 28858048.0, + 35882240.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2314617947595252e-07, + 1.6925943979728686e-09, + 1.6383979728473719e-09, + 1.6367472932543592e-09, + 1.6394127166918793e-09 + ], + "bp_grad_norms_F": [ + 6.343140285025584e-06, + 6.240136940505181e-08, + 5.757489418556361e-08, + 5.7587019597349354e-08, + 5.7624333749117795e-08 + ], + "gamma_dfa": 0.09518493304494768, + "acc_eval": 0.302734375, + "loss_eval": 1.9497833251953125, + "epoch": 19 + }, + { + "hidden_norms": [ + 15809.6728515625, + 4913181.0, + 18109688.0, + 33281892.0, + 41436228.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1704661773137559e-07, + 1.533212445892218e-09, + 1.483607681151966e-09, + 1.4837684414459318e-09, + 1.4838255069093975e-09 + ], + "bp_grad_norms_F": [ + 6.079233116906835e-06, + 5.7217945936827164e-08, + 5.270470992968512e-08, + 5.2718213794378244e-08, + 5.2752689327917324e-08 + ], + "gamma_dfa": 0.09407007653499022, + "acc_eval": 0.2958984375, + "loss_eval": 1.961036205291748, + "epoch": 20 + }, + { + "hidden_norms": [ + 16522.783203125, + 5620503.0, + 20819020.0, + 38391960.0, + 47723272.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1146808986950418e-07, + 1.4118024527220996e-09, + 1.3678460586419305e-09, + 1.3669514409286876e-09, + 1.3668450815629285e-09 + ], + "bp_grad_norms_F": [ + 5.778397280664649e-06, + 5.162353389209784e-08, + 4.8153967924235985e-08, + 4.816252285877454e-08, + 4.8193449231348495e-08 + ], + "gamma_dfa": 0.09494083630852401, + "acc_eval": 0.2958984375, + "loss_eval": 1.9576481580734253, + "epoch": 21 + }, + { + "hidden_norms": [ + 17230.27734375, + 6437730.5, + 23789486.0, + 43960328.0, + 54569096.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0952022932997352e-07, + 1.2858689668604484e-09, + 1.246260317167014e-09, + 1.2462959553261044e-09, + 1.2484926426026277e-09 + ], + "bp_grad_norms_F": [ + 5.637425147142494e-06, + 4.732414282671016e-08, + 4.430494371376881e-08, + 4.431280586913999e-08, + 4.434128086927558e-08 + ], + "gamma_dfa": 0.09481688600499183, + "acc_eval": 0.2900390625, + "loss_eval": 1.9625442028045654, + "epoch": 22 + }, + { + "hidden_norms": [ + 17916.12890625, + 7217473.5, + 26969020.0, + 49888804.0, + 62010184.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.043977349013403e-07, + 1.1912204556097095e-09, + 1.159051632448893e-09, + 1.1590449711107453e-09, + 1.159014662022173e-09 + ], + "bp_grad_norms_F": [ + 5.385433269111672e-06, + 4.3334623001101136e-08, + 4.083162963297582e-08, + 4.0836408032873805e-08, + 4.0863898931320364e-08 + ], + "gamma_dfa": 0.0946647283853963, + "acc_eval": 0.2939453125, + "loss_eval": 1.9656811952590942, + "epoch": 23 + }, + { + "hidden_norms": [ + 18617.46875, + 8095365.0, + 30241864.0, + 56059896.0, + 69702984.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.001103129283365e-07, + 1.1034658742303805e-09, + 1.0674757744411068e-09, + 1.0666105776380164e-09, + 1.0677670969627684e-09 + ], + "bp_grad_norms_F": [ + 5.150916877028067e-06, + 3.999087283546032e-08, + 3.779740609388682e-08, + 3.780221291549424e-08, + 3.782682256314729e-08 + ], + "gamma_dfa": 0.09509630355751142, + "acc_eval": 0.296875, + "loss_eval": 1.9476948976516724, + "epoch": 24 + }, + { + "hidden_norms": [ + 19248.7890625, + 9047595.0, + 33634812.0, + 62495088.0, + 77796536.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.749370377676314e-08, + 1.0280801765460978e-09, + 9.980430926148642e-10, + 9.978470272287154e-10, + 9.990493987643845e-10 + ], + "bp_grad_norms_F": [ + 5.017087005398935e-06, + 3.7442834610601494e-08, + 3.536156611971819e-08, + 3.536548476290591e-08, + 3.538822213045023e-08 + ], + "gamma_dfa": 0.09479212731821463, + "acc_eval": 0.2861328125, + "loss_eval": 1.9604804515838623, + "epoch": 25 + }, + { + "hidden_norms": [ + 19902.470703125, + 10030725.0, + 37252656.0, + 69351704.0, + 86270768.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.411947843318558e-08, + 9.563448921667828e-10, + 9.361866837309663e-10, + 9.359075736625755e-10, + 9.361766917237446e-10 + ], + "bp_grad_norms_F": [ + 4.873440502706217e-06, + 3.4947159832654506e-08, + 3.313299146157078e-08, + 3.3137865784738096e-08, + 3.315915364510147e-08 + ], + "gamma_dfa": 0.09510701123508625, + "acc_eval": 0.2978515625, + "loss_eval": 1.9498941898345947, + "epoch": 26 + }, + { + "hidden_norms": [ + 20513.66796875, + 11086393.0, + 41223968.0, + 76828584.0, + 95694480.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.249640697817085e-08, + 9.003223166992314e-10, + 8.743661350507637e-10, + 8.736535939135592e-10, + 8.752278901624777e-10 + ], + "bp_grad_norms_F": [ + 4.75014485346037e-06, + 3.290759664764664e-08, + 3.1125043875590563e-08, + 3.1127818544973707e-08, + 3.11488683735206e-08 + ], + "gamma_dfa": 0.09552363055991009, + "acc_eval": 0.2841796875, + "loss_eval": 1.9527215957641602, + "epoch": 27 + }, + { + "hidden_norms": [ + 21161.345703125, + 12263719.0, + 45533684.0, + 84877296.0, + 105753224.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.900443049242313e-08, + 8.457264888406257e-10, + 8.261510919815862e-10, + 8.261567541190118e-10, + 8.276057061884501e-10 + ], + "bp_grad_norms_F": [ + 4.624974280886818e-06, + 3.0792985938887796e-08, + 2.9227694042788244e-08, + 2.9232776199705768e-08, + 2.9251353339532216e-08 + ], + "gamma_dfa": 0.09527035459177569, + "acc_eval": 0.2890625, + "loss_eval": 1.950648307800293, + "epoch": 28 + }, + { + "hidden_norms": [ + 21787.568359375, + 13358760.0, + 49723396.0, + 92840264.0, + 115901424.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.79872459336184e-08, + 8.034463094830357e-10, + 7.846168159630906e-10, + 7.837334670135476e-10, + 7.841179927581265e-10 + ], + "bp_grad_norms_F": [ + 4.530191290541552e-06, + 2.9184068495169413e-08, + 2.7723606521590227e-08, + 2.7726789753046432e-08, + 2.7744931685447227e-08 + ], + "gamma_dfa": 0.09598725114483386, + "acc_eval": 0.2919921875, + "loss_eval": 1.9504928588867188, + "epoch": 29 + }, + { + "hidden_norms": [ + 22378.34765625, + 14611837.0, + 54335560.0, + 101350864.0, + 126710488.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.497670478391228e-08, + 7.560595483013799e-10, + 7.353461728420996e-10, + 7.342743080229752e-10, + 7.348425756781296e-10 + ], + "bp_grad_norms_F": [ + 4.383283339848276e-06, + 2.7485034692631416e-08, + 2.6182895851434296e-08, + 2.618475392068831e-08, + 2.620201833281044e-08 + ], + "gamma_dfa": 0.09509110247017816, + "acc_eval": 0.2958984375, + "loss_eval": 1.9564056396484375, + "epoch": 30 + }, + { + "hidden_norms": [ + 22972.798828125, + 15931348.0, + 59291124.0, + 110237776.0, + 138020368.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.252197858382715e-08, + 7.193445838993284e-10, + 6.977300404109599e-10, + 6.966639487515636e-10, + 6.977723399081981e-10 + ], + "bp_grad_norms_F": [ + 4.255563453625655e-06, + 2.5971447215056287e-08, + 2.4833044065530885e-08, + 2.4835205891804435e-08, + 2.4851219748711628e-08 + ], + "gamma_dfa": 0.0951943755208049, + "acc_eval": 0.30859375, + "loss_eval": 1.9508299827575684, + "epoch": 31 + }, + { + "hidden_norms": [ + 23525.689453125, + 17283022.0, + 64234984.0, + 119317480.0, + 149347744.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.036072784989301e-08, + 6.884249836858203e-10, + 6.666004415123439e-10, + 6.656397100179845e-10, + 6.674217845059616e-10 + ], + "bp_grad_norms_F": [ + 4.212505245959619e-06, + 2.4864668546342727e-08, + 2.375563212808629e-08, + 2.3757841915994504e-08, + 2.3773273127858374e-08 + ], + "gamma_dfa": 0.09534151147818193, + "acc_eval": 0.294921875, + "loss_eval": 1.95639967918396, + "epoch": 32 + }, + { + "hidden_norms": [ + 24102.95703125, + 18811968.0, + 69193392.0, + 128823560.0, + 161700704.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.921565980950618e-08, + 6.526117424243694e-10, + 6.390621365426341e-10, + 6.381262185328751e-10, + 6.384171524764781e-10 + ], + "bp_grad_norms_F": [ + 4.09630820286111e-06, + 2.3687046990517047e-08, + 2.2686869272092736e-08, + 2.2687553169475905e-08, + 2.2702355551018627e-08 + ], + "gamma_dfa": 0.0947199320216896, + "acc_eval": 0.2880859375, + "loss_eval": 1.960526943206787, + "epoch": 33 + }, + { + "hidden_norms": [ + 24687.955078125, + 20313542.0, + 74389296.0, + 138258576.0, + 173791248.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.937118340350935e-08, + 6.360312831965587e-10, + 6.205357339084117e-10, + 6.196035906569364e-10, + 6.196675395031548e-10 + ], + "bp_grad_norms_F": [ + 4.070574505021796e-06, + 2.2864428572688666e-08, + 2.1894738466698982e-08, + 2.1895061763643753e-08, + 2.1909569269951135e-08 + ], + "gamma_dfa": 0.09556430295924656, + "acc_eval": 0.2822265625, + "loss_eval": 1.97263765335083, + "epoch": 34 + }, + { + "hidden_norms": [ + 25226.55078125, + 21851366.0, + 80000824.0, + 148574480.0, + 186595952.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.592127104771862e-08, + 6.044152955908544e-10, + 5.892630272619215e-10, + 5.896260146798227e-10, + 5.900769872724254e-10 + ], + "bp_grad_norms_F": [ + 3.966818894696189e-06, + 2.1824051898988728e-08, + 2.093374718015184e-08, + 2.093443285389185e-08, + 2.0947767964685227e-08 + ], + "gamma_dfa": 0.09587649442255497, + "acc_eval": 0.298828125, + "loss_eval": 1.9495991468429565, + "epoch": 35 + }, + { + "hidden_norms": [ + 25759.50390625, + 23391128.0, + 85561480.0, + 158667136.0, + 198961760.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.493858333873504e-08, + 5.860726903783586e-10, + 5.731417562770957e-10, + 5.733850616529423e-10, + 5.73569580719635e-10 + ], + "bp_grad_norms_F": [ + 3.896147973136976e-06, + 2.099926454945944e-08, + 2.0218029916918567e-08, + 2.0218159590967844e-08, + 2.0230830344303286e-08 + ], + "gamma_dfa": 0.09563440945930779, + "acc_eval": 0.294921875, + "loss_eval": 1.954901099205017, + "epoch": 36 + }, + { + "hidden_norms": [ + 26267.0859375, + 25111884.0, + 91593392.0, + 169479968.0, + 212491408.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.387680511783401e-08, + 5.612941222921108e-10, + 5.475105369079358e-10, + 5.468157038279742e-10, + 5.479569020749864e-10 + ], + "bp_grad_norms_F": [ + 3.838411430479027e-06, + 2.0261547106770195e-08, + 1.9493551661753372e-08, + 1.949278782831243e-08, + 1.9505332460312275e-08 + ], + "gamma_dfa": 0.09528586096712388, + "acc_eval": 0.302734375, + "loss_eval": 1.9556396007537842, + "epoch": 37 + }, + { + "hidden_norms": [ + 26761.587890625, + 26706742.0, + 97554944.0, + 180407616.0, + 226265728.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.260722156843258e-08, + 5.407673198121188e-10, + 5.32608401826451e-10, + 5.31698407524317e-10, + 5.328552044048251e-10 + ], + "bp_grad_norms_F": [ + 3.7372303722804645e-06, + 1.9519287519642603e-08, + 1.8807236656925852e-08, + 1.8806394663783976e-08, + 1.8818212765836506e-08 + ], + "gamma_dfa": 0.09491665422683582, + "acc_eval": 0.2890625, + "loss_eval": 1.963973879814148, + "epoch": 38 + }, + { + "hidden_norms": [ + 27302.328125, + 28336562.0, + 103781320.0, + 191401696.0, + 240130064.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.187927053564636e-08, + 5.305865746763061e-10, + 5.205576525391109e-10, + 5.20661624925367e-10, + 5.217564713611011e-10 + ], + "bp_grad_norms_F": [ + 3.734877054739627e-06, + 1.88775892695503e-08, + 1.8220953634795478e-08, + 1.8220212893993448e-08, + 1.8231482101782603e-08 + ], + "gamma_dfa": 0.0957885464449646, + "acc_eval": 0.302734375, + "loss_eval": 1.9604723453521729, + "epoch": 39 + }, + { + "hidden_norms": [ + 27801.44140625, + 30051226.0, + 109945288.0, + 203002704.0, + 254881776.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.894305215610075e-08, + 5.044222262107212e-10, + 4.932855790507062e-10, + 4.934126440758746e-10, + 4.940316489232544e-10 + ], + "bp_grad_norms_F": [ + 3.610647127061384e-06, + 1.8150354108570355e-08, + 1.753623024569606e-08, + 1.7534704355171016e-08, + 1.7545806585417267e-08 + ], + "gamma_dfa": 0.09517717303242534, + "acc_eval": 0.2958984375, + "loss_eval": 1.9589688777923584, + "epoch": 40 + }, + { + "hidden_norms": [ + 28266.703125, + 31897594.0, + 116263888.0, + 215162448.0, + 270215296.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.807566421684896e-08, + 4.835814526593651e-10, + 4.775287942848649e-10, + 4.773109685274335e-10, + 4.784843632421598e-10 + ], + "bp_grad_norms_F": [ + 3.590413371057366e-06, + 1.7596850199197434e-08, + 1.705259222717359e-08, + 1.7050926004458233e-08, + 1.7061644541627174e-08 + ], + "gamma_dfa": 0.0961545761092566, + "acc_eval": 0.30859375, + "loss_eval": 1.9595096111297607, + "epoch": 41 + }, + { + "hidden_norms": [ + 28755.66015625, + 33582328.0, + 122605680.0, + 226378480.0, + 284438688.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.689399612014313e-08, + 4.746543713629592e-10, + 4.678599174745557e-10, + 4.68083238835959e-10, + 4.683119447790318e-10 + ], + "bp_grad_norms_F": [ + 3.5121436212648405e-06, + 1.7124380136124273e-08, + 1.6555107507087996e-08, + 1.655343240258844e-08, + 1.656368908697914e-08 + ], + "gamma_dfa": 0.09569378412561491, + "acc_eval": 0.287109375, + "loss_eval": 1.9612011909484863, + "epoch": 42 + }, + { + "hidden_norms": [ + 29227.5703125, + 35443612.0, + 129229904.0, + 238040368.0, + 299000064.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.582912703834154e-08, + 4.575871348500016e-10, + 4.493441174702184e-10, + 4.48520082185766e-10, + 4.485415650012925e-10 + ], + "bp_grad_norms_F": [ + 3.4321058137720684e-06, + 1.6602150765265833e-08, + 1.6083028242519504e-08, + 1.6080972997656318e-08, + 1.609118882583971e-08 + ], + "gamma_dfa": 0.09606127908773487, + "acc_eval": 0.306640625, + "loss_eval": 1.9551353454589844, + "epoch": 43 + }, + { + "hidden_norms": [ + 29665.798828125, + 37243032.0, + 135839760.0, + 250377328.0, + 314433920.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.588776813032382e-08, + 4.4936304677278827e-10, + 4.4115311403913893e-10, + 4.406963405312325e-10, + 4.4055534220710513e-10 + ], + "bp_grad_norms_F": [ + 3.3984799756581197e-06, + 1.6157997606569552e-08, + 1.564128204734061e-08, + 1.5638891071034777e-08, + 1.564865925729464e-08 + ], + "gamma_dfa": 0.09547593681054423, + "acc_eval": 0.2900390625, + "loss_eval": 1.9503705501556396, + "epoch": 44 + }, + { + "hidden_norms": [ + 30096.123046875, + 39014544.0, + 141817168.0, + 261217760.0, + 328197248.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.549055342475185e-08, + 4.3991607578952596e-10, + 4.348142956800416e-10, + 4.3428130536149467e-10, + 4.349899329625373e-10 + ], + "bp_grad_norms_F": [ + 3.382166596566094e-06, + 1.5776649320287106e-08, + 1.5299850275596327e-08, + 1.5297549893489304e-08, + 1.5307026757227504e-08 + ], + "gamma_dfa": 0.09610002994304523, + "acc_eval": 0.2998046875, + "loss_eval": 1.952854037284851, + "epoch": 45 + }, + { + "hidden_norms": [ + 30554.974609375, + 40873780.0, + 148087312.0, + 272436128.0, + 342258336.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.514299855098216e-08, + 4.291983157767021e-10, + 4.228755678958862e-10, + 4.2251957488304015e-10, + 4.227345695717588e-10 + ], + "bp_grad_norms_F": [ + 3.3793355669331504e-06, + 1.5485536408732514e-08, + 1.4993654318118388e-08, + 1.499121538017789e-08, + 1.5000590991576246e-08 + ], + "gamma_dfa": 0.09557013235462364, + "acc_eval": 0.3017578125, + "loss_eval": 1.9633105993270874, + "epoch": 46 + }, + { + "hidden_norms": [ + 30981.4765625, + 42548124.0, + 153904848.0, + 283882112.0, + 356627616.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.343542224840348e-08, + 4.1842326825580756e-10, + 4.139384113255318e-10, + 4.141494092113618e-10, + 4.1477912771092917e-10 + ], + "bp_grad_norms_F": [ + 3.3046233056666097e-06, + 1.508391989091251e-08, + 1.4620022525946297e-08, + 1.4617588028897899e-08, + 1.462664656060042e-08 + ], + "gamma_dfa": 0.09567815247282851, + "acc_eval": 0.296875, + "loss_eval": 1.958325982093811, + "epoch": 47 + }, + { + "hidden_norms": [ + 31383.2578125, + 44333160.0, + 160058736.0, + 295685184.0, + 371288096.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.18988522660402e-08, + 4.057836289206307e-10, + 4.0004452528386025e-10, + 3.9987613220660023e-10, + 4.004964138104583e-10 + ], + "bp_grad_norms_F": [ + 3.2255043151963037e-06, + 1.4663311453944061e-08, + 1.4252069746589768e-08, + 1.424969386931707e-08, + 1.4258660918642363e-08 + ], + "gamma_dfa": 0.09609431066201068, + "acc_eval": 0.302734375, + "loss_eval": 1.9508600234985352, + "epoch": 48 + }, + { + "hidden_norms": [ + 31750.03125, + 46204072.0, + 166757840.0, + 307620864.0, + 385856832.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.133605978675405e-08, + 3.9670436380312424e-10, + 3.904292722456404e-10, + 3.9002356899686674e-10, + 3.9039230181892037e-10 + ], + "bp_grad_norms_F": [ + 3.2063508115243167e-06, + 1.4354414545891814e-08, + 1.3938280751801813e-08, + 1.3935605558401676e-08, + 1.394456727865645e-08 + ], + "gamma_dfa": 0.09565898558139452, + "acc_eval": 0.310546875, + "loss_eval": 1.9467211961746216, + "epoch": 49 + }, + { + "hidden_norms": [ + 32133.1484375, + 47907484.0, + 173083168.0, + 319475424.0, + 400677984.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.030914079246941e-08, + 3.8645733835274143e-10, + 3.81215115030642e-10, + 3.812981042017327e-10, + 3.811861937208505e-10 + ], + "bp_grad_norms_F": [ + 3.177025973855052e-06, + 1.4072985443647212e-08, + 1.368274382684831e-08, + 1.3679918531295243e-08, + 1.368857649453048e-08 + ], + "gamma_dfa": 0.09606298332801089, + "acc_eval": 0.30078125, + "loss_eval": 1.9524433612823486, + "epoch": 50 + }, + { + "hidden_norms": [ + 32483.716796875, + 49794588.0, + 179046160.0, + 330962240.0, + 414954912.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.051003254015086e-08, + 3.794887737385011e-10, + 3.751928767670165e-10, + 3.752734789586043e-10, + 3.7574471312140645e-10 + ], + "bp_grad_norms_F": [ + 3.154751766487607e-06, + 1.3766489281863414e-08, + 1.339402011524271e-08, + 1.3391274755747418e-08, + 1.3399712450734569e-08 + ], + "gamma_dfa": 0.09573800596626825, + "acc_eval": 0.3046875, + "loss_eval": 1.952356219291687, + "epoch": 51 + }, + { + "hidden_norms": [ + 32825.296875, + 51662352.0, + 185889568.0, + 343223360.0, + 430225696.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.9168662858155585e-08, + 3.7636679883767954e-10, + 3.7184264001233203e-10, + 3.7154498921943e-10, + 3.7157116272723556e-10 + ], + "bp_grad_norms_F": [ + 3.0909043289284455e-06, + 1.346105005239906e-08, + 1.3102917861829155e-08, + 1.3100156515122308e-08, + 1.3108366836434016e-08 + ], + "gamma_dfa": 0.09539097778178984, + "acc_eval": 0.291015625, + "loss_eval": 1.9585516452789307, + "epoch": 52 + }, + { + "hidden_norms": [ + 33148.9453125, + 53487464.0, + 192413680.0, + 354830112.0, + 444651488.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.949418024897568e-08, + 3.692673389288359e-10, + 3.6510769407804844e-10, + 3.6480282683548637e-10, + 3.65057900575394e-10 + ], + "bp_grad_norms_F": [ + 3.0807416351308348e-06, + 1.3205962545725924e-08, + 1.2856014031115137e-08, + 1.2853148767533185e-08, + 1.2861222309368259e-08 + ], + "gamma_dfa": 0.09566472223013989, + "acc_eval": 0.2880859375, + "loss_eval": 1.9538320302963257, + "epoch": 53 + }, + { + "hidden_norms": [ + 33465.359375, + 55258308.0, + 198680688.0, + 365875680.0, + 458634560.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.9228732141036744e-08, + 3.640579226971141e-10, + 3.6045816331764513e-10, + 3.6029040861862427e-10, + 3.6025293859154317e-10 + ], + "bp_grad_norms_F": [ + 3.058711854464491e-06, + 1.294814744312589e-08, + 1.2619584488504643e-08, + 1.2616848898971966e-08, + 1.2624772338654111e-08 + ], + "gamma_dfa": 0.09607254836737411, + "acc_eval": 0.2998046875, + "loss_eval": 1.9489495754241943, + "epoch": 54 + }, + { + "hidden_norms": [ + 33763.53125, + 56920656.0, + 204554208.0, + 376681216.0, + 472155680.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.756867338391203e-08, + 3.4894195866108646e-10, + 3.4671995829960167e-10, + 3.464649955819965e-10, + 3.4666045034548176e-10 + ], + "bp_grad_norms_F": [ + 3.092292217843351e-06, + 1.2733584853208413e-08, + 1.2427238793577544e-08, + 1.2424394846277664e-08, + 1.2432122886707475e-08 + ], + "gamma_dfa": 0.09629741777825984, + "acc_eval": 0.3017578125, + "loss_eval": 1.9477816820144653, + "epoch": 55 + }, + { + "hidden_norms": [ + 34061.03125, + 58650568.0, + 210577584.0, + 387585472.0, + 485747168.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.70959208801014e-08, + 3.4928168690662176e-10, + 3.46003392603933e-10, + 3.4562114281655454e-10, + 3.4606426058125805e-10 + ], + "bp_grad_norms_F": [ + 3.178826091243536e-06, + 1.2512856528701377e-08, + 1.2208544397651622e-08, + 1.2205639166040783e-08, + 1.2213387634574246e-08 + ], + "gamma_dfa": 0.09542209599749185, + "acc_eval": 0.3046875, + "loss_eval": 1.9549853801727295, + "epoch": 56 + }, + { + "hidden_norms": [ + 34344.76171875, + 60294200.0, + 216821792.0, + 398493824.0, + 499371840.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.7367511629990986e-08, + 3.416208427253764e-10, + 3.378898272288211e-10, + 3.377436663676292e-10, + 3.386138314187548e-10 + ], + "bp_grad_norms_F": [ + 3.2603361432848033e-06, + 1.2295201301526504e-08, + 1.2022674411582557e-08, + 1.2019833128817936e-08, + 1.2027326690144946e-08 + ], + "gamma_dfa": 0.09621504079404986, + "acc_eval": 0.294921875, + "loss_eval": 1.9597327709197998, + "epoch": 57 + }, + { + "hidden_norms": [ + 34621.87109375, + 62004936.0, + 222707536.0, + 409299680.0, + 512662208.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.6534943837505125e-08, + 3.356194766546139e-10, + 3.3068575655548216e-10, + 3.3087257933495096e-10, + 3.3104252672444545e-10 + ], + "bp_grad_norms_F": [ + 3.325955731270369e-06, + 1.2073825494951507e-08, + 1.1812358202689666e-08, + 1.1809524025352403e-08, + 1.1816909228912209e-08 + ], + "gamma_dfa": 0.09621665377926547, + "acc_eval": 0.3017578125, + "loss_eval": 1.9411261081695557, + "epoch": 58 + }, + { + "hidden_norms": [ + 34892.69921875, + 63619864.0, + 228332912.0, + 419524224.0, + 525474048.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.6131870707076814e-08, + 3.3116545616884707e-10, + 3.281262206389357e-10, + 3.2806185545908306e-10, + 3.281940552657403e-10 + ], + "bp_grad_norms_F": [ + 3.306513235656894e-06, + 1.1909767394513437e-08, + 1.165356344756674e-08, + 1.1650684861308491e-08, + 1.1658000786951561e-08 + ], + "gamma_dfa": 0.09604647590094828, + "acc_eval": 0.30078125, + "loss_eval": 1.9494699239730835, + "epoch": 59 + }, + { + "hidden_norms": [ + 35134.12890625, + 65285940.0, + 233831760.0, + 429654048.0, + 537931904.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.542536740676951e-08, + 3.2549649087165733e-10, + 3.224807365587168e-10, + 3.2198288479889925e-10, + 3.2189514942437825e-10 + ], + "bp_grad_norms_F": [ + 3.2077998639579164e-06, + 1.1713971126425804e-08, + 1.1479991179896842e-08, + 1.147721562233528e-08, + 1.1484392992144876e-08 + ], + "gamma_dfa": 0.09610223810159368, + "acc_eval": 0.298828125, + "loss_eval": 1.947687029838562, + "epoch": 60 + }, + { + "hidden_norms": [ + 35383.89453125, + 66896316.0, + 239557328.0, + 439032672.0, + 549329344.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.55890657949476e-08, + 3.2204855449080583e-10, + 3.1836161484832814e-10, + 3.185524344306856e-10, + 3.1883792828146795e-10 + ], + "bp_grad_norms_F": [ + 3.19811397275771e-06, + 1.1587792059231106e-08, + 1.1364262419988336e-08, + 1.1361324325775968e-08, + 1.1368459951199839e-08 + ], + "gamma_dfa": 0.09620415412791772, + "acc_eval": 0.3046875, + "loss_eval": 1.9550621509552002, + "epoch": 61 + }, + { + "hidden_norms": [ + 35603.75390625, + 68393976.0, + 244906672.0, + 448738336.0, + 561222784.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.4847117070266904e-08, + 3.208481536010055e-10, + 3.1700905789300293e-10, + 3.1679742162893376e-10, + 3.169834394967097e-10 + ], + "bp_grad_norms_F": [ + 3.1413667329616146e-06, + 1.1423910706298557e-08, + 1.1206890526693769e-08, + 1.1204000394116065e-08, + 1.1211046313519546e-08 + ], + "gamma_dfa": 0.09554143912100699, + "acc_eval": 0.302734375, + "loss_eval": 1.9572508335113525, + "epoch": 62 + }, + { + "hidden_norms": [ + 35840.75, + 69909448.0, + 249732624.0, + 457790144.0, + 572499584.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.482150200464275e-08, + 3.132541726014182e-10, + 3.1085201079861235e-10, + 3.1094149477439714e-10, + 3.1132280087220465e-10 + ], + "bp_grad_norms_F": [ + 3.1111580938159022e-06, + 1.1274166489272375e-08, + 1.1068144623038734e-08, + 1.1065306892987792e-08, + 1.1072265770906142e-08 + ], + "gamma_dfa": 0.09598036286843126, + "acc_eval": 0.2939453125, + "loss_eval": 1.9514048099517822, + "epoch": 63 + }, + { + "hidden_norms": [ + 36044.14453125, + 71301840.0, + 254043168.0, + 466339968.0, + 583323328.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.41697069422753e-08, + 3.088812261520246e-10, + 3.0549318630335165e-10, + 3.051613683968668e-10, + 3.050981411956144e-10 + ], + "bp_grad_norms_F": [ + 3.063583790208213e-06, + 1.1131353616633533e-08, + 1.0936378025405702e-08, + 1.0933466576545925e-08, + 1.0940373940115933e-08 + ], + "gamma_dfa": 0.09560732997124433, + "acc_eval": 0.3076171875, + "loss_eval": 1.9496949911117554, + "epoch": 64 + }, + { + "hidden_norms": [ + 36240.3046875, + 72753064.0, + 259111488.0, + 475471840.0, + 594591872.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.367900612895937e-08, + 3.0714322751812517e-10, + 3.043856555695612e-10, + 3.04040070897571e-10, + 3.043043039774318e-10 + ], + "bp_grad_norms_F": [ + 3.096502268817858e-06, + 1.1002981636920595e-08, + 1.0808172135057248e-08, + 1.0805252692591694e-08, + 1.0812099660029162e-08 + ], + "gamma_dfa": 0.09588889799488243, + "acc_eval": 0.2978515625, + "loss_eval": 1.951111078262329, + "epoch": 65 + }, + { + "hidden_norms": [ + 36427.96484375, + 74044192.0, + 263715872.0, + 483414560.0, + 604480512.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.3715726977543454e-08, + 3.022930794571721e-10, + 2.992986969374556e-10, + 2.9908994725325044e-10, + 2.9924074329557016e-10 + ], + "bp_grad_norms_F": [ + 3.0333421818795614e-06, + 1.0890616408687492e-08, + 1.0706762587631147e-08, + 1.0703858244198727e-08, + 1.071066169089363e-08 + ], + "gamma_dfa": 0.09630945282333414, + "acc_eval": 0.30078125, + "loss_eval": 1.949332594871521, + "epoch": 66 + }, + { + "hidden_norms": [ + 36613.015625, + 75303768.0, + 267802576.0, + 490809920.0, + 613719616.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.348211473688025e-08, + 3.012197435925401e-10, + 2.9878169383046327e-10, + 2.9841951132425493e-10, + 2.984068825373498e-10 + ], + "bp_grad_norms_F": [ + 3.008998646691907e-06, + 1.0781116444036343e-08, + 1.0603616651394532e-08, + 1.0600682998074262e-08, + 1.0607434930420823e-08 + ], + "gamma_dfa": 0.0960872639734589, + "acc_eval": 0.310546875, + "loss_eval": 1.9464266300201416, + "epoch": 67 + }, + { + "hidden_norms": [ + 36784.2265625, + 76478576.0, + 271792224.0, + 498011968.0, + 622710336.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.403291680750044e-08, + 3.0129157502223336e-10, + 2.977850743768329e-10, + 2.975975854635493e-10, + 2.9797145306709183e-10 + ], + "bp_grad_norms_F": [ + 2.9997727324371226e-06, + 1.0701310948491027e-08, + 1.052768094922385e-08, + 1.0524773941256171e-08, + 1.0531463701113353e-08 + ], + "gamma_dfa": 0.09624087948759552, + "acc_eval": 0.2939453125, + "loss_eval": 1.9560136795043945, + "epoch": 68 + }, + { + "hidden_norms": [ + 36953.8671875, + 77622176.0, + 275419712.0, + 504592704.0, + 630923392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.3204310290766443e-08, + 2.9739929963135125e-10, + 2.9424951364376284e-10, + 2.9405439194718497e-10, + 2.94715835069681e-10 + ], + "bp_grad_norms_F": [ + 2.95851918963308e-06, + 1.0595774924127e-08, + 1.0427880781094245e-08, + 1.042505370918434e-08, + 1.0431726593651547e-08 + ], + "gamma_dfa": 0.09637677710998105, + "acc_eval": 0.2978515625, + "loss_eval": 1.950129747390747, + "epoch": 69 + }, + { + "hidden_norms": [ + 37103.0546875, + 78713944.0, + 279082240.0, + 511376384.0, + 639270976.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.3287564583115454e-08, + 2.9558042125010786e-10, + 2.94046592630437e-10, + 2.936023091315576e-10, + 2.9353278141464045e-10 + ], + "bp_grad_norms_F": [ + 2.9398986498563318e-06, + 1.0504810354916572e-08, + 1.034081797968156e-08, + 1.0337980249630618e-08, + 1.0344593626143705e-08 + ], + "gamma_dfa": 0.09638382289995207, + "acc_eval": 0.29296875, + "loss_eval": 1.9502758979797363, + "epoch": 70 + }, + { + "hidden_norms": [ + 37248.1015625, + 79737480.0, + 282511072.0, + 517720224.0, + 647238976.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.260229585246634e-08, + 2.899096518405031e-10, + 2.8717414557455356e-10, + 2.8704966181791747e-10, + 2.871551885164081e-10 + ], + "bp_grad_norms_F": [ + 2.9307011573109776e-06, + 1.0423523377767197e-08, + 1.0264206373733487e-08, + 1.0261346439222052e-08, + 1.0267889649639983e-08 + ], + "gamma_dfa": 0.0963258501906239, + "acc_eval": 0.3017578125, + "loss_eval": 1.949232816696167, + "epoch": 71 + }, + { + "hidden_norms": [ + 37381.0390625, + 80657776.0, + 285833920.0, + 523738208.0, + 654706368.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.2669339112298985e-08, + 2.929272380214343e-10, + 2.8994415202099333e-10, + 2.898675188767186e-10, + 2.900694684448979e-10 + ], + "bp_grad_norms_F": [ + 2.912831860157894e-06, + 1.0341300260563457e-08, + 1.018425699328418e-08, + 1.0181377518847512e-08, + 1.0187909182945987e-08 + ], + "gamma_dfa": 0.09613002402329585, + "acc_eval": 0.2958984375, + "loss_eval": 1.9482614994049072, + "epoch": 72 + }, + { + "hidden_norms": [ + 37505.28515625, + 81612512.0, + 289044000.0, + 529475296.0, + 661837376.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.200942965188915e-08, + 2.875680804592662e-10, + 2.8434027354862224e-10, + 2.8415880759524725e-10, + 2.840882251664567e-10 + ], + "bp_grad_norms_F": [ + 2.9117632038833108e-06, + 1.0266585803719863e-08, + 1.0111568471415922e-08, + 1.0108765380323348e-08, + 1.0115227766505086e-08 + ], + "gamma_dfa": 0.09620579873444512, + "acc_eval": 0.2958984375, + "loss_eval": 1.949747085571289, + "epoch": 73 + }, + { + "hidden_norms": [ + 37622.05078125, + 82508960.0, + 292035424.0, + 534928544.0, + 668760064.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.211632014834322e-08, + 2.8521121575586506e-10, + 2.8250474182200946e-10, + 2.822122813217476e-10, + 2.8265498275281686e-10 + ], + "bp_grad_norms_F": [ + 2.9012180675636046e-06, + 1.0211213208322079e-08, + 1.0059093114023199e-08, + 1.0056256272150677e-08, + 1.0062689348444565e-08 + ], + "gamma_dfa": 0.09616703895881074, + "acc_eval": 0.2998046875, + "loss_eval": 1.9510722160339355, + "epoch": 74 + }, + { + "hidden_norms": [ + 37739.125, + 83378024.0, + 294890528.0, + 540384832.0, + 675452224.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.20015284166675e-08, + 2.812508559379978e-10, + 2.7935267987722057e-10, + 2.7908611532900807e-10, + 2.792987507937994e-10 + ], + "bp_grad_norms_F": [ + 2.858193283827859e-06, + 1.0136964156970407e-08, + 9.987989102455685e-09, + 9.985158477832101e-09, + 9.991581784163373e-09 + ], + "gamma_dfa": 0.09625962336212979, + "acc_eval": 0.306640625, + "loss_eval": 1.949669599533081, + "epoch": 75 + }, + { + "hidden_norms": [ + 37841.23828125, + 84099792.0, + 297324992.0, + 545087552.0, + 681202944.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.180555717743118e-08, + 2.81841883165157e-10, + 2.790032094246442e-10, + 2.7877883335136744e-10, + 2.790592201762365e-10 + ], + "bp_grad_norms_F": [ + 2.8341921733954223e-06, + 1.0072185752107998e-08, + 9.925220645357058e-09, + 9.922425547870262e-09, + 9.928815103421584e-09 + ], + "gamma_dfa": 0.09619013674819143, + "acc_eval": 0.2958984375, + "loss_eval": 1.947105884552002, + "epoch": 76 + }, + { + "hidden_norms": [ + 37933.76953125, + 84846568.0, + 299677280.0, + 549384448.0, + 686714688.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.136923775239666e-08, + 2.810240096184913e-10, + 2.7924595968897847e-10, + 2.7894245246962157e-10, + 2.789228015220857e-10 + ], + "bp_grad_norms_F": [ + 2.822413307512761e-06, + 1.0021487639733095e-08, + 9.876163886701761e-09, + 9.873332373899757e-09, + 9.879697948633748e-09 + ], + "gamma_dfa": 0.09583658421615837, + "acc_eval": 0.306640625, + "loss_eval": 1.9495177268981934, + "epoch": 77 + }, + { + "hidden_norms": [ + 38020.0, + 85562224.0, + 301864096.0, + 553597760.0, + 691941760.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.160018545780076e-08, + 2.8198060553208393e-10, + 2.797063691772905e-10, + 2.7946911451692813e-10, + 2.796869680299352e-10 + ], + "bp_grad_norms_F": [ + 2.7969890652457252e-06, + 9.96650406648314e-09, + 9.82430670148915e-09, + 9.821477853222405e-09, + 9.827816782603804e-09 + ], + "gamma_dfa": 0.09604255547674256, + "acc_eval": 0.298828125, + "loss_eval": 1.9492969512939453, + "epoch": 78 + }, + { + "hidden_norms": [ + 38095.6171875, + 86194680.0, + 304047168.0, + 557639872.0, + 696924224.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.120950063997043e-08, + 2.782411523405415e-10, + 2.750368821580196e-10, + 2.7475391406461824e-10, + 2.748750949077561e-10 + ], + "bp_grad_norms_F": [ + 2.7781038625107612e-06, + 9.913026843832995e-09, + 9.771905951083681e-09, + 9.769114406310564e-09, + 9.775444453907767e-09 + ], + "gamma_dfa": 0.09590470486728009, + "acc_eval": 0.3037109375, + "loss_eval": 1.9471888542175293, + "epoch": 79 + }, + { + "hidden_norms": [ + 38161.02734375, + 86761784.0, + 305935040.0, + 560989248.0, + 701039488.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.1234330555871566e-08, + 2.762826911695271e-10, + 2.737765292248895e-10, + 2.7344454478495095e-10, + 2.735327242486818e-10 + ], + "bp_grad_norms_F": [ + 2.7851888262375724e-06, + 9.883654783493512e-09, + 9.742406881230181e-09, + 9.73962688277652e-09, + 9.74590719238222e-09 + ], + "gamma_dfa": 0.0961023918025603, + "acc_eval": 0.306640625, + "loss_eval": 1.9466722011566162, + "epoch": 80 + }, + { + "hidden_norms": [ + 38225.30859375, + 87283448.0, + 307635232.0, + 564114432.0, + 704943360.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.112997669698416e-08, + 2.7494201360056536e-10, + 2.7230390164945106e-10, + 2.724628855865774e-10, + 2.7264715485308955e-10 + ], + "bp_grad_norms_F": [ + 2.775808070509811e-06, + 9.851329529908526e-09, + 9.711465409623088e-09, + 9.708682746634167e-09, + 9.714950621741991e-09 + ], + "gamma_dfa": 0.09609865310994792, + "acc_eval": 0.30078125, + "loss_eval": 1.9487848281860352, + "epoch": 81 + }, + { + "hidden_norms": [ + 38286.74609375, + 87760048.0, + 309161312.0, + 566976960.0, + 708521920.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.100326561091606e-08, + 2.750530914141791e-10, + 2.7221699894219853e-10, + 2.720162428637707e-10, + 2.72086408958927e-10 + ], + "bp_grad_norms_F": [ + 2.76197988569038e-06, + 9.813816426174071e-09, + 9.67496749382235e-09, + 9.672206147115503e-09, + 9.678448265049155e-09 + ], + "gamma_dfa": 0.09604053818475222, + "acc_eval": 0.3017578125, + "loss_eval": 1.946324110031128, + "epoch": 82 + }, + { + "hidden_norms": [ + 38345.609375, + 88198008.0, + 310597792.0, + 569628928.0, + 711849600.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.150431903189201e-08, + 2.739733162560043e-10, + 2.706747326275405e-10, + 2.703801071923806e-10, + 2.703643420254309e-10 + ], + "bp_grad_norms_F": [ + 2.754284651018679e-06, + 9.79015535307326e-09, + 9.652834087603424e-09, + 9.650069188182897e-09, + 9.656329069684944e-09 + ], + "gamma_dfa": 0.09618356187274912, + "acc_eval": 0.3017578125, + "loss_eval": 1.952025294303894, + "epoch": 83 + }, + { + "hidden_norms": [ + 38393.00390625, + 88631992.0, + 311868064.0, + 571956672.0, + 714769600.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.135545677603659e-08, + 2.741361304625656e-10, + 2.7016161530113436e-10, + 2.7007868164119486e-10, + 2.702876256144293e-10 + ], + "bp_grad_norms_F": [ + 2.7439270979812136e-06, + 9.758214680744004e-09, + 9.621899721423688e-09, + 9.619145480144198e-09, + 9.625373387223135e-09 + ], + "gamma_dfa": 0.09624775896372739, + "acc_eval": 0.302734375, + "loss_eval": 1.9458943605422974, + "epoch": 84 + }, + { + "hidden_norms": [ + 38432.8515625, + 89003520.0, + 313081504.0, + 574038272.0, + 717387392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.1023032909824906e-08, + 2.709044100157598e-10, + 2.6825267007701825e-10, + 2.6804419794856926e-10, + 2.6862953528272726e-10 + ], + "bp_grad_norms_F": [ + 2.7511816824699054e-06, + 9.751657259471358e-09, + 9.615223284242802e-09, + 9.612453943930177e-09, + 9.618667640154399e-09 + ], + "gamma_dfa": 0.09613665863071219, + "acc_eval": 0.3095703125, + "loss_eval": 1.9508092403411865, + "epoch": 85 + }, + { + "hidden_norms": [ + 38471.12890625, + 89306096.0, + 314023616.0, + 575863488.0, + 719706496.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.104102740460803e-08, + 2.722161940305057e-10, + 2.698590240157728e-10, + 2.697040091259595e-10, + 2.698894441266475e-10 + ], + "bp_grad_norms_F": [ + 2.731306722125737e-06, + 9.717195048608573e-09, + 9.582218574166745e-09, + 9.579466997422514e-09, + 9.585680693646736e-09 + ], + "gamma_dfa": 0.09615167022275273, + "acc_eval": 0.296875, + "loss_eval": 1.9497017860412598, + "epoch": 86 + }, + { + "hidden_norms": [ + 38506.49609375, + 89593104.0, + 314968672.0, + 577511168.0, + 721761728.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.099763100702148e-08, + 2.7151769721456276e-10, + 2.698610224172171e-10, + 2.6943663966605413e-10, + 2.6953861365086595e-10 + ], + "bp_grad_norms_F": [ + 2.73057457889081e-06, + 9.698882585951196e-09, + 9.564125491579034e-09, + 9.561379243905321e-09, + 9.567577841096409e-09 + ], + "gamma_dfa": 0.09604650201799814, + "acc_eval": 0.2998046875, + "loss_eval": 1.948227882385254, + "epoch": 87 + }, + { + "hidden_norms": [ + 38536.46875, + 89827632.0, + 315715328.0, + 578913664.0, + 723505408.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.074277709127273e-08, + 2.7221166987168033e-10, + 2.7026783588901537e-10, + 2.700663026544703e-10, + 2.7004307123768e-10 + ], + "bp_grad_norms_F": [ + 2.727413175307447e-06, + 9.684548274435656e-09, + 9.549998125635284e-09, + 9.547248325247892e-09, + 9.553437152476363e-09 + ], + "gamma_dfa": 0.09602321147394832, + "acc_eval": 0.2978515625, + "loss_eval": 1.9482835531234741, + "epoch": 88 + }, + { + "hidden_norms": [ + 38560.86328125, + 90036944.0, + 316345728.0, + 580143808.0, + 725043392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.10075821580358e-08, + 2.70407807256845e-10, + 2.6787719265009e-10, + 2.677959520802631e-10, + 2.679190480581184e-10 + ], + "bp_grad_norms_F": [ + 2.7208343453821726e-06, + 9.672045386821537e-09, + 9.538242196072133e-09, + 9.535500389290519e-09, + 9.541698986481606e-09 + ], + "gamma_dfa": 0.09616725159867201, + "acc_eval": 0.3017578125, + "loss_eval": 1.9490463733673096, + "epoch": 89 + }, + { + "hidden_norms": [ + 38581.62890625, + 90197056.0, + 316901888.0, + 581085248.0, + 726214080.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.062888064344406e-08, + 2.7050772732906125e-10, + 2.680498045748436e-10, + 2.6770730077174676e-10, + 2.6768456895531756e-10 + ], + "bp_grad_norms_F": [ + 2.7148839762958232e-06, + 9.659022026653474e-09, + 9.525311206459719e-09, + 9.522568511499685e-09, + 9.528759115084995e-09 + ], + "gamma_dfa": 0.09604255046724575, + "acc_eval": 0.2998046875, + "loss_eval": 1.9472681283950806, + "epoch": 90 + }, + { + "hidden_norms": [ + 38598.60546875, + 90331488.0, + 317399072.0, + 581959360.0, + 727306816.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.070089059699967e-08, + 2.706254109696715e-10, + 2.6912555517455417e-10, + 2.687201572371123e-10, + 2.686441624710767e-10 + ], + "bp_grad_norms_F": [ + 2.7157270778843667e-06, + 9.650602983413137e-09, + 9.516874399650987e-09, + 9.514130816512534e-09, + 9.520310761956807e-09 + ], + "gamma_dfa": 0.09604466614109697, + "acc_eval": 0.296875, + "loss_eval": 1.9475460052490234, + "epoch": 91 + }, + { + "hidden_norms": [ + 38612.046875, + 90438432.0, + 317761152.0, + 582634240.0, + 728132928.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.071476039120171e-08, + 2.693741063541921e-10, + 2.670912935265335e-10, + 2.670463572496118e-10, + 2.6704632949403617e-10 + ], + "bp_grad_norms_F": [ + 2.7161215712112607e-06, + 9.646365484172748e-09, + 9.512908683007026e-09, + 9.51017486983119e-09, + 9.516351262561784e-09 + ], + "gamma_dfa": 0.09614986698579742, + "acc_eval": 0.3017578125, + "loss_eval": 1.947176218032837, + "epoch": 92 + }, + { + "hidden_norms": [ + 38622.60546875, + 90514344.0, + 318023872.0, + 583138880.0, + 728758976.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.0669719087181875e-08, + 2.7007937553058525e-10, + 2.6770055616687216e-10, + 2.676309729388038e-10, + 2.678066102212995e-10 + ], + "bp_grad_norms_F": [ + 2.715124537644442e-06, + 9.639773423941733e-09, + 9.506337939058085e-09, + 9.503595244098051e-09, + 9.509768084114967e-09 + ], + "gamma_dfa": 0.09608547511743382, + "acc_eval": 0.30078125, + "loss_eval": 1.9474897384643555, + "epoch": 93 + }, + { + "hidden_norms": [ + 38631.16796875, + 90589928.0, + 318254208.0, + 583549632.0, + 729273152.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.0695071251993795e-08, + 2.704435009270867e-10, + 2.6853075318911124e-10, + 2.682237765228024e-10, + 2.6814858666845964e-10 + ], + "bp_grad_norms_F": [ + 2.7134594802191714e-06, + 9.634878672670766e-09, + 9.501549769197482e-09, + 9.498809738772707e-09, + 9.504978137897524e-09 + ], + "gamma_dfa": 0.0960953844114556, + "acc_eval": 0.2978515625, + "loss_eval": 1.9472770690917969, + "epoch": 94 + }, + { + "hidden_norms": [ + 38638.31640625, + 90643280.0, + 318415136.0, + 583858560.0, + 729656640.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.078240761235975e-08, + 2.6967122979115743e-10, + 2.669718335290838e-10, + 2.6691132637424175e-10, + 2.6697202781811313e-10 + ], + "bp_grad_norms_F": [ + 2.711297611313057e-06, + 9.631804687160184e-09, + 9.498727138179675e-09, + 9.495988884111739e-09, + 9.502159947771815e-09 + ], + "gamma_dfa": 0.09613717825050117, + "acc_eval": 0.2998046875, + "loss_eval": 1.94759202003479, + "epoch": 95 + }, + { + "hidden_norms": [ + 38642.26171875, + 90677816.0, + 318520992.0, + 584046976.0, + 729889984.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.069002995128358e-08, + 2.6985705336990407e-10, + 2.6735619274020905e-10, + 2.671637633344659e-10, + 2.6708837919109385e-10 + ], + "bp_grad_norms_F": [ + 2.7110704650112893e-06, + 9.629748554118578e-09, + 9.496692321420142e-09, + 9.493953179173786e-09, + 9.500122466477023e-09 + ], + "gamma_dfa": 0.09612438916155952, + "acc_eval": 0.2998046875, + "loss_eval": 1.9474642276763916, + "epoch": 96 + }, + { + "hidden_norms": [ + 38644.16015625, + 90695256.0, + 318576288.0, + 584137856.0, + 730003328.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.070784681038276e-08, + 2.6936791686082984e-10, + 2.671484977678773e-10, + 2.668835430430505e-10, + 2.671484977678773e-10 + ], + "bp_grad_norms_F": [ + 2.710563421715051e-06, + 9.628578823139833e-09, + 9.495578545681838e-09, + 9.492838515257063e-09, + 9.499009578917139e-09 + ], + "gamma_dfa": 0.09612188487153617, + "acc_eval": 0.298828125, + "loss_eval": 1.9476267099380493, + "epoch": 97 + }, + { + "hidden_norms": [ + 38646.0625, + 90710400.0, + 318627968.0, + 584229760.0, + 730119232.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.075278863841959e-08, + 2.692224221334527e-10, + 2.671664001141494e-10, + 2.669355292361786e-10, + 2.6700280875147087e-10 + ], + "bp_grad_norms_F": [ + 2.7103426418761956e-06, + 9.62763913037179e-09, + 9.494667274623225e-09, + 9.49192813237687e-09, + 9.498098307858527e-09 + ], + "gamma_dfa": 0.09612667236069683, + "acc_eval": 0.2998046875, + "loss_eval": 1.9476723670959473, + "epoch": 98 + }, + { + "hidden_norms": [ + 38646.953125, + 90717408.0, + 318651872.0, + 584275776.0, + 730176960.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.076975639894954e-08, + 2.691815659261465e-10, + 2.671429466527542e-10, + 2.669321430559535e-10, + 2.669318377446217e-10 + ], + "bp_grad_norms_F": [ + 2.7102296371595003e-06, + 9.62716750763093e-09, + 9.494214303629178e-09, + 9.491475161382823e-09, + 9.4976462250429e-09 + ], + "gamma_dfa": 0.09612801273397054, + "acc_eval": 0.2998046875, + "loss_eval": 1.9476864337921143, + "epoch": 99 + }, + { + "hidden_norms": [ + 38646.98046875, + 90717592.0, + 318652416.0, + 584276736.0, + 730178112.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.076372033840926e-08, + 2.692036038531853e-10, + 2.6715371581609304e-10, + 2.669119369969053e-10, + 2.6695023969125486e-10 + ], + "bp_grad_norms_F": [ + 2.710211447265465e-06, + 9.627171060344608e-09, + 9.494216968164437e-09, + 9.491476937739662e-09, + 9.497648001399739e-09 + ], + "gamma_dfa": 0.09612751441454748, + "acc_eval": 0.2998046875, + "loss_eval": 1.947685956954956, + "epoch": 100 + } + ] +}
\ No newline at end of file |
