summaryrefslogtreecommitdiff
path: root/results/snapshot_evolution_v2/snapshot_evolution_s456.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_evolution_s456.json')
-rw-r--r--results/snapshot_evolution_v2/snapshot_evolution_s456.json5473
1 files changed, 5473 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s456.json b/results/snapshot_evolution_v2/snapshot_evolution_s456.json
new file mode 100644
index 0000000..f78065f
--- /dev/null
+++ b/results/snapshot_evolution_v2/snapshot_evolution_s456.json
@@ -0,0 +1,5473 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_evolution_v2",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 456,
+ "depth": 4,
+ "d_hidden": 256,
+ "log_every": 1
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 8.696551322937012,
+ 8.737784385681152,
+ 8.813130378723145,
+ 8.844642639160156,
+ 8.889528274536133
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010079912608489394,
+ 0.0010035138111561537,
+ 0.0009970925748348236,
+ 0.0009936393471434712,
+ 0.000986678060144186
+ ],
+ "bp_grad_norms_F": [
+ 0.035574451088905334,
+ 0.035288579761981964,
+ 0.035048045217990875,
+ 0.0346725769340992,
+ 0.03439188003540039
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.0927734375,
+ "loss_eval": 2.4863264560699463,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 79.9596176147461,
+ 82.38219451904297,
+ 86.97193145751953,
+ 92.46615600585938,
+ 99.17337799072266
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.704927025362849e-05,
+ 5.414035331341438e-05,
+ 5.3104751714272425e-05,
+ 5.354730456019752e-05,
+ 5.5780339607736096e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00240120361559093,
+ 0.0021707164123654366,
+ 0.002052225871011615,
+ 0.0020026240963488817,
+ 0.002049861242994666
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.400390625,
+ "loss_eval": 1.6942739486694336,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 95.21885681152344,
+ 97.9500732421875,
+ 101.84932708740234,
+ 108.15538787841797,
+ 115.16011810302734
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.467168764676899e-05,
+ 4.3202508095419034e-05,
+ 4.3004638428101316e-05,
+ 4.286228431737982e-05,
+ 4.4292191887507215e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018949288642033935,
+ 0.0017146588070318103,
+ 0.0016399234300479293,
+ 0.001598119386471808,
+ 0.0016228299355134368
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4599609375,
+ "loss_eval": 1.5051867961883545,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 112.65824890136719,
+ 111.87681579589844,
+ 114.76032257080078,
+ 118.74363708496094,
+ 125.05441284179688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4033156882505864e-05,
+ 4.2794465116458014e-05,
+ 4.2031828343169764e-05,
+ 4.134616028750315e-05,
+ 4.226301462040283e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018527565989643335,
+ 0.0017638156423345208,
+ 0.0016669610049575567,
+ 0.0015881577273830771,
+ 0.0015705813420936465
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4931640625,
+ "loss_eval": 1.4331163167953491,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 126.20967102050781,
+ 125.90274810791016,
+ 128.2918243408203,
+ 131.685302734375,
+ 136.71499633789062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.358301157481037e-05,
+ 4.267259282642044e-05,
+ 4.196130612399429e-05,
+ 4.08500200137496e-05,
+ 4.0281276596942917e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018887611804530025,
+ 0.0017927174922078848,
+ 0.0016837789444252849,
+ 0.0015876276884227991,
+ 0.0015263468958437443
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.490234375,
+ "loss_eval": 1.4055290222167969,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 137.673583984375,
+ 136.8435516357422,
+ 138.64651489257812,
+ 141.41473388671875,
+ 147.87835693359375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.085261025466025e-05,
+ 4.06657018174883e-05,
+ 3.941181785194203e-05,
+ 3.858502532239072e-05,
+ 3.7998870539013296e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001770049100741744,
+ 0.0016922445502132177,
+ 0.0016029543476179242,
+ 0.0015241446672007442,
+ 0.0014664788031950593
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.50390625,
+ "loss_eval": 1.3763911724090576,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 150.45315551757812,
+ 148.60609436035156,
+ 150.3750457763672,
+ 152.9460906982422,
+ 158.2902069091797
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.8344696804415435e-05,
+ 3.8422465877374634e-05,
+ 3.834897142951377e-05,
+ 3.7070902180857956e-05,
+ 3.6289642594056204e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017990845954045653,
+ 0.001743242726661265,
+ 0.0016358466818928719,
+ 0.0015305348206311464,
+ 0.0014392968732863665
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5166015625,
+ "loss_eval": 1.373401165008545,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 162.06126403808594,
+ 159.53811645507812,
+ 158.62655639648438,
+ 160.54307556152344,
+ 165.60415649414062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.797870522248559e-05,
+ 3.766914960579015e-05,
+ 3.7873480323469266e-05,
+ 3.735603968380019e-05,
+ 3.6521956644719467e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001707478309981525,
+ 0.0016470234841108322,
+ 0.0015834521036595106,
+ 0.001506388420239091,
+ 0.001406461582519114
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5283203125,
+ "loss_eval": 1.3223559856414795,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 169.8936309814453,
+ 168.42221069335938,
+ 169.54115295410156,
+ 171.452880859375,
+ 176.4298553466797
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.760562321986072e-05,
+ 3.8139285607030615e-05,
+ 3.7332967622205615e-05,
+ 3.670771184260957e-05,
+ 3.4867567592300475e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001674071652814746,
+ 0.0016396756982430816,
+ 0.001556537114083767,
+ 0.001464220928028226,
+ 0.0013669237960129976
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.529296875,
+ "loss_eval": 1.3310301303863525,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 177.821044921875,
+ 176.60687255859375,
+ 177.76409912109375,
+ 179.53733825683594,
+ 184.176513671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.643108357209712e-05,
+ 3.605252277338877e-05,
+ 3.6002034903503954e-05,
+ 3.529640525812283e-05,
+ 3.386645403224975e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016080558998510242,
+ 0.0015692447777837515,
+ 0.0014910849276930094,
+ 0.0014210963854566216,
+ 0.0013221093686297536
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5390625,
+ "loss_eval": 1.3072502613067627,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 188.1353759765625,
+ 184.39834594726562,
+ 184.91822814941406,
+ 185.82460021972656,
+ 191.45692443847656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.544713035807945e-05,
+ 3.5891316656488925e-05,
+ 3.613864828366786e-05,
+ 3.507022120174952e-05,
+ 3.361281778779812e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015651460271328688,
+ 0.0015296414494514465,
+ 0.0014787326799705625,
+ 0.0014131872449070215,
+ 0.0013114992761984468
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5537109375,
+ "loss_eval": 1.2935423851013184,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 193.53599548339844,
+ 189.33700561523438,
+ 190.08908081054688,
+ 192.31288146972656,
+ 198.0936737060547
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3899334084708244e-05,
+ 3.468272552709095e-05,
+ 3.463856774033047e-05,
+ 3.383589137229137e-05,
+ 3.240162550355308e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001495138043537736,
+ 0.0014781414065510035,
+ 0.0014301009941846132,
+ 0.0013711795909330249,
+ 0.0012839946430176497
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.544921875,
+ "loss_eval": 1.2766207456588745,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 199.85023498535156,
+ 194.9699249267578,
+ 193.4657440185547,
+ 194.60928344726562,
+ 199.97662353515625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.289094092906453e-05,
+ 3.539410317898728e-05,
+ 3.491900861263275e-05,
+ 3.4397991839796305e-05,
+ 3.252939859521575e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015656249597668648,
+ 0.0015614606672897935,
+ 0.0015110056847333908,
+ 0.0014306820230558515,
+ 0.00130200176499784
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5439453125,
+ "loss_eval": 1.2812860012054443,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 206.15440368652344,
+ 199.86099243164062,
+ 199.35470581054688,
+ 201.66831970214844,
+ 206.71054077148438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.430957076488994e-05,
+ 3.5125638532917947e-05,
+ 3.523785198922269e-05,
+ 3.404217568458989e-05,
+ 3.245573316235095e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015102275647222996,
+ 0.0015037795528769493,
+ 0.001468595233745873,
+ 0.0013989906292408705,
+ 0.0012804438592866063
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5517578125,
+ "loss_eval": 1.2559274435043335,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 209.39404296875,
+ 203.8543243408203,
+ 201.63771057128906,
+ 202.7413787841797,
+ 209.64585876464844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3599189919186756e-05,
+ 3.511353497742675e-05,
+ 3.4795291867339984e-05,
+ 3.415898390812799e-05,
+ 3.225719046895392e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015785910654813051,
+ 0.0015854343073442578,
+ 0.0015357385855168104,
+ 0.00144979078322649,
+ 0.0013052559224888682
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5478515625,
+ "loss_eval": 1.2778449058532715,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 214.74293518066406,
+ 208.2928924560547,
+ 206.78591918945312,
+ 207.79452514648438,
+ 213.0249481201172
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.347836172906682e-05,
+ 3.457088314462453e-05,
+ 3.509481393848546e-05,
+ 3.4477459848858416e-05,
+ 3.169552292092703e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015018024714663625,
+ 0.0015100837917998433,
+ 0.0014814585447311401,
+ 0.0014098759274929762,
+ 0.0012745971325784922
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5693359375,
+ "loss_eval": 1.2316113710403442,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 223.09906005859375,
+ 214.6353302001953,
+ 211.16726684570312,
+ 210.60520935058594,
+ 214.28952026367188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5336081054992974e-05,
+ 3.693878170452081e-05,
+ 3.7104789953446016e-05,
+ 3.635902612586506e-05,
+ 3.3355980121996254e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015461220173165202,
+ 0.0015768769662827253,
+ 0.0015498694265261292,
+ 0.001453379518352449,
+ 0.0013068238040432334
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.55078125,
+ "loss_eval": 1.2516858577728271,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 225.36517333984375,
+ 217.36669921875,
+ 214.27880859375,
+ 215.62054443359375,
+ 219.76197814941406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.474476397968829e-05,
+ 3.609717168728821e-05,
+ 3.612042564782314e-05,
+ 3.547673986759037e-05,
+ 3.216006007278338e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001510953065007925,
+ 0.0015347315929830074,
+ 0.0015160846523940563,
+ 0.001440546941012144,
+ 0.0012782461708411574
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.583984375,
+ "loss_eval": 1.2262325286865234,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 230.7099151611328,
+ 222.3380889892578,
+ 218.67819213867188,
+ 217.3147735595703,
+ 221.999755859375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.285402272013016e-05,
+ 3.4367294574622065e-05,
+ 3.490627204882912e-05,
+ 3.413260492379777e-05,
+ 3.064925112994388e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015693235909566283,
+ 0.0015950833912938833,
+ 0.0015582602936774492,
+ 0.001467122812755406,
+ 0.0012723723193630576
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5751953125,
+ "loss_eval": 1.2127145528793335,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 235.28932189941406,
+ 226.01202392578125,
+ 222.56756591796875,
+ 222.25152587890625,
+ 226.0247344970703
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.336059671710245e-05,
+ 3.488900983938947e-05,
+ 3.518831363180652e-05,
+ 3.5047873097937554e-05,
+ 3.1955056329024956e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015264152316376567,
+ 0.0015387749299407005,
+ 0.0015209508128464222,
+ 0.001451890799216926,
+ 0.00127940543461591
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5673828125,
+ "loss_eval": 1.2340281009674072,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 239.98486328125,
+ 230.95614624023438,
+ 226.7176513671875,
+ 225.3818359375,
+ 231.0238037109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4207379940198734e-05,
+ 3.5167759051546454e-05,
+ 3.5256896808277816e-05,
+ 3.462574022705667e-05,
+ 3.117474989267066e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015223841182887554,
+ 0.0015598630998283625,
+ 0.0015445069875568151,
+ 0.0014689662493765354,
+ 0.0012761331163346767
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.56640625,
+ "loss_eval": 1.2441283464431763,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 245.0663299560547,
+ 233.2012939453125,
+ 227.60426330566406,
+ 226.96006774902344,
+ 229.30145263671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.25386063195765e-05,
+ 3.39963698934298e-05,
+ 3.503257903503254e-05,
+ 3.4624255931703374e-05,
+ 3.013665264006704e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001554132904857397,
+ 0.0015968671068549156,
+ 0.001575724920257926,
+ 0.0014765377854928374,
+ 0.0012655528262257576
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.595703125,
+ "loss_eval": 1.1905839443206787,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 246.93258666992188,
+ 235.25485229492188,
+ 232.71095275878906,
+ 231.27796936035156,
+ 235.4611358642578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.248557914048433e-05,
+ 3.448772622505203e-05,
+ 3.525316424202174e-05,
+ 3.4218086511828005e-05,
+ 2.997798401338514e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001511804643087089,
+ 0.0015418389812111855,
+ 0.001536028808914125,
+ 0.0014609270729124546,
+ 0.001262559788301587
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.576171875,
+ "loss_eval": 1.2032543420791626,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 251.2838592529297,
+ 237.0211639404297,
+ 234.6432342529297,
+ 233.30433654785156,
+ 238.11598205566406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3030770282493904e-05,
+ 3.484229455352761e-05,
+ 3.59142868546769e-05,
+ 3.533583367243409e-05,
+ 3.1214847695082426e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015120860189199448,
+ 0.00155613012611866,
+ 0.0015533699188381433,
+ 0.001477457000873983,
+ 0.0012758751399815083
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.568359375,
+ "loss_eval": 1.220862627029419,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 253.3640594482422,
+ 242.6001739501953,
+ 237.11773681640625,
+ 237.31105041503906,
+ 241.1314697265625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.295885835541412e-05,
+ 3.492692485451698e-05,
+ 3.562758502084762e-05,
+ 3.515293064992875e-05,
+ 3.0970571970101446e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001516172313131392,
+ 0.0015499184373766184,
+ 0.0015383078716695309,
+ 0.0014658188447356224,
+ 0.0012659834465011954
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1925604343414307,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 258.6325378417969,
+ 245.05575561523438,
+ 239.04722595214844,
+ 237.04385375976562,
+ 240.51011657714844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.258220021962188e-05,
+ 3.459660729276948e-05,
+ 3.553628994268365e-05,
+ 3.461805317783728e-05,
+ 3.001722870976664e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015354488277807832,
+ 0.001572331297211349,
+ 0.0015721773961558938,
+ 0.0014915125211700797,
+ 0.0012740870006382465
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58203125,
+ "loss_eval": 1.1843492984771729,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 262.35577392578125,
+ 247.456298828125,
+ 241.52687072753906,
+ 239.8603057861328,
+ 242.48818969726562
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.335328074172139e-05,
+ 3.581988130463287e-05,
+ 3.6700876080431044e-05,
+ 3.52635579474736e-05,
+ 3.091046164627187e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015506797935813665,
+ 0.0016048819525167346,
+ 0.0016078166663646698,
+ 0.0015189298428595066,
+ 0.001287299208343029
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.2021183967590332,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 262.69769287109375,
+ 248.58924865722656,
+ 243.61415100097656,
+ 242.7408905029297,
+ 243.58761596679688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.363215728313662e-05,
+ 3.542406557244249e-05,
+ 3.617940456024371e-05,
+ 3.522956103552133e-05,
+ 3.093081613769755e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015515872510150075,
+ 0.0015918170101940632,
+ 0.0015870564384385943,
+ 0.0015067857457324862,
+ 0.001285396981984377
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.576171875,
+ "loss_eval": 1.1753299236297607,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 264.57330322265625,
+ 252.62904357910156,
+ 246.43833923339844,
+ 245.4523468017578,
+ 247.43896484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3458851248724386e-05,
+ 3.510742317303084e-05,
+ 3.596700116759166e-05,
+ 3.530932735884562e-05,
+ 3.0871200578985736e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015561054460704327,
+ 0.0015992044936865568,
+ 0.0016016490990296006,
+ 0.0015203922521322966,
+ 0.001274992828257382
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.587890625,
+ "loss_eval": 1.1872658729553223,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 268.63336181640625,
+ 253.74609375,
+ 247.2230224609375,
+ 244.07066345214844,
+ 248.91635131835938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.388441837159917e-05,
+ 3.55305674020201e-05,
+ 3.711709723575041e-05,
+ 3.565939550753683e-05,
+ 3.06438232655637e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015880814753472805,
+ 0.001632494037039578,
+ 0.0016352345701307058,
+ 0.001542495796456933,
+ 0.001282386132515967
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1748178005218506,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 269.5155944824219,
+ 254.65687561035156,
+ 249.08070373535156,
+ 246.4084930419922,
+ 248.03065490722656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.340150215080939e-05,
+ 3.542837657732889e-05,
+ 3.656153057818301e-05,
+ 3.62997452612035e-05,
+ 3.134588405373506e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015988025115802884,
+ 0.0016428054077550769,
+ 0.0016343789175152779,
+ 0.00154898373875767,
+ 0.001290567102842033
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.184614658355713,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 273.0482482910156,
+ 255.88157653808594,
+ 249.6538543701172,
+ 246.09181213378906,
+ 250.09861755371094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.485401612124406e-05,
+ 3.613552325987257e-05,
+ 3.727355215232819e-05,
+ 3.6410303437151015e-05,
+ 3.111722253379412e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016218513483181596,
+ 0.001677986583672464,
+ 0.0016929754056036472,
+ 0.001593436230905354,
+ 0.0013143697287887335
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5673828125,
+ "loss_eval": 1.2012369632720947,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 274.05010986328125,
+ 255.77792358398438,
+ 247.96664428710938,
+ 246.15379333496094,
+ 248.44847106933594
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.431778895901516e-05,
+ 3.609380655689165e-05,
+ 3.7377911212388426e-05,
+ 3.6012417695019394e-05,
+ 3.0985673220129684e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016116296174004674,
+ 0.0016683804569765925,
+ 0.0016786488704383373,
+ 0.0015687323175370693,
+ 0.001289981184527278
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5986328125,
+ "loss_eval": 1.1654620170593262,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 274.6156921386719,
+ 257.166259765625,
+ 251.9473876953125,
+ 251.01661682128906,
+ 252.84222412109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.185174864483997e-05,
+ 3.433173696976155e-05,
+ 3.572784407879226e-05,
+ 3.4680619137361646e-05,
+ 2.997389128722716e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015743848634883761,
+ 0.001610185718163848,
+ 0.0016222007106989622,
+ 0.0015360275283455849,
+ 0.0012806184822693467
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58984375,
+ "loss_eval": 1.1679120063781738,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 274.3385009765625,
+ 256.1404724121094,
+ 249.90264892578125,
+ 247.3904266357422,
+ 249.5623016357422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.419954009586945e-05,
+ 3.6830995668424293e-05,
+ 3.8464357203338295e-05,
+ 3.64230691047851e-05,
+ 3.0958552088122815e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016346886986866593,
+ 0.0016823107143864036,
+ 0.0016956342151388526,
+ 0.0015958002768456936,
+ 0.0013100137002766132
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.1599082946777344,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 276.65985107421875,
+ 258.50543212890625,
+ 251.1997833251953,
+ 247.7036895751953,
+ 248.07545471191406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.384043520782143e-05,
+ 3.567537714843638e-05,
+ 3.686825220938772e-05,
+ 3.5754670534515753e-05,
+ 3.0301211154437624e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016451155534014106,
+ 0.0016956959152594209,
+ 0.001703266054391861,
+ 0.0016015227884054184,
+ 0.0013142916141077876
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.148215889930725,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 279.6298522949219,
+ 261.1481018066406,
+ 253.67742919921875,
+ 250.86221313476562,
+ 250.6768035888672
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.341220144648105e-05,
+ 3.499272861517966e-05,
+ 3.6701327189803123e-05,
+ 3.602671858971007e-05,
+ 3.081390605075285e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016287019243463874,
+ 0.0016769150970503688,
+ 0.0016951658762991428,
+ 0.0015969424275681376,
+ 0.0013187138829380274
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6015625,
+ "loss_eval": 1.1451219320297241,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 277.2866516113281,
+ 258.4331359863281,
+ 251.4995880126953,
+ 249.0448455810547,
+ 248.5166015625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2723561162129045e-05,
+ 3.4428499930072576e-05,
+ 3.571901106624864e-05,
+ 3.4436179703334346e-05,
+ 2.9252587410155684e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016638770466670394,
+ 0.0017149352934211493,
+ 0.0017208203207701445,
+ 0.0016291715437546372,
+ 0.0013402353506535292
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.145239233970642,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 279.7109680175781,
+ 259.3131103515625,
+ 250.73587036132812,
+ 247.214111328125,
+ 249.20944213867188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.449835639912635e-05,
+ 3.682902752188966e-05,
+ 3.780073166126385e-05,
+ 3.652105442597531e-05,
+ 3.046718666155357e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001753124757669866,
+ 0.0018144651548936963,
+ 0.0018306451383978128,
+ 0.0017095789080485702,
+ 0.001379602705128491
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5908203125,
+ "loss_eval": 1.1677792072296143,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 279.9946594238281,
+ 260.2458190917969,
+ 252.0008087158203,
+ 250.56716918945312,
+ 250.73135375976562
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.489958180580288e-05,
+ 3.730110984179191e-05,
+ 3.791403287323192e-05,
+ 3.650010330602527e-05,
+ 3.076100256294012e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017145961755886674,
+ 0.0017580300336703658,
+ 0.001775139826349914,
+ 0.0016669962788000703,
+ 0.0013597821816802025
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1510668992996216,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 280.5132751464844,
+ 260.75970458984375,
+ 252.2814178466797,
+ 249.84548950195312,
+ 248.41783142089844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.552919588400982e-05,
+ 3.777973688556813e-05,
+ 3.952483166358434e-05,
+ 3.783141073654406e-05,
+ 3.1490348192164674e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017431442392989993,
+ 0.0017984459409490228,
+ 0.0018199888290837407,
+ 0.0017078405944630504,
+ 0.0013792469399049878
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1412110328674316,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 279.3873596191406,
+ 259.55096435546875,
+ 251.9462432861328,
+ 247.29443359375,
+ 247.82852172851562
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.456972990534268e-05,
+ 3.654780448414385e-05,
+ 3.848340566037223e-05,
+ 3.736113285413012e-05,
+ 3.1597948691342026e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017544032307341695,
+ 0.0018107325304299593,
+ 0.0018319039372727275,
+ 0.0017261328175663948,
+ 0.0013868761016055942
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1418483257293701,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 282.4360656738281,
+ 261.22149658203125,
+ 251.49090576171875,
+ 247.5189208984375,
+ 247.03427124023438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5179280530428514e-05,
+ 3.728548108483665e-05,
+ 3.779769394895993e-05,
+ 3.6327692214399576e-05,
+ 3.026284321094863e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017881252570077777,
+ 0.0018441356951370835,
+ 0.0018691252917051315,
+ 0.0017487212317064404,
+ 0.0013921407517045736
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1468144655227661,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 283.1267395019531,
+ 261.29425048828125,
+ 252.38563537597656,
+ 248.00192260742188,
+ 246.58505249023438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.485176421236247e-05,
+ 3.699021544889547e-05,
+ 3.812833165284246e-05,
+ 3.7145182432141155e-05,
+ 3.1198313081404194e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017692983383312821,
+ 0.0018438888946548104,
+ 0.001876220339909196,
+ 0.0017641744343563914,
+ 0.0014044356066733599
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1329892873764038,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 281.29327392578125,
+ 259.43359375,
+ 249.52906799316406,
+ 246.0892333984375,
+ 243.162109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.586204911698587e-05,
+ 3.787377499975264e-05,
+ 3.9215286960825324e-05,
+ 3.7436715501826257e-05,
+ 3.160976120852865e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018376735970377922,
+ 0.0019067999674007297,
+ 0.0019337635021656752,
+ 0.0017983472207561135,
+ 0.001438757055439055
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6181640625,
+ "loss_eval": 1.144508957862854,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 282.5230407714844,
+ 259.55322265625,
+ 248.72308349609375,
+ 245.0394287109375,
+ 243.0651092529297
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.6309906136011705e-05,
+ 3.868114436045289e-05,
+ 4.0484872442903e-05,
+ 3.8203681469894946e-05,
+ 3.144023139611818e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018340122187510133,
+ 0.0019134157337248325,
+ 0.0019425065256655216,
+ 0.0018252682639285922,
+ 0.001443033921532333
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.1290326118469238,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 280.8598327636719,
+ 260.14111328125,
+ 250.84779357910156,
+ 245.9561767578125,
+ 243.0910186767578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4626806154847145e-05,
+ 3.693445250974037e-05,
+ 3.8311845855787396e-05,
+ 3.7721722037531435e-05,
+ 3.145459049846977e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018591763218864799,
+ 0.0019209657330065966,
+ 0.0019388735527172685,
+ 0.001830682042054832,
+ 0.001447839429602027
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1423537731170654,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 280.17266845703125,
+ 259.26568603515625,
+ 248.45452880859375,
+ 243.45750427246094,
+ 241.2735137939453
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.609486884670332e-05,
+ 3.887504499289207e-05,
+ 4.01619981857948e-05,
+ 3.9294092857744545e-05,
+ 3.1412804673891515e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018975000130012631,
+ 0.0019804267212748528,
+ 0.002001592656597495,
+ 0.0018729616422206163,
+ 0.0014571875799447298
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.1366385221481323,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 281.79833984375,
+ 259.25860595703125,
+ 249.18551635742188,
+ 244.24977111816406,
+ 240.67100524902344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.47710374626331e-05,
+ 3.7153975426917896e-05,
+ 3.885528349201195e-05,
+ 3.792768620769493e-05,
+ 3.113777347607538e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019318967824801803,
+ 0.0019981141667813063,
+ 0.0020311782136559486,
+ 0.0018996316939592361,
+ 0.0014788025291636586
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6162109375,
+ "loss_eval": 1.138331651687622,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 282.3840637207031,
+ 258.1807861328125,
+ 248.13995361328125,
+ 243.45587158203125,
+ 239.51858520507812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.68369001080282e-05,
+ 3.935660788556561e-05,
+ 4.189974788459949e-05,
+ 3.9929436752572656e-05,
+ 3.188087430316955e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019372758688405156,
+ 0.0020036858040839434,
+ 0.0020287453662604094,
+ 0.001896715839393437,
+ 0.0014835885958746076
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1377842426300049,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 280.9283142089844,
+ 257.81524658203125,
+ 248.47984313964844,
+ 241.96157836914062,
+ 238.4756317138672
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.7310775951482356e-05,
+ 3.98769298044499e-05,
+ 4.1753111872822046e-05,
+ 4.021048516733572e-05,
+ 3.21856678056065e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019433718407526612,
+ 0.0020235073752701283,
+ 0.002055324148386717,
+ 0.0019370814552530646,
+ 0.0015049076173454523
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.133098840713501,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 279.66400146484375,
+ 256.7322082519531,
+ 246.65223693847656,
+ 241.45947265625,
+ 236.65582275390625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.620017014327459e-05,
+ 3.800772174145095e-05,
+ 4.072795491083525e-05,
+ 3.888807259500027e-05,
+ 3.182498039677739e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019729172345250845,
+ 0.002036863239482045,
+ 0.0020802877843379974,
+ 0.0019662927370518446,
+ 0.0015235996106639504
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.619140625,
+ "loss_eval": 1.1315571069717407,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 280.00152587890625,
+ 258.0238037109375,
+ 247.4223175048828,
+ 240.8101348876953,
+ 237.3229217529297
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.6401659599505365e-05,
+ 3.855170143651776e-05,
+ 4.065703978994861e-05,
+ 3.844475213554688e-05,
+ 3.1645795388612896e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019983802922070026,
+ 0.0020701857283711433,
+ 0.002107742242515087,
+ 0.001981276087462902,
+ 0.0015306670684367418
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.137194037437439,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 278.19708251953125,
+ 255.23036193847656,
+ 245.5857696533203,
+ 239.48196411132812,
+ 235.09983825683594
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.97727417293936e-05,
+ 4.185501529718749e-05,
+ 4.392741175252013e-05,
+ 4.302372326492332e-05,
+ 3.48737376043573e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002044696593657136,
+ 0.00211329385638237,
+ 0.002144050318747759,
+ 0.0020148823969066143,
+ 0.0015573638956993818
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1354646682739258,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 276.7043762207031,
+ 255.62408447265625,
+ 243.71484375,
+ 238.2984161376953,
+ 233.8153076171875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.715257116709836e-05,
+ 3.887641287292354e-05,
+ 4.099323268746957e-05,
+ 3.948296944145113e-05,
+ 3.221148654120043e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0020365805830806494,
+ 0.00209893099963665,
+ 0.0021342532709240913,
+ 0.0020123852882534266,
+ 0.0015702869277447462
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.623046875,
+ "loss_eval": 1.1295127868652344,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 279.308349609375,
+ 255.30587768554688,
+ 243.6786651611328,
+ 237.71823120117188,
+ 232.89991760253906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.9407084841514006e-05,
+ 4.1900668293237686e-05,
+ 4.364689812064171e-05,
+ 4.154618363827467e-05,
+ 3.264051701989956e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021011638455092907,
+ 0.002175872679799795,
+ 0.002217113971710205,
+ 0.002071501687169075,
+ 0.0015880379360169172
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.1201554536819458,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 276.9933166503906,
+ 253.379638671875,
+ 244.23390197753906,
+ 238.01930236816406,
+ 233.3076171875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.799827391048893e-05,
+ 4.017200990347192e-05,
+ 4.2665858927648515e-05,
+ 4.083341627847403e-05,
+ 3.210103386663832e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002064710482954979,
+ 0.0021362933330237865,
+ 0.0021728368010371923,
+ 0.0020478416699916124,
+ 0.0015873984666541219
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.1222728490829468,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 276.41168212890625,
+ 251.91033935546875,
+ 241.81382751464844,
+ 234.8279266357422,
+ 230.53956604003906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.770063631236553e-05,
+ 3.94962407881394e-05,
+ 4.150882887188345e-05,
+ 4.040042040287517e-05,
+ 3.2475280022481456e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002123177284374833,
+ 0.0021965675987303257,
+ 0.00223328173160553,
+ 0.0020905195269733667,
+ 0.0016039537731558084
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.1091526746749878,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 274.760986328125,
+ 250.0972442626953,
+ 239.511474609375,
+ 233.29798889160156,
+ 228.16070556640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.728809315362014e-05,
+ 4.0525967051507905e-05,
+ 4.239326517563313e-05,
+ 4.087138222530484e-05,
+ 3.216422919649631e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021635335870087147,
+ 0.0022461507469415665,
+ 0.0022873859852552414,
+ 0.002144098049029708,
+ 0.001636566361412406
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6416015625,
+ "loss_eval": 1.1180500984191895,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 273.91064453125,
+ 249.49452209472656,
+ 238.54373168945312,
+ 232.80734252929688,
+ 225.6833953857422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.966117583331652e-05,
+ 4.1986208088928834e-05,
+ 4.316144259064458e-05,
+ 4.332280877861194e-05,
+ 3.44519030477386e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021825931034982204,
+ 0.0022617392241954803,
+ 0.0023092019837349653,
+ 0.00216560042463243,
+ 0.0016612708568572998
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6279296875,
+ "loss_eval": 1.131789207458496,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 274.90008544921875,
+ 250.0712127685547,
+ 238.57467651367188,
+ 231.15719604492188,
+ 225.55587768554688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.130819797865115e-05,
+ 4.363877815194428e-05,
+ 4.489632920012809e-05,
+ 4.4512398744700477e-05,
+ 3.470887531875633e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002240521367639303,
+ 0.002310203853994608,
+ 0.0023576009552925825,
+ 0.002204722724854946,
+ 0.0016799044096842408
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6240234375,
+ "loss_eval": 1.1323366165161133,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 275.4504699707031,
+ 249.5341796875,
+ 237.540283203125,
+ 230.39208984375,
+ 224.43321228027344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.056218676851131e-05,
+ 4.288182390155271e-05,
+ 4.5818003854947165e-05,
+ 4.356648423708975e-05,
+ 3.492152245598845e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002249655080959201,
+ 0.0023316002916544676,
+ 0.002382595557719469,
+ 0.002231382764875889,
+ 0.00168902100995183
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.1275749206542969,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 273.6263122558594,
+ 248.43479919433594,
+ 234.8235321044922,
+ 228.0020751953125,
+ 222.4278106689453
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.0597744373371825e-05,
+ 4.323143730289303e-05,
+ 4.647616151487455e-05,
+ 4.4688425987260416e-05,
+ 3.521826511132531e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002307126997038722,
+ 0.0023877634666860104,
+ 0.0024417925160378218,
+ 0.0022813305258750916,
+ 0.001714664394967258
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.1252907514572144,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 271.7508239746094,
+ 246.79209899902344,
+ 233.84280395507812,
+ 226.96934509277344,
+ 220.57888793945312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.177554728812538e-05,
+ 4.393904600874521e-05,
+ 4.635817458620295e-05,
+ 4.428510874276981e-05,
+ 3.396430111024529e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002355988370254636,
+ 0.0024527544155716896,
+ 0.0025022663176059723,
+ 0.0023387460969388485,
+ 0.0017370774876326323
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1249933242797852,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 271.7035217285156,
+ 246.70675659179688,
+ 233.96661376953125,
+ 226.53175354003906,
+ 220.52359008789062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.2499312257859856e-05,
+ 4.503092714003287e-05,
+ 4.670799171435647e-05,
+ 4.5866876462241635e-05,
+ 3.720118911587633e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002408105880022049,
+ 0.0024944571778178215,
+ 0.002545328810811043,
+ 0.002381332218647003,
+ 0.0017641197191551328
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.625,
+ "loss_eval": 1.1418037414550781,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 271.0970153808594,
+ 246.78770446777344,
+ 234.2436065673828,
+ 226.7012176513672,
+ 219.61680603027344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.040581188746728e-05,
+ 4.3224725231993943e-05,
+ 4.4494401663541794e-05,
+ 4.3532105337362736e-05,
+ 3.4612559829838574e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0024068003986030817,
+ 0.002485552802681923,
+ 0.002538430504500866,
+ 0.002368941670283675,
+ 0.0017652952810749412
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.1279454231262207,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 270.66473388671875,
+ 244.8525390625,
+ 232.8356475830078,
+ 224.2222137451172,
+ 217.24554443359375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.1549992602085695e-05,
+ 4.493525193538517e-05,
+ 4.7448877012357116e-05,
+ 4.479651397559792e-05,
+ 3.5401590139372274e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002463088370859623,
+ 0.002551029436290264,
+ 0.002594881458207965,
+ 0.0024160456378012896,
+ 0.001803302438929677
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6376953125,
+ "loss_eval": 1.1330325603485107,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 269.8645935058594,
+ 243.50497436523438,
+ 231.37692260742188,
+ 222.27967834472656,
+ 215.22059631347656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.1519095248077065e-05,
+ 4.487609476200305e-05,
+ 4.708006963483058e-05,
+ 4.4878328480990604e-05,
+ 3.578457108233124e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0024854058865457773,
+ 0.0025721373967826366,
+ 0.0026270432863384485,
+ 0.0024401266127824783,
+ 0.0018134783022105694
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.63671875,
+ "loss_eval": 1.123876690864563,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 269.28570556640625,
+ 242.04359436035156,
+ 229.53497314453125,
+ 221.24327087402344,
+ 215.1306610107422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.279898348613642e-05,
+ 4.6176737669156864e-05,
+ 4.813459236174822e-05,
+ 4.609950337908231e-05,
+ 3.566763552953489e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0024860126432031393,
+ 0.002575797727331519,
+ 0.0026342689525336027,
+ 0.0024608916137367487,
+ 0.0018216874450445175
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.122079849243164,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 268.3481140136719,
+ 242.3759765625,
+ 229.19241333007812,
+ 220.78233337402344,
+ 213.58587646484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.163750054431148e-05,
+ 4.50872685178183e-05,
+ 4.8797548515722156e-05,
+ 4.597716542775743e-05,
+ 3.505409767967649e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025033215060830116,
+ 0.002596172271296382,
+ 0.002654082840308547,
+ 0.002480126451700926,
+ 0.0018305372213944793
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6328125,
+ "loss_eval": 1.1238645315170288,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 267.92425537109375,
+ 239.90985107421875,
+ 228.08212280273438,
+ 219.12835693359375,
+ 212.38052368164062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.42373457190115e-05,
+ 4.6515069698216394e-05,
+ 4.823393464903347e-05,
+ 4.762738535646349e-05,
+ 3.6444154829951e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025684935972094536,
+ 0.002675230847671628,
+ 0.0027295781765133142,
+ 0.0025394319090992212,
+ 0.0018643162911757827
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.135793685913086,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 266.2279052734375,
+ 239.37680053710938,
+ 226.3264923095703,
+ 218.04910278320312,
+ 210.68836975097656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4824198994319886e-05,
+ 4.7638000978622586e-05,
+ 4.962517414242029e-05,
+ 4.7396664740517735e-05,
+ 3.5957502404926345e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002600227715447545,
+ 0.002714222064241767,
+ 0.002763595897704363,
+ 0.0025755097158253193,
+ 0.0018772372277453542
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.623046875,
+ "loss_eval": 1.123576283454895,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 266.4837951660156,
+ 239.67581176757812,
+ 227.51805114746094,
+ 218.58811950683594,
+ 211.26596069335938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.245663512847386e-05,
+ 4.560768138617277e-05,
+ 4.797001020051539e-05,
+ 4.539322981145233e-05,
+ 3.4807548217941076e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025984421372413635,
+ 0.002703956561163068,
+ 0.002762222196906805,
+ 0.002577459439635277,
+ 0.0018865292659029365
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.61328125,
+ "loss_eval": 1.1362444162368774,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 264.8100891113281,
+ 237.96121215820312,
+ 226.14822387695312,
+ 217.3454132080078,
+ 208.98077392578125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.217765308567323e-05,
+ 4.603620618581772e-05,
+ 4.735886977869086e-05,
+ 4.5346474507823586e-05,
+ 3.594472218537703e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026375274173915386,
+ 0.0027397233061492443,
+ 0.0028012648690491915,
+ 0.0026011927984654903,
+ 0.0018980697495862842
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6318359375,
+ "loss_eval": 1.1286330223083496,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 264.8172302246094,
+ 238.0478057861328,
+ 225.0303497314453,
+ 217.1344757080078,
+ 209.569580078125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.242224895278923e-05,
+ 4.6696859499206766e-05,
+ 4.831598562304862e-05,
+ 4.5893459173385054e-05,
+ 3.54531584889628e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026500027161091566,
+ 0.002760941395536065,
+ 0.0028223067056387663,
+ 0.0026202781591564417,
+ 0.001915424014441669
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.1304678916931152,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 264.7013854980469,
+ 237.4438018798828,
+ 225.43527221679688,
+ 216.18502807617188,
+ 208.08302307128906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.43761091446504e-05,
+ 4.801220347872004e-05,
+ 4.9817157560028136e-05,
+ 4.829527097172104e-05,
+ 3.73583534383215e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002686889609321952,
+ 0.0028029615059494972,
+ 0.002866453491151333,
+ 0.002669648267328739,
+ 0.0019349679350852966
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6240234375,
+ "loss_eval": 1.1350867748260498,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 264.3004455566406,
+ 236.1824188232422,
+ 223.4772186279297,
+ 214.64682006835938,
+ 207.52272033691406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.3003376049455255e-05,
+ 4.6196739276638255e-05,
+ 4.8772617446957156e-05,
+ 4.7264005843317136e-05,
+ 3.6179160815663636e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027191757690161467,
+ 0.0028310383204370737,
+ 0.0028950762934982777,
+ 0.002689448418095708,
+ 0.0019433586858212948
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1378443241119385,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 262.62811279296875,
+ 235.80126953125,
+ 222.7261199951172,
+ 213.42430114746094,
+ 205.99493408203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4399519538274035e-05,
+ 4.737091148854233e-05,
+ 4.900431667920202e-05,
+ 4.768445069203153e-05,
+ 3.608842962421477e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027450472116470337,
+ 0.0028562990482896566,
+ 0.0029378861654549837,
+ 0.0027161173056811094,
+ 0.0019581648521125317
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6220703125,
+ "loss_eval": 1.137312889099121,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 262.612060546875,
+ 235.62489318847656,
+ 222.1566925048828,
+ 212.93875122070312,
+ 205.24142456054688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.443951911525801e-05,
+ 4.7095887566683814e-05,
+ 4.906025424133986e-05,
+ 4.8352503654314205e-05,
+ 3.6001758417114615e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002745443256571889,
+ 0.002859732834622264,
+ 0.002942001214250922,
+ 0.002725319005548954,
+ 0.001969744684174657
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6279296875,
+ "loss_eval": 1.126712441444397,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 262.6611633300781,
+ 235.52174377441406,
+ 221.89093017578125,
+ 213.1799774169922,
+ 204.9930877685547
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.5766752009512857e-05,
+ 4.834473293158226e-05,
+ 5.181043525226414e-05,
+ 4.826926306122914e-05,
+ 3.573719732230529e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027218428440392017,
+ 0.002838012296706438,
+ 0.002919211983680725,
+ 0.0027209871914237738,
+ 0.001970200566574931
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62109375,
+ "loss_eval": 1.1352139711380005,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 261.58856201171875,
+ 234.9381103515625,
+ 221.2636260986328,
+ 211.9308624267578,
+ 204.54647827148438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.5460306864697486e-05,
+ 4.857210296904668e-05,
+ 4.9856924306368455e-05,
+ 4.823243580176495e-05,
+ 3.731804099516012e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002767088357359171,
+ 0.0028805267065763474,
+ 0.0029621378052979708,
+ 0.00275496207177639,
+ 0.001986011164262891
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.134087324142456,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 261.3812561035156,
+ 234.79383850097656,
+ 220.678955078125,
+ 211.66114807128906,
+ 203.9405517578125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.64644399471581e-05,
+ 5.052189590060152e-05,
+ 5.2927574870409444e-05,
+ 5.0570299208629876e-05,
+ 3.7252495530992746e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027735778130590916,
+ 0.002885127207264304,
+ 0.0029686433263123035,
+ 0.002763227093964815,
+ 0.0019980284851044416
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.135728359222412,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 261.2560729980469,
+ 233.66014099121094,
+ 220.25682067871094,
+ 211.13511657714844,
+ 203.18130493164062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.6268629375845194e-05,
+ 4.9701800890034065e-05,
+ 5.169105133973062e-05,
+ 5.069339385954663e-05,
+ 3.80978781322483e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028223153203725815,
+ 0.0029419492930173874,
+ 0.0030234854202717543,
+ 0.002805375959724188,
+ 0.002015760401263833
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.619140625,
+ "loss_eval": 1.1317980289459229,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 260.62255859375,
+ 233.12937927246094,
+ 219.89907836914062,
+ 210.4191436767578,
+ 202.494873046875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.5126867917133495e-05,
+ 4.8572586820228025e-05,
+ 5.1520797569537535e-05,
+ 4.971070302417502e-05,
+ 3.838812335743569e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028271761257201433,
+ 0.002944816369563341,
+ 0.003029909450560808,
+ 0.0028170389123260975,
+ 0.002025141380727291
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6259765625,
+ "loss_eval": 1.1392892599105835,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 260.0465393066406,
+ 232.27760314941406,
+ 218.845458984375,
+ 209.7770233154297,
+ 201.92831420898438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.730001455754973e-05,
+ 5.118208355270326e-05,
+ 5.1580365834524855e-05,
+ 4.936498589813709e-05,
+ 3.706002826220356e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028656981885433197,
+ 0.002991823712363839,
+ 0.0030798574443906546,
+ 0.0028517318423837423,
+ 0.0020406947005540133
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.625,
+ "loss_eval": 1.1393200159072876,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 259.99285888671875,
+ 232.2432403564453,
+ 218.6685333251953,
+ 209.5802001953125,
+ 201.7836456298828
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4883607188239694e-05,
+ 4.9325379222864285e-05,
+ 5.1563201850512996e-05,
+ 4.9446705816080794e-05,
+ 3.641278817667626e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002843427937477827,
+ 0.0029685739427804947,
+ 0.0030620063189417124,
+ 0.0028350763022899628,
+ 0.0020346841774880886
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.625,
+ "loss_eval": 1.136763572692871,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 259.7002868652344,
+ 232.1937713623047,
+ 218.6339569091797,
+ 209.42572021484375,
+ 201.48532104492188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.557083229883574e-05,
+ 5.006462743040174e-05,
+ 5.1964529120596126e-05,
+ 5.040188261773437e-05,
+ 3.70733359886799e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002866365248337388,
+ 0.0029951538890600204,
+ 0.0030862949788570404,
+ 0.0028592217713594437,
+ 0.002047886373475194
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.139750361442566,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 259.22808837890625,
+ 232.3558807373047,
+ 218.42848205566406,
+ 209.1579132080078,
+ 201.5212860107422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.5765504182782024e-05,
+ 4.875436570728198e-05,
+ 5.104453521198593e-05,
+ 5.005718412576243e-05,
+ 3.675639891298488e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002878013998270035,
+ 0.003002135781571269,
+ 0.0030916042160242796,
+ 0.002861205255612731,
+ 0.0020479748491197824
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.1344283819198608,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 259.1551513671875,
+ 232.05300903320312,
+ 218.15708923339844,
+ 208.9161834716797,
+ 201.6800537109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.611797339748591e-05,
+ 4.964259278494865e-05,
+ 5.252738264971413e-05,
+ 5.0600574468262494e-05,
+ 3.820879283011891e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028855716809630394,
+ 0.003010405693203211,
+ 0.0031016215216368437,
+ 0.002874146681278944,
+ 0.0020545709412544966
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.135157823562622,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 259.21893310546875,
+ 231.72747802734375,
+ 217.7665252685547,
+ 208.59022521972656,
+ 201.1155548095703
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.6835561079205945e-05,
+ 5.060776311438531e-05,
+ 5.325842721504159e-05,
+ 5.128757766215131e-05,
+ 3.774667493416928e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002893448108807206,
+ 0.0030188425444066525,
+ 0.0031124993693083525,
+ 0.002883171197026968,
+ 0.002058332087472081
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6298828125,
+ "loss_eval": 1.1357543468475342,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 258.88385009765625,
+ 230.9880828857422,
+ 217.33352661132812,
+ 208.3406524658203,
+ 200.54083251953125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.6940938773332164e-05,
+ 5.0942355301231146e-05,
+ 5.368283382267691e-05,
+ 5.184212204767391e-05,
+ 3.746367656276561e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029224599711596966,
+ 0.0030530549120157957,
+ 0.003145798807963729,
+ 0.0029114321805536747,
+ 0.0020718672312796116
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6279296875,
+ "loss_eval": 1.1398890018463135,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 258.7764587402344,
+ 231.19357299804688,
+ 217.22779846191406,
+ 207.97528076171875,
+ 199.982421875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.70306295028422e-05,
+ 5.185308327781968e-05,
+ 5.281997437123209e-05,
+ 5.1426530262688175e-05,
+ 3.7254685594234616e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002924826927483082,
+ 0.0030514320824295282,
+ 0.0031429482623934746,
+ 0.0029119658283889294,
+ 0.0020754521246999502
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.138663411140442,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 258.7837829589844,
+ 230.58901977539062,
+ 217.062255859375,
+ 207.7244873046875,
+ 199.89395141601562
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.688404078478925e-05,
+ 5.141457950230688e-05,
+ 5.3491079597733915e-05,
+ 5.087396493763663e-05,
+ 3.739634121302515e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029230716172605753,
+ 0.0030518025159835815,
+ 0.0031419326551258564,
+ 0.002910938812419772,
+ 0.00207503535784781
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.626953125,
+ "loss_eval": 1.1365739107131958,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 258.7561950683594,
+ 230.4254913330078,
+ 217.07546997070312,
+ 207.6160125732422,
+ 199.7816162109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.680828351411037e-05,
+ 5.096250242786482e-05,
+ 5.211709503782913e-05,
+ 5.09246347064618e-05,
+ 3.779645703616552e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002931967144832015,
+ 0.0030605625361204147,
+ 0.00315046776086092,
+ 0.0029180829878896475,
+ 0.002077121753245592
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.1363377571105957,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 258.76409912109375,
+ 230.5386505126953,
+ 216.76475524902344,
+ 207.16859436035156,
+ 199.2827911376953
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.749056097352877e-05,
+ 5.2020419389009476e-05,
+ 5.3769603255204856e-05,
+ 5.178397987037897e-05,
+ 3.789216498262249e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029493479523807764,
+ 0.0030784173868596554,
+ 0.0031682881526649,
+ 0.0029316784348338842,
+ 0.002084067091345787
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6298828125,
+ "loss_eval": 1.1382873058319092,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 258.7884826660156,
+ 230.40945434570312,
+ 216.70376586914062,
+ 207.1806182861328,
+ 199.41917419433594
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.741501834359951e-05,
+ 5.169968062546104e-05,
+ 5.352263542590663e-05,
+ 5.053802306065336e-05,
+ 3.758866660064086e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002947731176391244,
+ 0.003076745430007577,
+ 0.0031680618412792683,
+ 0.0029321794863790274,
+ 0.0020845714025199413
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.630859375,
+ "loss_eval": 1.1382077932357788,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 258.766845703125,
+ 230.38992309570312,
+ 216.7628173828125,
+ 207.26092529296875,
+ 199.36366271972656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.718741183751263e-05,
+ 5.1928480388596654e-05,
+ 5.3666040912503377e-05,
+ 5.089692058390938e-05,
+ 3.752821430680342e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002943811472505331,
+ 0.003073457395657897,
+ 0.0031646883580833673,
+ 0.0029298998415470123,
+ 0.002084212377667427
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.138296365737915,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 258.8481140136719,
+ 230.38389587402344,
+ 216.7748260498047,
+ 207.24560546875,
+ 199.39401245117188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.728109706775285e-05,
+ 5.156427505426109e-05,
+ 5.3663239668821916e-05,
+ 5.139272616361268e-05,
+ 3.7748181057395414e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002947240835055709,
+ 0.003076959168538451,
+ 0.0031680231913924217,
+ 0.0029323517810553312,
+ 0.0020851469598710537
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.1388041973114014,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 258.77734375,
+ 230.3692626953125,
+ 216.7212677001953,
+ 207.1890869140625,
+ 199.34091186523438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.7204313887050375e-05,
+ 5.154019163455814e-05,
+ 5.373918611439876e-05,
+ 5.1062332204310223e-05,
+ 3.7904177588643506e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029484080150723457,
+ 0.0030780842062085867,
+ 0.0031695417128503323,
+ 0.0029333126731216908,
+ 0.002085541607812047
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.138832688331604,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 258.7897644042969,
+ 230.38552856445312,
+ 216.73997497558594,
+ 207.1963653564453,
+ 199.38656616210938
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.726059705717489e-05,
+ 5.1730185077758506e-05,
+ 5.3854040743317455e-05,
+ 5.0960083171958104e-05,
+ 3.793121504713781e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00294809159822762,
+ 0.003077775239944458,
+ 0.003169153118506074,
+ 0.0029330949764698744,
+ 0.0020853858441114426
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.1388249397277832,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 258.7891845703125,
+ 230.38888549804688,
+ 216.73963928222656,
+ 207.19769287109375,
+ 199.4077606201172
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.725577309727669e-05,
+ 5.174486432224512e-05,
+ 5.38085114385467e-05,
+ 5.098402107250877e-05,
+ 3.7933263229206204e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002948042470961809,
+ 0.0030777468346059322,
+ 0.003169137053191662,
+ 0.002933081705123186,
+ 0.0020853858441114426
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6279296875,
+ "loss_eval": 1.1387826204299927,
+ "epoch": 100
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.696551322937012,
+ 8.737784385681152,
+ 8.813130378723145,
+ 8.844642639160156,
+ 8.889528274536133
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010079912608489394,
+ 0.0010035138111561537,
+ 0.0009970925748348236,
+ 0.0009936393471434712,
+ 0.000986678060144186
+ ],
+ "bp_grad_norms_F": [
+ 0.035574451088905334,
+ 0.035288579761981964,
+ 0.035048045217990875,
+ 0.0346725769340992,
+ 0.03439188003540039
+ ],
+ "gamma_dfa": 0.0033523982419865206,
+ "acc_eval": 0.0927734375,
+ "loss_eval": 2.4863264560699463,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 900.3377685546875,
+ 3463.92626953125,
+ 6660.5166015625,
+ 10478.5126953125,
+ 13466.513671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.017142833210528e-06,
+ 7.972002435963077e-07,
+ 7.783806381667091e-07,
+ 7.758338256280695e-07,
+ 7.810436954969191e-07
+ ],
+ "bp_grad_norms_F": [
+ 0.00013047464017290622,
+ 7.321321754716337e-05,
+ 7.131113670766354e-05,
+ 7.113779429346323e-05,
+ 7.09498199285008e-05
+ ],
+ "gamma_dfa": 0.1028625147882849,
+ "acc_eval": 0.2861328125,
+ "loss_eval": 1.970402717590332,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 1784.805419921875,
+ 14085.2138671875,
+ 36523.9375,
+ 61422.50390625,
+ 73870.3359375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.087140711017128e-07,
+ 1.772240381114898e-07,
+ 1.705584367073243e-07,
+ 1.7156033038645546e-07,
+ 1.728751612972701e-07
+ ],
+ "bp_grad_norms_F": [
+ 4.7445286327274516e-05,
+ 1.1973520486208145e-05,
+ 9.698592293716501e-06,
+ 9.335580216429662e-06,
+ 9.154121471510734e-06
+ ],
+ "gamma_dfa": 0.09588160619023256,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.9628738164901733,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 2670.88134765625,
+ 35761.4921875,
+ 99927.7890625,
+ 170223.953125,
+ 201448.390625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.815078338855528e-07,
+ 7.772520405069372e-08,
+ 7.527528111950232e-08,
+ 7.557918735301428e-08,
+ 7.57173737042649e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.8944486984983087e-05,
+ 3.2005805223889183e-06,
+ 2.6765355869429186e-06,
+ 2.639568720042007e-06,
+ 2.6436800908413716e-06
+ ],
+ "gamma_dfa": 0.09442083747126162,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.9821033477783203,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 3506.001220703125,
+ 70233.9375,
+ 205054.078125,
+ 348792.375,
+ 416698.5625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.5228594558466284e-07,
+ 4.338783554658221e-08,
+ 4.114394869247917e-08,
+ 4.122260932604149e-08,
+ 4.124275321260029e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.319143823115155e-05,
+ 1.7165241388283903e-06,
+ 1.3772670399703202e-06,
+ 1.3777447520624264e-06,
+ 1.3796359326079255e-06
+ ],
+ "gamma_dfa": 0.09172606549691409,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.9661527872085571,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 4351.04052734375,
+ 120982.0390625,
+ 361547.03125,
+ 633667.3125,
+ 764198.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.632259790720127e-07,
+ 2.6118947005215887e-08,
+ 2.4913996199416033e-08,
+ 2.494128636953974e-08,
+ 2.4942012899487054e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.894752676889766e-05,
+ 1.1090510270150844e-06,
+ 8.424218549407669e-07,
+ 8.403117703892349e-07,
+ 8.407336054006009e-07
+ ],
+ "gamma_dfa": 0.08992433547973633,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.980475664138794,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 5174.9833984375,
+ 189817.0625,
+ 576763.3125,
+ 1012734.125,
+ 1235217.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.340334444601467e-07,
+ 1.826493090106851e-08,
+ 1.7263264595612782e-08,
+ 1.730784759956805e-08,
+ 1.7305337607353977e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.7139096598839387e-05,
+ 7.582453918075771e-07,
+ 5.794162802885694e-07,
+ 5.812879635413992e-07,
+ 5.813373604723893e-07
+ ],
+ "gamma_dfa": 0.08752730302512646,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.9696743488311768,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 5963.3935546875,
+ 276686.75,
+ 861517.375,
+ 1555059.75,
+ 1913322.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.834741223978199e-07,
+ 1.3120247110975924e-08,
+ 1.2326365705916942e-08,
+ 1.2353129186237766e-08,
+ 1.2349524958210623e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.4978587387304287e-05,
+ 5.169860628484457e-07,
+ 4.2094282548532647e-07,
+ 4.222391680741566e-07,
+ 4.222146685606276e-07
+ ],
+ "gamma_dfa": 0.08884745300747454,
+ "acc_eval": 0.2919921875,
+ "loss_eval": 1.9592503309249878,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 6751.1630859375,
+ 390990.65625,
+ 1268157.625,
+ 2303462.75,
+ 2850455.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.5272595394199016e-07,
+ 9.644952392307005e-09,
+ 9.213153795428752e-09,
+ 9.189856875480018e-09,
+ 9.217835383878992e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3214407772466075e-05,
+ 3.7820277043465467e-07,
+ 3.14011003865744e-07,
+ 3.1468064776163374e-07,
+ 3.146610936255456e-07
+ ],
+ "gamma_dfa": 0.08774545323103666,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9636309146881104,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 7557.10302734375,
+ 541741.25,
+ 1767146.375,
+ 3237576.25,
+ 4005094.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.3122942138797953e-07,
+ 7.519741274109037e-09,
+ 7.2226606917524805e-09,
+ 7.218183384338772e-09,
+ 7.221534037427091e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.196970697492361e-05,
+ 2.9184533900661336e-07,
+ 2.4720966962377133e-07,
+ 2.4752529270699597e-07,
+ 2.4754368155299744e-07
+ ],
+ "gamma_dfa": 0.08941872720606625,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.9587393999099731,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 8353.015625,
+ 720288.5625,
+ 2367034.25,
+ 4437438.5,
+ 5500873.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.1009967099416826e-07,
+ 6.096115612308495e-09,
+ 5.8281148795913396e-09,
+ 5.816529036195561e-09,
+ 5.823292070772368e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0853039384528529e-05,
+ 2.2833219759377243e-07,
+ 1.979581298883204e-07,
+ 1.9814572738141578e-07,
+ 1.9820384977720096e-07
+ ],
+ "gamma_dfa": 0.09132041316479445,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9605882167816162,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 9134.4443359375,
+ 924688.8125,
+ 3108971.25,
+ 5809310.0,
+ 7180875.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.9402843065563502e-07,
+ 4.977510403847418e-09,
+ 4.8141264308299014e-09,
+ 4.791541829973767e-09,
+ 4.794175723077387e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0063903573609423e-05,
+ 1.9364638603747153e-07,
+ 1.6622837506474752e-07,
+ 1.6636218447274587e-07,
+ 1.6641583044929575e-07
+ ],
+ "gamma_dfa": 0.08994872949551791,
+ "acc_eval": 0.2822265625,
+ "loss_eval": 1.9717106819152832,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 9934.0107421875,
+ 1171186.5,
+ 4059807.75,
+ 7477705.0,
+ 9248714.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.802942222184356e-07,
+ 4.213630333538276e-09,
+ 4.032348677185382e-09,
+ 4.031016409555832e-09,
+ 4.033940292913485e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.375374247611035e-06,
+ 1.60658984782458e-07,
+ 1.398711617639492e-07,
+ 1.399746452079853e-07,
+ 1.4004145043600147e-07
+ ],
+ "gamma_dfa": 0.09168496390338987,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9513648748397827,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 10690.2216796875,
+ 1474348.375,
+ 5210694.5,
+ 9539616.0,
+ 11795722.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7011585384807404e-07,
+ 3.5948770626959003e-09,
+ 3.444458496204561e-09,
+ 3.439692752849055e-09,
+ 3.4398179860062328e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.913790225051343e-06,
+ 1.346561759874021e-07,
+ 1.1880944583708697e-07,
+ 1.1887690476442003e-07,
+ 1.1894194784645151e-07
+ ],
+ "gamma_dfa": 0.0931803259300068,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.959463357925415,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11428.3076171875,
+ 1789460.25,
+ 6431273.0,
+ 11810251.0,
+ 14610525.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5823535193248972e-07,
+ 3.1298097447063356e-09,
+ 3.012203153573978e-09,
+ 3.010908633527265e-09,
+ 3.010648619294898e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.233506378019229e-06,
+ 1.1668681310084139e-07,
+ 1.0298786889961775e-07,
+ 1.0303519104581937e-07,
+ 1.0309597797686365e-07
+ ],
+ "gamma_dfa": 0.09336384548805654,
+ "acc_eval": 0.2861328125,
+ "loss_eval": 1.9515889883041382,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 12175.4384765625,
+ 2177908.0,
+ 7886216.5,
+ 14475684.0,
+ 17927020.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5137742082060868e-07,
+ 2.705691448667835e-09,
+ 2.5981530260565933e-09,
+ 2.5995214869567462e-09,
+ 2.6000293029682098e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.800716048222966e-06,
+ 1.0053086896277819e-07,
+ 8.984200405848242e-08,
+ 8.987952071493055e-08,
+ 8.993622913067156e-08
+ ],
+ "gamma_dfa": 0.09357930033002049,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9580912590026855,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 12918.6787109375,
+ 2622644.5,
+ 9573671.0,
+ 17460572.0,
+ 21682046.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.432233602827182e-07,
+ 2.359643591631766e-09,
+ 2.2714441438864696e-09,
+ 2.2688442236074025e-09,
+ 2.2694950363444377e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.43454029361601e-06,
+ 8.846858889910436e-08,
+ 7.942762891843813e-08,
+ 7.945371294226788e-08,
+ 7.950914238108453e-08
+ ],
+ "gamma_dfa": 0.09332277777139097,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9656270742416382,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 13676.931640625,
+ 3144179.5,
+ 11421599.0,
+ 20832254.0,
+ 25907438.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.3402345189206244e-07,
+ 2.1064472388587774e-09,
+ 2.0263852817947736e-09,
+ 2.0199610872850826e-09,
+ 2.0222397090208233e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.909830062795663e-06,
+ 7.773559929091789e-08,
+ 7.076827301943922e-08,
+ 7.077783692466255e-08,
+ 7.082799413637986e-08
+ ],
+ "gamma_dfa": 0.0945073509356007,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.9510960578918457,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 14410.64453125,
+ 3691622.0,
+ 13302875.0,
+ 24659928.0,
+ 30700242.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2569752527724631e-07,
+ 1.8540845525549798e-09,
+ 1.8018908587436044e-09,
+ 1.8003264434796051e-09,
+ 1.802896276714705e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.58303315503872e-06,
+ 6.894391191281102e-08,
+ 6.3350469758916e-08,
+ 6.336826174901944e-08,
+ 6.340740554833246e-08
+ ],
+ "gamma_dfa": 0.09388192358892411,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9456725120544434,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 15102.634765625,
+ 4270070.0,
+ 15687016.0,
+ 28858048.0,
+ 35882240.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2314617947595252e-07,
+ 1.6925943979728686e-09,
+ 1.6383979728473719e-09,
+ 1.6367472932543592e-09,
+ 1.6394127166918793e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.343140285025584e-06,
+ 6.240136940505181e-08,
+ 5.757489418556361e-08,
+ 5.7587019597349354e-08,
+ 5.7624333749117795e-08
+ ],
+ "gamma_dfa": 0.09518493304494768,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9497833251953125,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 15809.6728515625,
+ 4913181.0,
+ 18109688.0,
+ 33281892.0,
+ 41436228.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1704661773137559e-07,
+ 1.533212445892218e-09,
+ 1.483607681151966e-09,
+ 1.4837684414459318e-09,
+ 1.4838255069093975e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.079233116906835e-06,
+ 5.7217945936827164e-08,
+ 5.270470992968512e-08,
+ 5.2718213794378244e-08,
+ 5.2752689327917324e-08
+ ],
+ "gamma_dfa": 0.09407007653499022,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.961036205291748,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 16522.783203125,
+ 5620503.0,
+ 20819020.0,
+ 38391960.0,
+ 47723272.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1146808986950418e-07,
+ 1.4118024527220996e-09,
+ 1.3678460586419305e-09,
+ 1.3669514409286876e-09,
+ 1.3668450815629285e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.778397280664649e-06,
+ 5.162353389209784e-08,
+ 4.8153967924235985e-08,
+ 4.816252285877454e-08,
+ 4.8193449231348495e-08
+ ],
+ "gamma_dfa": 0.09494083630852401,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.9576481580734253,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 17230.27734375,
+ 6437730.5,
+ 23789486.0,
+ 43960328.0,
+ 54569096.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0952022932997352e-07,
+ 1.2858689668604484e-09,
+ 1.246260317167014e-09,
+ 1.2462959553261044e-09,
+ 1.2484926426026277e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.637425147142494e-06,
+ 4.732414282671016e-08,
+ 4.430494371376881e-08,
+ 4.431280586913999e-08,
+ 4.434128086927558e-08
+ ],
+ "gamma_dfa": 0.09481688600499183,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.9625442028045654,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 17916.12890625,
+ 7217473.5,
+ 26969020.0,
+ 49888804.0,
+ 62010184.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.043977349013403e-07,
+ 1.1912204556097095e-09,
+ 1.159051632448893e-09,
+ 1.1590449711107453e-09,
+ 1.159014662022173e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.385433269111672e-06,
+ 4.3334623001101136e-08,
+ 4.083162963297582e-08,
+ 4.0836408032873805e-08,
+ 4.0863898931320364e-08
+ ],
+ "gamma_dfa": 0.0946647283853963,
+ "acc_eval": 0.2939453125,
+ "loss_eval": 1.9656811952590942,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 18617.46875,
+ 8095365.0,
+ 30241864.0,
+ 56059896.0,
+ 69702984.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.001103129283365e-07,
+ 1.1034658742303805e-09,
+ 1.0674757744411068e-09,
+ 1.0666105776380164e-09,
+ 1.0677670969627684e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.150916877028067e-06,
+ 3.999087283546032e-08,
+ 3.779740609388682e-08,
+ 3.780221291549424e-08,
+ 3.782682256314729e-08
+ ],
+ "gamma_dfa": 0.09509630355751142,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.9476948976516724,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 19248.7890625,
+ 9047595.0,
+ 33634812.0,
+ 62495088.0,
+ 77796536.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.749370377676314e-08,
+ 1.0280801765460978e-09,
+ 9.980430926148642e-10,
+ 9.978470272287154e-10,
+ 9.990493987643845e-10
+ ],
+ "bp_grad_norms_F": [
+ 5.017087005398935e-06,
+ 3.7442834610601494e-08,
+ 3.536156611971819e-08,
+ 3.536548476290591e-08,
+ 3.538822213045023e-08
+ ],
+ "gamma_dfa": 0.09479212731821463,
+ "acc_eval": 0.2861328125,
+ "loss_eval": 1.9604804515838623,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 19902.470703125,
+ 10030725.0,
+ 37252656.0,
+ 69351704.0,
+ 86270768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.411947843318558e-08,
+ 9.563448921667828e-10,
+ 9.361866837309663e-10,
+ 9.359075736625755e-10,
+ 9.361766917237446e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.873440502706217e-06,
+ 3.4947159832654506e-08,
+ 3.313299146157078e-08,
+ 3.3137865784738096e-08,
+ 3.315915364510147e-08
+ ],
+ "gamma_dfa": 0.09510701123508625,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9498941898345947,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 20513.66796875,
+ 11086393.0,
+ 41223968.0,
+ 76828584.0,
+ 95694480.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.249640697817085e-08,
+ 9.003223166992314e-10,
+ 8.743661350507637e-10,
+ 8.736535939135592e-10,
+ 8.752278901624777e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.75014485346037e-06,
+ 3.290759664764664e-08,
+ 3.1125043875590563e-08,
+ 3.1127818544973707e-08,
+ 3.11488683735206e-08
+ ],
+ "gamma_dfa": 0.09552363055991009,
+ "acc_eval": 0.2841796875,
+ "loss_eval": 1.9527215957641602,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 21161.345703125,
+ 12263719.0,
+ 45533684.0,
+ 84877296.0,
+ 105753224.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.900443049242313e-08,
+ 8.457264888406257e-10,
+ 8.261510919815862e-10,
+ 8.261567541190118e-10,
+ 8.276057061884501e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.624974280886818e-06,
+ 3.0792985938887796e-08,
+ 2.9227694042788244e-08,
+ 2.9232776199705768e-08,
+ 2.9251353339532216e-08
+ ],
+ "gamma_dfa": 0.09527035459177569,
+ "acc_eval": 0.2890625,
+ "loss_eval": 1.950648307800293,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 21787.568359375,
+ 13358760.0,
+ 49723396.0,
+ 92840264.0,
+ 115901424.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.79872459336184e-08,
+ 8.034463094830357e-10,
+ 7.846168159630906e-10,
+ 7.837334670135476e-10,
+ 7.841179927581265e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.530191290541552e-06,
+ 2.9184068495169413e-08,
+ 2.7723606521590227e-08,
+ 2.7726789753046432e-08,
+ 2.7744931685447227e-08
+ ],
+ "gamma_dfa": 0.09598725114483386,
+ "acc_eval": 0.2919921875,
+ "loss_eval": 1.9504928588867188,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 22378.34765625,
+ 14611837.0,
+ 54335560.0,
+ 101350864.0,
+ 126710488.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.497670478391228e-08,
+ 7.560595483013799e-10,
+ 7.353461728420996e-10,
+ 7.342743080229752e-10,
+ 7.348425756781296e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.383283339848276e-06,
+ 2.7485034692631416e-08,
+ 2.6182895851434296e-08,
+ 2.618475392068831e-08,
+ 2.620201833281044e-08
+ ],
+ "gamma_dfa": 0.09509110247017816,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.9564056396484375,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 22972.798828125,
+ 15931348.0,
+ 59291124.0,
+ 110237776.0,
+ 138020368.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.252197858382715e-08,
+ 7.193445838993284e-10,
+ 6.977300404109599e-10,
+ 6.966639487515636e-10,
+ 6.977723399081981e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.255563453625655e-06,
+ 2.5971447215056287e-08,
+ 2.4833044065530885e-08,
+ 2.4835205891804435e-08,
+ 2.4851219748711628e-08
+ ],
+ "gamma_dfa": 0.0951943755208049,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9508299827575684,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 23525.689453125,
+ 17283022.0,
+ 64234984.0,
+ 119317480.0,
+ 149347744.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.036072784989301e-08,
+ 6.884249836858203e-10,
+ 6.666004415123439e-10,
+ 6.656397100179845e-10,
+ 6.674217845059616e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.212505245959619e-06,
+ 2.4864668546342727e-08,
+ 2.375563212808629e-08,
+ 2.3757841915994504e-08,
+ 2.3773273127858374e-08
+ ],
+ "gamma_dfa": 0.09534151147818193,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.95639967918396,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 24102.95703125,
+ 18811968.0,
+ 69193392.0,
+ 128823560.0,
+ 161700704.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.921565980950618e-08,
+ 6.526117424243694e-10,
+ 6.390621365426341e-10,
+ 6.381262185328751e-10,
+ 6.384171524764781e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.09630820286111e-06,
+ 2.3687046990517047e-08,
+ 2.2686869272092736e-08,
+ 2.2687553169475905e-08,
+ 2.2702355551018627e-08
+ ],
+ "gamma_dfa": 0.0947199320216896,
+ "acc_eval": 0.2880859375,
+ "loss_eval": 1.960526943206787,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 24687.955078125,
+ 20313542.0,
+ 74389296.0,
+ 138258576.0,
+ 173791248.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.937118340350935e-08,
+ 6.360312831965587e-10,
+ 6.205357339084117e-10,
+ 6.196035906569364e-10,
+ 6.196675395031548e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.070574505021796e-06,
+ 2.2864428572688666e-08,
+ 2.1894738466698982e-08,
+ 2.1895061763643753e-08,
+ 2.1909569269951135e-08
+ ],
+ "gamma_dfa": 0.09556430295924656,
+ "acc_eval": 0.2822265625,
+ "loss_eval": 1.97263765335083,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 25226.55078125,
+ 21851366.0,
+ 80000824.0,
+ 148574480.0,
+ 186595952.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.592127104771862e-08,
+ 6.044152955908544e-10,
+ 5.892630272619215e-10,
+ 5.896260146798227e-10,
+ 5.900769872724254e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.966818894696189e-06,
+ 2.1824051898988728e-08,
+ 2.093374718015184e-08,
+ 2.093443285389185e-08,
+ 2.0947767964685227e-08
+ ],
+ "gamma_dfa": 0.09587649442255497,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.9495991468429565,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 25759.50390625,
+ 23391128.0,
+ 85561480.0,
+ 158667136.0,
+ 198961760.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.493858333873504e-08,
+ 5.860726903783586e-10,
+ 5.731417562770957e-10,
+ 5.733850616529423e-10,
+ 5.73569580719635e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.896147973136976e-06,
+ 2.099926454945944e-08,
+ 2.0218029916918567e-08,
+ 2.0218159590967844e-08,
+ 2.0230830344303286e-08
+ ],
+ "gamma_dfa": 0.09563440945930779,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.954901099205017,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 26267.0859375,
+ 25111884.0,
+ 91593392.0,
+ 169479968.0,
+ 212491408.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.387680511783401e-08,
+ 5.612941222921108e-10,
+ 5.475105369079358e-10,
+ 5.468157038279742e-10,
+ 5.479569020749864e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.838411430479027e-06,
+ 2.0261547106770195e-08,
+ 1.9493551661753372e-08,
+ 1.949278782831243e-08,
+ 1.9505332460312275e-08
+ ],
+ "gamma_dfa": 0.09528586096712388,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9556396007537842,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 26761.587890625,
+ 26706742.0,
+ 97554944.0,
+ 180407616.0,
+ 226265728.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.260722156843258e-08,
+ 5.407673198121188e-10,
+ 5.32608401826451e-10,
+ 5.31698407524317e-10,
+ 5.328552044048251e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.7372303722804645e-06,
+ 1.9519287519642603e-08,
+ 1.8807236656925852e-08,
+ 1.8806394663783976e-08,
+ 1.8818212765836506e-08
+ ],
+ "gamma_dfa": 0.09491665422683582,
+ "acc_eval": 0.2890625,
+ "loss_eval": 1.963973879814148,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 27302.328125,
+ 28336562.0,
+ 103781320.0,
+ 191401696.0,
+ 240130064.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.187927053564636e-08,
+ 5.305865746763061e-10,
+ 5.205576525391109e-10,
+ 5.20661624925367e-10,
+ 5.217564713611011e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.734877054739627e-06,
+ 1.88775892695503e-08,
+ 1.8220953634795478e-08,
+ 1.8220212893993448e-08,
+ 1.8231482101782603e-08
+ ],
+ "gamma_dfa": 0.0957885464449646,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9604723453521729,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 27801.44140625,
+ 30051226.0,
+ 109945288.0,
+ 203002704.0,
+ 254881776.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.894305215610075e-08,
+ 5.044222262107212e-10,
+ 4.932855790507062e-10,
+ 4.934126440758746e-10,
+ 4.940316489232544e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.610647127061384e-06,
+ 1.8150354108570355e-08,
+ 1.753623024569606e-08,
+ 1.7534704355171016e-08,
+ 1.7545806585417267e-08
+ ],
+ "gamma_dfa": 0.09517717303242534,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.9589688777923584,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 28266.703125,
+ 31897594.0,
+ 116263888.0,
+ 215162448.0,
+ 270215296.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.807566421684896e-08,
+ 4.835814526593651e-10,
+ 4.775287942848649e-10,
+ 4.773109685274335e-10,
+ 4.784843632421598e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.590413371057366e-06,
+ 1.7596850199197434e-08,
+ 1.705259222717359e-08,
+ 1.7050926004458233e-08,
+ 1.7061644541627174e-08
+ ],
+ "gamma_dfa": 0.0961545761092566,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9595096111297607,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 28755.66015625,
+ 33582328.0,
+ 122605680.0,
+ 226378480.0,
+ 284438688.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.689399612014313e-08,
+ 4.746543713629592e-10,
+ 4.678599174745557e-10,
+ 4.68083238835959e-10,
+ 4.683119447790318e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5121436212648405e-06,
+ 1.7124380136124273e-08,
+ 1.6555107507087996e-08,
+ 1.655343240258844e-08,
+ 1.656368908697914e-08
+ ],
+ "gamma_dfa": 0.09569378412561491,
+ "acc_eval": 0.287109375,
+ "loss_eval": 1.9612011909484863,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 29227.5703125,
+ 35443612.0,
+ 129229904.0,
+ 238040368.0,
+ 299000064.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.582912703834154e-08,
+ 4.575871348500016e-10,
+ 4.493441174702184e-10,
+ 4.48520082185766e-10,
+ 4.485415650012925e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4321058137720684e-06,
+ 1.6602150765265833e-08,
+ 1.6083028242519504e-08,
+ 1.6080972997656318e-08,
+ 1.609118882583971e-08
+ ],
+ "gamma_dfa": 0.09606127908773487,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9551353454589844,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 29665.798828125,
+ 37243032.0,
+ 135839760.0,
+ 250377328.0,
+ 314433920.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.588776813032382e-08,
+ 4.4936304677278827e-10,
+ 4.4115311403913893e-10,
+ 4.406963405312325e-10,
+ 4.4055534220710513e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.3984799756581197e-06,
+ 1.6157997606569552e-08,
+ 1.564128204734061e-08,
+ 1.5638891071034777e-08,
+ 1.564865925729464e-08
+ ],
+ "gamma_dfa": 0.09547593681054423,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.9503705501556396,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 30096.123046875,
+ 39014544.0,
+ 141817168.0,
+ 261217760.0,
+ 328197248.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.549055342475185e-08,
+ 4.3991607578952596e-10,
+ 4.348142956800416e-10,
+ 4.3428130536149467e-10,
+ 4.349899329625373e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.382166596566094e-06,
+ 1.5776649320287106e-08,
+ 1.5299850275596327e-08,
+ 1.5297549893489304e-08,
+ 1.5307026757227504e-08
+ ],
+ "gamma_dfa": 0.09610002994304523,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.952854037284851,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 30554.974609375,
+ 40873780.0,
+ 148087312.0,
+ 272436128.0,
+ 342258336.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.514299855098216e-08,
+ 4.291983157767021e-10,
+ 4.228755678958862e-10,
+ 4.2251957488304015e-10,
+ 4.227345695717588e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.3793355669331504e-06,
+ 1.5485536408732514e-08,
+ 1.4993654318118388e-08,
+ 1.499121538017789e-08,
+ 1.5000590991576246e-08
+ ],
+ "gamma_dfa": 0.09557013235462364,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9633105993270874,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 30981.4765625,
+ 42548124.0,
+ 153904848.0,
+ 283882112.0,
+ 356627616.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.343542224840348e-08,
+ 4.1842326825580756e-10,
+ 4.139384113255318e-10,
+ 4.141494092113618e-10,
+ 4.1477912771092917e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.3046233056666097e-06,
+ 1.508391989091251e-08,
+ 1.4620022525946297e-08,
+ 1.4617588028897899e-08,
+ 1.462664656060042e-08
+ ],
+ "gamma_dfa": 0.09567815247282851,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.958325982093811,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 31383.2578125,
+ 44333160.0,
+ 160058736.0,
+ 295685184.0,
+ 371288096.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.18988522660402e-08,
+ 4.057836289206307e-10,
+ 4.0004452528386025e-10,
+ 3.9987613220660023e-10,
+ 4.004964138104583e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2255043151963037e-06,
+ 1.4663311453944061e-08,
+ 1.4252069746589768e-08,
+ 1.424969386931707e-08,
+ 1.4258660918642363e-08
+ ],
+ "gamma_dfa": 0.09609431066201068,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9508600234985352,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 31750.03125,
+ 46204072.0,
+ 166757840.0,
+ 307620864.0,
+ 385856832.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.133605978675405e-08,
+ 3.9670436380312424e-10,
+ 3.904292722456404e-10,
+ 3.9002356899686674e-10,
+ 3.9039230181892037e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2063508115243167e-06,
+ 1.4354414545891814e-08,
+ 1.3938280751801813e-08,
+ 1.3935605558401676e-08,
+ 1.394456727865645e-08
+ ],
+ "gamma_dfa": 0.09565898558139452,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9467211961746216,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 32133.1484375,
+ 47907484.0,
+ 173083168.0,
+ 319475424.0,
+ 400677984.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.030914079246941e-08,
+ 3.8645733835274143e-10,
+ 3.81215115030642e-10,
+ 3.812981042017327e-10,
+ 3.811861937208505e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.177025973855052e-06,
+ 1.4072985443647212e-08,
+ 1.368274382684831e-08,
+ 1.3679918531295243e-08,
+ 1.368857649453048e-08
+ ],
+ "gamma_dfa": 0.09606298332801089,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9524433612823486,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 32483.716796875,
+ 49794588.0,
+ 179046160.0,
+ 330962240.0,
+ 414954912.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.051003254015086e-08,
+ 3.794887737385011e-10,
+ 3.751928767670165e-10,
+ 3.752734789586043e-10,
+ 3.7574471312140645e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.154751766487607e-06,
+ 1.3766489281863414e-08,
+ 1.339402011524271e-08,
+ 1.3391274755747418e-08,
+ 1.3399712450734569e-08
+ ],
+ "gamma_dfa": 0.09573800596626825,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.952356219291687,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 32825.296875,
+ 51662352.0,
+ 185889568.0,
+ 343223360.0,
+ 430225696.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.9168662858155585e-08,
+ 3.7636679883767954e-10,
+ 3.7184264001233203e-10,
+ 3.7154498921943e-10,
+ 3.7157116272723556e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0909043289284455e-06,
+ 1.346105005239906e-08,
+ 1.3102917861829155e-08,
+ 1.3100156515122308e-08,
+ 1.3108366836434016e-08
+ ],
+ "gamma_dfa": 0.09539097778178984,
+ "acc_eval": 0.291015625,
+ "loss_eval": 1.9585516452789307,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 33148.9453125,
+ 53487464.0,
+ 192413680.0,
+ 354830112.0,
+ 444651488.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.949418024897568e-08,
+ 3.692673389288359e-10,
+ 3.6510769407804844e-10,
+ 3.6480282683548637e-10,
+ 3.65057900575394e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0807416351308348e-06,
+ 1.3205962545725924e-08,
+ 1.2856014031115137e-08,
+ 1.2853148767533185e-08,
+ 1.2861222309368259e-08
+ ],
+ "gamma_dfa": 0.09566472223013989,
+ "acc_eval": 0.2880859375,
+ "loss_eval": 1.9538320302963257,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 33465.359375,
+ 55258308.0,
+ 198680688.0,
+ 365875680.0,
+ 458634560.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.9228732141036744e-08,
+ 3.640579226971141e-10,
+ 3.6045816331764513e-10,
+ 3.6029040861862427e-10,
+ 3.6025293859154317e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.058711854464491e-06,
+ 1.294814744312589e-08,
+ 1.2619584488504643e-08,
+ 1.2616848898971966e-08,
+ 1.2624772338654111e-08
+ ],
+ "gamma_dfa": 0.09607254836737411,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9489495754241943,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 33763.53125,
+ 56920656.0,
+ 204554208.0,
+ 376681216.0,
+ 472155680.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.756867338391203e-08,
+ 3.4894195866108646e-10,
+ 3.4671995829960167e-10,
+ 3.464649955819965e-10,
+ 3.4666045034548176e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.092292217843351e-06,
+ 1.2733584853208413e-08,
+ 1.2427238793577544e-08,
+ 1.2424394846277664e-08,
+ 1.2432122886707475e-08
+ ],
+ "gamma_dfa": 0.09629741777825984,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9477816820144653,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 34061.03125,
+ 58650568.0,
+ 210577584.0,
+ 387585472.0,
+ 485747168.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.70959208801014e-08,
+ 3.4928168690662176e-10,
+ 3.46003392603933e-10,
+ 3.4562114281655454e-10,
+ 3.4606426058125805e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.178826091243536e-06,
+ 1.2512856528701377e-08,
+ 1.2208544397651622e-08,
+ 1.2205639166040783e-08,
+ 1.2213387634574246e-08
+ ],
+ "gamma_dfa": 0.09542209599749185,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9549853801727295,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 34344.76171875,
+ 60294200.0,
+ 216821792.0,
+ 398493824.0,
+ 499371840.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.7367511629990986e-08,
+ 3.416208427253764e-10,
+ 3.378898272288211e-10,
+ 3.377436663676292e-10,
+ 3.386138314187548e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2603361432848033e-06,
+ 1.2295201301526504e-08,
+ 1.2022674411582557e-08,
+ 1.2019833128817936e-08,
+ 1.2027326690144946e-08
+ ],
+ "gamma_dfa": 0.09621504079404986,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.9597327709197998,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 34621.87109375,
+ 62004936.0,
+ 222707536.0,
+ 409299680.0,
+ 512662208.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.6534943837505125e-08,
+ 3.356194766546139e-10,
+ 3.3068575655548216e-10,
+ 3.3087257933495096e-10,
+ 3.3104252672444545e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.325955731270369e-06,
+ 1.2073825494951507e-08,
+ 1.1812358202689666e-08,
+ 1.1809524025352403e-08,
+ 1.1816909228912209e-08
+ ],
+ "gamma_dfa": 0.09621665377926547,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9411261081695557,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 34892.69921875,
+ 63619864.0,
+ 228332912.0,
+ 419524224.0,
+ 525474048.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.6131870707076814e-08,
+ 3.3116545616884707e-10,
+ 3.281262206389357e-10,
+ 3.2806185545908306e-10,
+ 3.281940552657403e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.306513235656894e-06,
+ 1.1909767394513437e-08,
+ 1.165356344756674e-08,
+ 1.1650684861308491e-08,
+ 1.1658000786951561e-08
+ ],
+ "gamma_dfa": 0.09604647590094828,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9494699239730835,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 35134.12890625,
+ 65285940.0,
+ 233831760.0,
+ 429654048.0,
+ 537931904.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.542536740676951e-08,
+ 3.2549649087165733e-10,
+ 3.224807365587168e-10,
+ 3.2198288479889925e-10,
+ 3.2189514942437825e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2077998639579164e-06,
+ 1.1713971126425804e-08,
+ 1.1479991179896842e-08,
+ 1.147721562233528e-08,
+ 1.1484392992144876e-08
+ ],
+ "gamma_dfa": 0.09610223810159368,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.947687029838562,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 35383.89453125,
+ 66896316.0,
+ 239557328.0,
+ 439032672.0,
+ 549329344.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.55890657949476e-08,
+ 3.2204855449080583e-10,
+ 3.1836161484832814e-10,
+ 3.185524344306856e-10,
+ 3.1883792828146795e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.19811397275771e-06,
+ 1.1587792059231106e-08,
+ 1.1364262419988336e-08,
+ 1.1361324325775968e-08,
+ 1.1368459951199839e-08
+ ],
+ "gamma_dfa": 0.09620415412791772,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9550621509552002,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 35603.75390625,
+ 68393976.0,
+ 244906672.0,
+ 448738336.0,
+ 561222784.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.4847117070266904e-08,
+ 3.208481536010055e-10,
+ 3.1700905789300293e-10,
+ 3.1679742162893376e-10,
+ 3.169834394967097e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.1413667329616146e-06,
+ 1.1423910706298557e-08,
+ 1.1206890526693769e-08,
+ 1.1204000394116065e-08,
+ 1.1211046313519546e-08
+ ],
+ "gamma_dfa": 0.09554143912100699,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9572508335113525,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 35840.75,
+ 69909448.0,
+ 249732624.0,
+ 457790144.0,
+ 572499584.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.482150200464275e-08,
+ 3.132541726014182e-10,
+ 3.1085201079861235e-10,
+ 3.1094149477439714e-10,
+ 3.1132280087220465e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.1111580938159022e-06,
+ 1.1274166489272375e-08,
+ 1.1068144623038734e-08,
+ 1.1065306892987792e-08,
+ 1.1072265770906142e-08
+ ],
+ "gamma_dfa": 0.09598036286843126,
+ "acc_eval": 0.2939453125,
+ "loss_eval": 1.9514048099517822,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 36044.14453125,
+ 71301840.0,
+ 254043168.0,
+ 466339968.0,
+ 583323328.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.41697069422753e-08,
+ 3.088812261520246e-10,
+ 3.0549318630335165e-10,
+ 3.051613683968668e-10,
+ 3.050981411956144e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.063583790208213e-06,
+ 1.1131353616633533e-08,
+ 1.0936378025405702e-08,
+ 1.0933466576545925e-08,
+ 1.0940373940115933e-08
+ ],
+ "gamma_dfa": 0.09560732997124433,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9496949911117554,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 36240.3046875,
+ 72753064.0,
+ 259111488.0,
+ 475471840.0,
+ 594591872.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.367900612895937e-08,
+ 3.0714322751812517e-10,
+ 3.043856555695612e-10,
+ 3.04040070897571e-10,
+ 3.043043039774318e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.096502268817858e-06,
+ 1.1002981636920595e-08,
+ 1.0808172135057248e-08,
+ 1.0805252692591694e-08,
+ 1.0812099660029162e-08
+ ],
+ "gamma_dfa": 0.09588889799488243,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.951111078262329,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 36427.96484375,
+ 74044192.0,
+ 263715872.0,
+ 483414560.0,
+ 604480512.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.3715726977543454e-08,
+ 3.022930794571721e-10,
+ 2.992986969374556e-10,
+ 2.9908994725325044e-10,
+ 2.9924074329557016e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0333421818795614e-06,
+ 1.0890616408687492e-08,
+ 1.0706762587631147e-08,
+ 1.0703858244198727e-08,
+ 1.071066169089363e-08
+ ],
+ "gamma_dfa": 0.09630945282333414,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.949332594871521,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 36613.015625,
+ 75303768.0,
+ 267802576.0,
+ 490809920.0,
+ 613719616.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.348211473688025e-08,
+ 3.012197435925401e-10,
+ 2.9878169383046327e-10,
+ 2.9841951132425493e-10,
+ 2.984068825373498e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.008998646691907e-06,
+ 1.0781116444036343e-08,
+ 1.0603616651394532e-08,
+ 1.0600682998074262e-08,
+ 1.0607434930420823e-08
+ ],
+ "gamma_dfa": 0.0960872639734589,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9464266300201416,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 36784.2265625,
+ 76478576.0,
+ 271792224.0,
+ 498011968.0,
+ 622710336.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.403291680750044e-08,
+ 3.0129157502223336e-10,
+ 2.977850743768329e-10,
+ 2.975975854635493e-10,
+ 2.9797145306709183e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9997727324371226e-06,
+ 1.0701310948491027e-08,
+ 1.052768094922385e-08,
+ 1.0524773941256171e-08,
+ 1.0531463701113353e-08
+ ],
+ "gamma_dfa": 0.09624087948759552,
+ "acc_eval": 0.2939453125,
+ "loss_eval": 1.9560136795043945,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 36953.8671875,
+ 77622176.0,
+ 275419712.0,
+ 504592704.0,
+ 630923392.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.3204310290766443e-08,
+ 2.9739929963135125e-10,
+ 2.9424951364376284e-10,
+ 2.9405439194718497e-10,
+ 2.94715835069681e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.95851918963308e-06,
+ 1.0595774924127e-08,
+ 1.0427880781094245e-08,
+ 1.042505370918434e-08,
+ 1.0431726593651547e-08
+ ],
+ "gamma_dfa": 0.09637677710998105,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.950129747390747,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 37103.0546875,
+ 78713944.0,
+ 279082240.0,
+ 511376384.0,
+ 639270976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.3287564583115454e-08,
+ 2.9558042125010786e-10,
+ 2.94046592630437e-10,
+ 2.936023091315576e-10,
+ 2.9353278141464045e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9398986498563318e-06,
+ 1.0504810354916572e-08,
+ 1.034081797968156e-08,
+ 1.0337980249630618e-08,
+ 1.0344593626143705e-08
+ ],
+ "gamma_dfa": 0.09638382289995207,
+ "acc_eval": 0.29296875,
+ "loss_eval": 1.9502758979797363,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 37248.1015625,
+ 79737480.0,
+ 282511072.0,
+ 517720224.0,
+ 647238976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.260229585246634e-08,
+ 2.899096518405031e-10,
+ 2.8717414557455356e-10,
+ 2.8704966181791747e-10,
+ 2.871551885164081e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9307011573109776e-06,
+ 1.0423523377767197e-08,
+ 1.0264206373733487e-08,
+ 1.0261346439222052e-08,
+ 1.0267889649639983e-08
+ ],
+ "gamma_dfa": 0.0963258501906239,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.949232816696167,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 37381.0390625,
+ 80657776.0,
+ 285833920.0,
+ 523738208.0,
+ 654706368.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.2669339112298985e-08,
+ 2.929272380214343e-10,
+ 2.8994415202099333e-10,
+ 2.898675188767186e-10,
+ 2.900694684448979e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.912831860157894e-06,
+ 1.0341300260563457e-08,
+ 1.018425699328418e-08,
+ 1.0181377518847512e-08,
+ 1.0187909182945987e-08
+ ],
+ "gamma_dfa": 0.09613002402329585,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.9482614994049072,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 37505.28515625,
+ 81612512.0,
+ 289044000.0,
+ 529475296.0,
+ 661837376.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.200942965188915e-08,
+ 2.875680804592662e-10,
+ 2.8434027354862224e-10,
+ 2.8415880759524725e-10,
+ 2.840882251664567e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9117632038833108e-06,
+ 1.0266585803719863e-08,
+ 1.0111568471415922e-08,
+ 1.0108765380323348e-08,
+ 1.0115227766505086e-08
+ ],
+ "gamma_dfa": 0.09620579873444512,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.949747085571289,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 37622.05078125,
+ 82508960.0,
+ 292035424.0,
+ 534928544.0,
+ 668760064.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.211632014834322e-08,
+ 2.8521121575586506e-10,
+ 2.8250474182200946e-10,
+ 2.822122813217476e-10,
+ 2.8265498275281686e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9012180675636046e-06,
+ 1.0211213208322079e-08,
+ 1.0059093114023199e-08,
+ 1.0056256272150677e-08,
+ 1.0062689348444565e-08
+ ],
+ "gamma_dfa": 0.09616703895881074,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9510722160339355,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 37739.125,
+ 83378024.0,
+ 294890528.0,
+ 540384832.0,
+ 675452224.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.20015284166675e-08,
+ 2.812508559379978e-10,
+ 2.7935267987722057e-10,
+ 2.7908611532900807e-10,
+ 2.792987507937994e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.858193283827859e-06,
+ 1.0136964156970407e-08,
+ 9.987989102455685e-09,
+ 9.985158477832101e-09,
+ 9.991581784163373e-09
+ ],
+ "gamma_dfa": 0.09625962336212979,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.949669599533081,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 37841.23828125,
+ 84099792.0,
+ 297324992.0,
+ 545087552.0,
+ 681202944.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.180555717743118e-08,
+ 2.81841883165157e-10,
+ 2.790032094246442e-10,
+ 2.7877883335136744e-10,
+ 2.790592201762365e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.8341921733954223e-06,
+ 1.0072185752107998e-08,
+ 9.925220645357058e-09,
+ 9.922425547870262e-09,
+ 9.928815103421584e-09
+ ],
+ "gamma_dfa": 0.09619013674819143,
+ "acc_eval": 0.2958984375,
+ "loss_eval": 1.947105884552002,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 37933.76953125,
+ 84846568.0,
+ 299677280.0,
+ 549384448.0,
+ 686714688.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.136923775239666e-08,
+ 2.810240096184913e-10,
+ 2.7924595968897847e-10,
+ 2.7894245246962157e-10,
+ 2.789228015220857e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.822413307512761e-06,
+ 1.0021487639733095e-08,
+ 9.876163886701761e-09,
+ 9.873332373899757e-09,
+ 9.879697948633748e-09
+ ],
+ "gamma_dfa": 0.09583658421615837,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9495177268981934,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 38020.0,
+ 85562224.0,
+ 301864096.0,
+ 553597760.0,
+ 691941760.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.160018545780076e-08,
+ 2.8198060553208393e-10,
+ 2.797063691772905e-10,
+ 2.7946911451692813e-10,
+ 2.796869680299352e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7969890652457252e-06,
+ 9.96650406648314e-09,
+ 9.82430670148915e-09,
+ 9.821477853222405e-09,
+ 9.827816782603804e-09
+ ],
+ "gamma_dfa": 0.09604255547674256,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.9492969512939453,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 38095.6171875,
+ 86194680.0,
+ 304047168.0,
+ 557639872.0,
+ 696924224.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.120950063997043e-08,
+ 2.782411523405415e-10,
+ 2.750368821580196e-10,
+ 2.7475391406461824e-10,
+ 2.748750949077561e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7781038625107612e-06,
+ 9.913026843832995e-09,
+ 9.771905951083681e-09,
+ 9.769114406310564e-09,
+ 9.775444453907767e-09
+ ],
+ "gamma_dfa": 0.09590470486728009,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.9471888542175293,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 38161.02734375,
+ 86761784.0,
+ 305935040.0,
+ 560989248.0,
+ 701039488.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.1234330555871566e-08,
+ 2.762826911695271e-10,
+ 2.737765292248895e-10,
+ 2.7344454478495095e-10,
+ 2.735327242486818e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7851888262375724e-06,
+ 9.883654783493512e-09,
+ 9.742406881230181e-09,
+ 9.73962688277652e-09,
+ 9.74590719238222e-09
+ ],
+ "gamma_dfa": 0.0961023918025603,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9466722011566162,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 38225.30859375,
+ 87283448.0,
+ 307635232.0,
+ 564114432.0,
+ 704943360.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.112997669698416e-08,
+ 2.7494201360056536e-10,
+ 2.7230390164945106e-10,
+ 2.724628855865774e-10,
+ 2.7264715485308955e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.775808070509811e-06,
+ 9.851329529908526e-09,
+ 9.711465409623088e-09,
+ 9.708682746634167e-09,
+ 9.714950621741991e-09
+ ],
+ "gamma_dfa": 0.09609865310994792,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9487848281860352,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 38286.74609375,
+ 87760048.0,
+ 309161312.0,
+ 566976960.0,
+ 708521920.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.100326561091606e-08,
+ 2.750530914141791e-10,
+ 2.7221699894219853e-10,
+ 2.720162428637707e-10,
+ 2.72086408958927e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.76197988569038e-06,
+ 9.813816426174071e-09,
+ 9.67496749382235e-09,
+ 9.672206147115503e-09,
+ 9.678448265049155e-09
+ ],
+ "gamma_dfa": 0.09604053818475222,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.946324110031128,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 38345.609375,
+ 88198008.0,
+ 310597792.0,
+ 569628928.0,
+ 711849600.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.150431903189201e-08,
+ 2.739733162560043e-10,
+ 2.706747326275405e-10,
+ 2.703801071923806e-10,
+ 2.703643420254309e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.754284651018679e-06,
+ 9.79015535307326e-09,
+ 9.652834087603424e-09,
+ 9.650069188182897e-09,
+ 9.656329069684944e-09
+ ],
+ "gamma_dfa": 0.09618356187274912,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.952025294303894,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 38393.00390625,
+ 88631992.0,
+ 311868064.0,
+ 571956672.0,
+ 714769600.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.135545677603659e-08,
+ 2.741361304625656e-10,
+ 2.7016161530113436e-10,
+ 2.7007868164119486e-10,
+ 2.702876256144293e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7439270979812136e-06,
+ 9.758214680744004e-09,
+ 9.621899721423688e-09,
+ 9.619145480144198e-09,
+ 9.625373387223135e-09
+ ],
+ "gamma_dfa": 0.09624775896372739,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9458943605422974,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 38432.8515625,
+ 89003520.0,
+ 313081504.0,
+ 574038272.0,
+ 717387392.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.1023032909824906e-08,
+ 2.709044100157598e-10,
+ 2.6825267007701825e-10,
+ 2.6804419794856926e-10,
+ 2.6862953528272726e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7511816824699054e-06,
+ 9.751657259471358e-09,
+ 9.615223284242802e-09,
+ 9.612453943930177e-09,
+ 9.618667640154399e-09
+ ],
+ "gamma_dfa": 0.09613665863071219,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9508092403411865,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 38471.12890625,
+ 89306096.0,
+ 314023616.0,
+ 575863488.0,
+ 719706496.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.104102740460803e-08,
+ 2.722161940305057e-10,
+ 2.698590240157728e-10,
+ 2.697040091259595e-10,
+ 2.698894441266475e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.731306722125737e-06,
+ 9.717195048608573e-09,
+ 9.582218574166745e-09,
+ 9.579466997422514e-09,
+ 9.585680693646736e-09
+ ],
+ "gamma_dfa": 0.09615167022275273,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.9497017860412598,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 38506.49609375,
+ 89593104.0,
+ 314968672.0,
+ 577511168.0,
+ 721761728.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.099763100702148e-08,
+ 2.7151769721456276e-10,
+ 2.698610224172171e-10,
+ 2.6943663966605413e-10,
+ 2.6953861365086595e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.73057457889081e-06,
+ 9.698882585951196e-09,
+ 9.564125491579034e-09,
+ 9.561379243905321e-09,
+ 9.567577841096409e-09
+ ],
+ "gamma_dfa": 0.09604650201799814,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.948227882385254,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 38536.46875,
+ 89827632.0,
+ 315715328.0,
+ 578913664.0,
+ 723505408.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.074277709127273e-08,
+ 2.7221166987168033e-10,
+ 2.7026783588901537e-10,
+ 2.700663026544703e-10,
+ 2.7004307123768e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.727413175307447e-06,
+ 9.684548274435656e-09,
+ 9.549998125635284e-09,
+ 9.547248325247892e-09,
+ 9.553437152476363e-09
+ ],
+ "gamma_dfa": 0.09602321147394832,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9482835531234741,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 38560.86328125,
+ 90036944.0,
+ 316345728.0,
+ 580143808.0,
+ 725043392.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.10075821580358e-08,
+ 2.70407807256845e-10,
+ 2.6787719265009e-10,
+ 2.677959520802631e-10,
+ 2.679190480581184e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7208343453821726e-06,
+ 9.672045386821537e-09,
+ 9.538242196072133e-09,
+ 9.535500389290519e-09,
+ 9.541698986481606e-09
+ ],
+ "gamma_dfa": 0.09616725159867201,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9490463733673096,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 38581.62890625,
+ 90197056.0,
+ 316901888.0,
+ 581085248.0,
+ 726214080.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.062888064344406e-08,
+ 2.7050772732906125e-10,
+ 2.680498045748436e-10,
+ 2.6770730077174676e-10,
+ 2.6768456895531756e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7148839762958232e-06,
+ 9.659022026653474e-09,
+ 9.525311206459719e-09,
+ 9.522568511499685e-09,
+ 9.528759115084995e-09
+ ],
+ "gamma_dfa": 0.09604255046724575,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9472681283950806,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 38598.60546875,
+ 90331488.0,
+ 317399072.0,
+ 581959360.0,
+ 727306816.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.070089059699967e-08,
+ 2.706254109696715e-10,
+ 2.6912555517455417e-10,
+ 2.687201572371123e-10,
+ 2.686441624710767e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7157270778843667e-06,
+ 9.650602983413137e-09,
+ 9.516874399650987e-09,
+ 9.514130816512534e-09,
+ 9.520310761956807e-09
+ ],
+ "gamma_dfa": 0.09604466614109697,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.9475460052490234,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 38612.046875,
+ 90438432.0,
+ 317761152.0,
+ 582634240.0,
+ 728132928.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.071476039120171e-08,
+ 2.693741063541921e-10,
+ 2.670912935265335e-10,
+ 2.670463572496118e-10,
+ 2.6704632949403617e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7161215712112607e-06,
+ 9.646365484172748e-09,
+ 9.512908683007026e-09,
+ 9.51017486983119e-09,
+ 9.516351262561784e-09
+ ],
+ "gamma_dfa": 0.09614986698579742,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.947176218032837,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 38622.60546875,
+ 90514344.0,
+ 318023872.0,
+ 583138880.0,
+ 728758976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0669719087181875e-08,
+ 2.7007937553058525e-10,
+ 2.6770055616687216e-10,
+ 2.676309729388038e-10,
+ 2.678066102212995e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.715124537644442e-06,
+ 9.639773423941733e-09,
+ 9.506337939058085e-09,
+ 9.503595244098051e-09,
+ 9.509768084114967e-09
+ ],
+ "gamma_dfa": 0.09608547511743382,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9474897384643555,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 38631.16796875,
+ 90589928.0,
+ 318254208.0,
+ 583549632.0,
+ 729273152.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0695071251993795e-08,
+ 2.704435009270867e-10,
+ 2.6853075318911124e-10,
+ 2.682237765228024e-10,
+ 2.6814858666845964e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7134594802191714e-06,
+ 9.634878672670766e-09,
+ 9.501549769197482e-09,
+ 9.498809738772707e-09,
+ 9.504978137897524e-09
+ ],
+ "gamma_dfa": 0.0960953844114556,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9472770690917969,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 38638.31640625,
+ 90643280.0,
+ 318415136.0,
+ 583858560.0,
+ 729656640.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.078240761235975e-08,
+ 2.6967122979115743e-10,
+ 2.669718335290838e-10,
+ 2.6691132637424175e-10,
+ 2.6697202781811313e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.711297611313057e-06,
+ 9.631804687160184e-09,
+ 9.498727138179675e-09,
+ 9.495988884111739e-09,
+ 9.502159947771815e-09
+ ],
+ "gamma_dfa": 0.09613717825050117,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.94759202003479,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 38642.26171875,
+ 90677816.0,
+ 318520992.0,
+ 584046976.0,
+ 729889984.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.069002995128358e-08,
+ 2.6985705336990407e-10,
+ 2.6735619274020905e-10,
+ 2.671637633344659e-10,
+ 2.6708837919109385e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7110704650112893e-06,
+ 9.629748554118578e-09,
+ 9.496692321420142e-09,
+ 9.493953179173786e-09,
+ 9.500122466477023e-09
+ ],
+ "gamma_dfa": 0.09612438916155952,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9474642276763916,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 38644.16015625,
+ 90695256.0,
+ 318576288.0,
+ 584137856.0,
+ 730003328.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.070784681038276e-08,
+ 2.6936791686082984e-10,
+ 2.671484977678773e-10,
+ 2.668835430430505e-10,
+ 2.671484977678773e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.710563421715051e-06,
+ 9.628578823139833e-09,
+ 9.495578545681838e-09,
+ 9.492838515257063e-09,
+ 9.499009578917139e-09
+ ],
+ "gamma_dfa": 0.09612188487153617,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.9476267099380493,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 38646.0625,
+ 90710400.0,
+ 318627968.0,
+ 584229760.0,
+ 730119232.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.075278863841959e-08,
+ 2.692224221334527e-10,
+ 2.671664001141494e-10,
+ 2.669355292361786e-10,
+ 2.6700280875147087e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7103426418761956e-06,
+ 9.62763913037179e-09,
+ 9.494667274623225e-09,
+ 9.49192813237687e-09,
+ 9.498098307858527e-09
+ ],
+ "gamma_dfa": 0.09612667236069683,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9476723670959473,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 38646.953125,
+ 90717408.0,
+ 318651872.0,
+ 584275776.0,
+ 730176960.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.076975639894954e-08,
+ 2.691815659261465e-10,
+ 2.671429466527542e-10,
+ 2.669321430559535e-10,
+ 2.669318377446217e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7102296371595003e-06,
+ 9.62716750763093e-09,
+ 9.494214303629178e-09,
+ 9.491475161382823e-09,
+ 9.4976462250429e-09
+ ],
+ "gamma_dfa": 0.09612801273397054,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9476864337921143,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 38646.98046875,
+ 90717592.0,
+ 318652416.0,
+ 584276736.0,
+ 730178112.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.076372033840926e-08,
+ 2.692036038531853e-10,
+ 2.6715371581609304e-10,
+ 2.669119369969053e-10,
+ 2.6695023969125486e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.710211447265465e-06,
+ 9.627171060344608e-09,
+ 9.494216968164437e-09,
+ 9.491476937739662e-09,
+ 9.497648001399739e-09
+ ],
+ "gamma_dfa": 0.09612751441454748,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.947685956954956,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file