{ "config": { "output_dir": "results/snapshot_evolution_v2", "epochs": 100, "lr": 0.001, "wd": 0.01, "seed": 42, "depth": 4, "d_hidden": 256, "log_every": 1 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652 ], "bp_grad_norms_per_sample_med": [ 0.0010068593546748161, 0.000997236929833889, 0.0009934091940522194, 0.0009870644425973296, 0.0009829498594626784 ], "bp_grad_norms_F": [ 0.03544403985142708, 0.03507080301642418, 0.03477022796869278, 0.03443896397948265, 0.03407429903745651 ], "gamma_dfa": NaN, "acc_eval": 0.115234375, "loss_eval": 2.383650302886963, "epoch": 0 }, { "hidden_norms": [ 77.06888580322266, 79.12034606933594, 82.7389144897461, 87.31297302246094, 93.80765533447266 ], "bp_grad_norms_per_sample_med": [ 5.941955532762222e-05, 5.619435978587717e-05, 5.499917097040452e-05, 5.5899512517498806e-05, 5.7389137509744614e-05 ], "bp_grad_norms_F": [ 0.0026216788683086634, 0.0023027872666716576, 0.002111479640007019, 0.002080164849758148, 0.0021061261650174856 ], "gamma_dfa": NaN, "acc_eval": 0.3798828125, "loss_eval": 1.6751981973648071, "epoch": 1 }, { "hidden_norms": [ 98.86981201171875, 98.9476089477539, 102.55016326904297, 106.3559341430664, 112.6939697265625 ], "bp_grad_norms_per_sample_med": [ 4.658113539335318e-05, 4.402571721584536e-05, 4.2862800910370424e-05, 4.381770850159228e-05, 4.3870313675142825e-05 ], "bp_grad_norms_F": [ 0.00196655560284853, 0.0018041934818029404, 0.0016866555670276284, 0.0016513779992237687, 0.0016559252981096506 ], "gamma_dfa": NaN, "acc_eval": 0.4541015625, "loss_eval": 1.5228025913238525, "epoch": 2 }, { "hidden_norms": [ 110.40647888183594, 112.07202911376953, 114.70049285888672, 117.17343139648438, 124.54205322265625 ], "bp_grad_norms_per_sample_med": [ 4.4490061554824933e-05, 4.3751915654866025e-05, 4.270448334864341e-05, 4.182140401098877e-05, 4.151134271523915e-05 ], "bp_grad_norms_F": [ 0.0019047901732847095, 0.0017693191766738892, 0.0016821600729599595, 0.0016251102788373828, 0.0015800207620486617 ], "gamma_dfa": NaN, "acc_eval": 0.4697265625, "loss_eval": 1.4416429996490479, "epoch": 3 }, { "hidden_norms": [ 125.09136199951172, 126.65565490722656, 128.4573974609375, 130.39990234375, 138.1091766357422 ], "bp_grad_norms_per_sample_med": [ 4.1048842831514776e-05, 4.0168823034036905e-05, 3.916600326192565e-05, 3.953508348786272e-05, 3.938759255106561e-05 ], "bp_grad_norms_F": [ 0.0017511667683720589, 0.001639657886698842, 0.0015659942291676998, 0.0015107291983440518, 0.0014574137749150395 ], "gamma_dfa": NaN, "acc_eval": 0.50390625, "loss_eval": 1.3718887567520142, "epoch": 4 }, { "hidden_norms": [ 139.76705932617188, 139.05606079101562, 139.5422821044922, 141.0078582763672, 148.9493865966797 ], "bp_grad_norms_per_sample_med": [ 3.957379158237018e-05, 4.0101109334500507e-05, 3.9158370782388374e-05, 3.927717261831276e-05, 3.796629243879579e-05 ], "bp_grad_norms_F": [ 0.0017042789841070771, 0.001630594371818006, 0.0015700262738391757, 0.0015037605771794915, 0.0014294973807409406 ], "gamma_dfa": NaN, "acc_eval": 0.498046875, "loss_eval": 1.367867112159729, "epoch": 5 }, { "hidden_norms": [ 147.73207092285156, 148.01638793945312, 148.1798553466797, 149.07754516601562, 156.61810302734375 ], "bp_grad_norms_per_sample_med": [ 3.987981835962273e-05, 3.9670325350016356e-05, 3.970034231315367e-05, 3.8273319660220295e-05, 3.6929654015693814e-05 ], "bp_grad_norms_F": [ 0.0017687880899757147, 0.001693942816928029, 0.0016310750506818295, 0.0015193652361631393, 0.0014129421906545758 ], "gamma_dfa": NaN, "acc_eval": 0.5234375, "loss_eval": 1.3461639881134033, "epoch": 6 }, { "hidden_norms": [ 159.30731201171875, 158.4180450439453, 158.36903381347656, 158.61819458007812, 165.9392547607422 ], "bp_grad_norms_per_sample_med": [ 3.744649075088091e-05, 3.805281448876485e-05, 3.727989678736776e-05, 3.5814937291434035e-05, 3.422912777750753e-05 ], "bp_grad_norms_F": [ 0.0017357978504151106, 0.0016663926653563976, 0.0016097063198685646, 0.0014966910239309072, 0.001379394088871777 ], "gamma_dfa": NaN, "acc_eval": 0.5283203125, "loss_eval": 1.3227663040161133, "epoch": 7 }, { "hidden_norms": [ 171.02230834960938, 169.76348876953125, 168.44949340820312, 168.26429748535156, 176.89520263671875 ], "bp_grad_norms_per_sample_med": [ 3.716369246831164e-05, 3.8349648093571886e-05, 3.801397542702034e-05, 3.6082456063013524e-05, 3.359258334967308e-05 ], "bp_grad_norms_F": [ 0.0016445739893242717, 0.001604317338205874, 0.0015634173760190606, 0.0014586447505280375, 0.0013399318559095263 ], "gamma_dfa": NaN, "acc_eval": 0.541015625, "loss_eval": 1.2933616638183594, "epoch": 8 }, { "hidden_norms": [ 177.41796875, 177.29603576660156, 175.89486694335938, 175.0777587890625, 181.38400268554688 ], "bp_grad_norms_per_sample_med": [ 3.602267679525539e-05, 3.6796918720938265e-05, 3.648500933195464e-05, 3.566688246792182e-05, 3.4070406400132924e-05 ], "bp_grad_norms_F": [ 0.0015903833555057645, 0.0015696624759584665, 0.0015270623844116926, 0.0014402325032278895, 0.0013178731314837933 ], "gamma_dfa": NaN, "acc_eval": 0.5478515625, "loss_eval": 1.2806801795959473, "epoch": 9 }, { "hidden_norms": [ 187.4056854248047, 186.72698974609375, 186.21583557128906, 185.0518035888672, 193.2371063232422 ], "bp_grad_norms_per_sample_med": [ 3.3276784961344674e-05, 3.436602492001839e-05, 3.432494486332871e-05, 3.371347702341154e-05, 3.1834206311032176e-05 ], "bp_grad_norms_F": [ 0.0014970082556828856, 0.0014613966923207045, 0.001435543643310666, 0.001374539453536272, 0.0012561712646856904 ], "gamma_dfa": NaN, "acc_eval": 0.56640625, "loss_eval": 1.2740942239761353, "epoch": 10 }, { "hidden_norms": [ 194.4965057373047, 191.25531005859375, 189.80703735351562, 188.18850708007812, 195.7776336669922 ], "bp_grad_norms_per_sample_med": [ 3.298965748399496e-05, 3.40789083566051e-05, 3.381206624908373e-05, 3.3352327591273934e-05, 3.1442876206710935e-05 ], "bp_grad_norms_F": [ 0.0015152172418311238, 0.001501554623246193, 0.0014814225723966956, 0.001403055852279067, 0.001272345893085003 ], "gamma_dfa": NaN, "acc_eval": 0.560546875, "loss_eval": 1.265188455581665, "epoch": 11 }, { "hidden_norms": [ 200.5504913330078, 197.28366088867188, 195.27011108398438, 192.64669799804688, 200.8507843017578 ], "bp_grad_norms_per_sample_med": [ 3.453825775068253e-05, 3.5414250305620953e-05, 3.575523442123085e-05, 3.455601472523995e-05, 3.2858857593964785e-05 ], "bp_grad_norms_F": [ 0.001518857548944652, 0.001502488274127245, 0.0014838415663689375, 0.001404650043696165, 0.0012748484732583165 ], "gamma_dfa": NaN, "acc_eval": 0.5458984375, "loss_eval": 1.2733395099639893, "epoch": 12 }, { "hidden_norms": [ 207.21469116210938, 202.24969482421875, 198.8241424560547, 197.5497283935547, 207.32147216796875 ], "bp_grad_norms_per_sample_med": [ 3.2123080018209293e-05, 3.345572258695029e-05, 3.3888838515849784e-05, 3.344774086144753e-05, 3.095310239586979e-05 ], "bp_grad_norms_F": [ 0.0014620382571592927, 0.0014708929229527712, 0.0014657732099294662, 0.0013834136771038175, 0.0012381445849314332 ], "gamma_dfa": NaN, "acc_eval": 0.56640625, "loss_eval": 1.2357412576675415, "epoch": 13 }, { "hidden_norms": [ 214.6268310546875, 208.3655242919922, 205.5032501220703, 202.8442840576172, 211.64646911621094 ], "bp_grad_norms_per_sample_med": [ 3.207657573511824e-05, 3.362155257491395e-05, 3.38435493176803e-05, 3.330525942146778e-05, 3.142434434266761e-05 ], "bp_grad_norms_F": [ 0.0014900992391631007, 0.0015044353203848004, 0.001489310641773045, 0.0014063691487535834, 0.0012448005145415664 ], "gamma_dfa": NaN, "acc_eval": 0.56640625, "loss_eval": 1.2451550960540771, "epoch": 14 }, { "hidden_norms": [ 220.40109252929688, 213.53439331054688, 209.3384552001953, 206.62062072753906, 213.82391357421875 ], "bp_grad_norms_per_sample_med": [ 3.227095294278115e-05, 3.415472019696608e-05, 3.4918764868052676e-05, 3.409514465602115e-05, 3.082074908888899e-05 ], "bp_grad_norms_F": [ 0.0015189005061984062, 0.001544533297419548, 0.0015320393722504377, 0.0014468894805759192, 0.0012609416153281927 ], "gamma_dfa": NaN, "acc_eval": 0.564453125, "loss_eval": 1.248854398727417, "epoch": 15 }, { "hidden_norms": [ 226.32350158691406, 219.70506286621094, 213.84132385253906, 210.67050170898438, 219.11776733398438 ], "bp_grad_norms_per_sample_med": [ 3.360298796906136e-05, 3.4720324038062245e-05, 3.473780452623032e-05, 3.412307341932319e-05, 3.0327399144880474e-05 ], "bp_grad_norms_F": [ 0.0014919604873284698, 0.0015073713148012757, 0.001499581034295261, 0.001411686884239316, 0.0012323390692472458 ], "gamma_dfa": NaN, "acc_eval": 0.57421875, "loss_eval": 1.2207037210464478, "epoch": 16 }, { "hidden_norms": [ 230.78538513183594, 223.432373046875, 216.73037719726562, 212.86383056640625, 220.8701171875 ], "bp_grad_norms_per_sample_med": [ 3.253064278396778e-05, 3.3939610148081556e-05, 3.490943709039129e-05, 3.4084565413650125e-05, 3.0307599445222877e-05 ], "bp_grad_norms_F": [ 0.0015068502398207784, 0.0015421892749145627, 0.0015326113207265735, 0.0014369196724146605, 0.0012492147507146 ], "gamma_dfa": NaN, "acc_eval": 0.560546875, "loss_eval": 1.216906189918518, "epoch": 17 }, { "hidden_norms": [ 234.5084991455078, 225.73875427246094, 219.08822631835938, 214.42320251464844, 222.92369079589844 ], "bp_grad_norms_per_sample_med": [ 3.451363227213733e-05, 3.6047003959538415e-05, 3.654924512375146e-05, 3.617065158323385e-05, 3.275999551988207e-05 ], "bp_grad_norms_F": [ 0.001566705177538097, 0.0015968933003023267, 0.0015981856267899275, 0.0014931216137483716, 0.0012800253462046385 ], "gamma_dfa": NaN, "acc_eval": 0.5556640625, "loss_eval": 1.2483153343200684, "epoch": 18 }, { "hidden_norms": [ 238.0281219482422, 229.677734375, 223.0265350341797, 217.872314453125, 225.45947265625 ], "bp_grad_norms_per_sample_med": [ 3.4922632039524615e-05, 3.6500507121672854e-05, 3.762893902603537e-05, 3.615105015342124e-05, 3.2680742151569575e-05 ], "bp_grad_norms_F": [ 0.0015319561352953315, 0.001577642629854381, 0.001574998372234404, 0.0014754259027540684, 0.0012637749314308167 ], "gamma_dfa": NaN, "acc_eval": 0.5576171875, "loss_eval": 1.2469550371170044, "epoch": 19 }, { "hidden_norms": [ 241.45298767089844, 233.28753662109375, 226.9265899658203, 222.43453979492188, 229.83859252929688 ], "bp_grad_norms_per_sample_med": [ 3.368386751390062e-05, 3.570445187506266e-05, 3.622082658694126e-05, 3.5024619137402624e-05, 3.180970816174522e-05 ], "bp_grad_norms_F": [ 0.0015120706520974636, 0.0015433274675160646, 0.0015402185963466763, 0.0014465245185419917, 0.001252179266884923 ], "gamma_dfa": NaN, "acc_eval": 0.5634765625, "loss_eval": 1.2113828659057617, "epoch": 20 }, { "hidden_norms": [ 246.53602600097656, 236.25527954101562, 231.07940673828125, 227.7357940673828, 235.99017333984375 ], "bp_grad_norms_per_sample_med": [ 3.2015348551794887e-05, 3.388321783859283e-05, 3.521092003211379e-05, 3.46749002346769e-05, 3.079533780692145e-05 ], "bp_grad_norms_F": [ 0.0014757646713405848, 0.001517578144557774, 0.0015156606677919626, 0.00144051609095186, 0.0012491638772189617 ], "gamma_dfa": NaN, "acc_eval": 0.576171875, "loss_eval": 1.2042850255966187, "epoch": 21 }, { "hidden_norms": [ 250.74209594726562, 241.11993408203125, 232.76829528808594, 228.410400390625, 237.100341796875 ], "bp_grad_norms_per_sample_med": [ 3.173810910084285e-05, 3.328004459035583e-05, 3.405071402085014e-05, 3.34872274834197e-05, 3.07901827909518e-05 ], "bp_grad_norms_F": [ 0.0014801323413848877, 0.0015176001470535994, 0.0015198889886960387, 0.0014302636263892055, 0.001232756651006639 ], "gamma_dfa": NaN, "acc_eval": 0.587890625, "loss_eval": 1.1819555759429932, "epoch": 22 }, { "hidden_norms": [ 251.96310424804688, 242.98260498046875, 235.83056640625, 229.86978149414062, 238.271240234375 ], "bp_grad_norms_per_sample_med": [ 3.078249574173242e-05, 3.301461765659042e-05, 3.3559550502104685e-05, 3.2682331948308274e-05, 2.9418402846204117e-05 ], "bp_grad_norms_F": [ 0.00149905972648412, 0.0015357647789642215, 0.0015457755653187633, 0.0014610268408432603, 0.0012446421897038817 ], "gamma_dfa": NaN, "acc_eval": 0.5732421875, "loss_eval": 1.1770297288894653, "epoch": 23 }, { "hidden_norms": [ 255.878662109375, 244.79376220703125, 236.5006561279297, 233.29434204101562, 239.50732421875 ], "bp_grad_norms_per_sample_med": [ 3.191530049662106e-05, 3.370656486367807e-05, 3.539594035828486e-05, 3.486185596557334e-05, 3.131559424218722e-05 ], "bp_grad_norms_F": [ 0.001507170731201768, 0.0015490618534386158, 0.0015714912442490458, 0.0014840371441096067, 0.0012607484823092818 ], "gamma_dfa": NaN, "acc_eval": 0.572265625, "loss_eval": 1.2011631727218628, "epoch": 24 }, { "hidden_norms": [ 256.66448974609375, 244.18772888183594, 236.46058654785156, 231.88583374023438, 238.06246948242188 ], "bp_grad_norms_per_sample_med": [ 3.2962809200398624e-05, 3.441200897214003e-05, 3.570063927327283e-05, 3.488562651909888e-05, 3.0770879675401375e-05 ], "bp_grad_norms_F": [ 0.0015825299778953195, 0.0016350955702364445, 0.0016404123743996024, 0.0015316286589950323, 0.0012829666957259178 ], "gamma_dfa": NaN, "acc_eval": 0.5703125, "loss_eval": 1.192138433456421, "epoch": 25 }, { "hidden_norms": [ 259.5942687988281, 247.43173217773438, 239.85533142089844, 233.21835327148438, 241.53346252441406 ], "bp_grad_norms_per_sample_med": [ 3.1691903132013977e-05, 3.34988217218779e-05, 3.45351618307177e-05, 3.441058288444765e-05, 3.0752617021789774e-05 ], "bp_grad_norms_F": [ 0.0015797498635947704, 0.0016322932206094265, 0.001641901326365769, 0.0015325341373682022, 0.0012732355389744043 ], "gamma_dfa": NaN, "acc_eval": 0.5791015625, "loss_eval": 1.1775751113891602, "epoch": 26 }, { "hidden_norms": [ 260.6902770996094, 249.26528930664062, 240.86239624023438, 235.91477966308594, 242.1553497314453 ], "bp_grad_norms_per_sample_med": [ 3.32598174281884e-05, 3.471180752967484e-05, 3.609888517530635e-05, 3.496996214380488e-05, 3.091244798270054e-05 ], "bp_grad_norms_F": [ 0.0015408779727295041, 0.001589508610777557, 0.0016157848294824362, 0.0015165223740041256, 0.0012689991854131222 ], "gamma_dfa": NaN, "acc_eval": 0.5859375, "loss_eval": 1.1941479444503784, "epoch": 27 }, { "hidden_norms": [ 265.0726623535156, 253.6020050048828, 244.876953125, 239.7056427001953, 248.2157440185547 ], "bp_grad_norms_per_sample_med": [ 3.255613773944788e-05, 3.457435013842769e-05, 3.5964570997748524e-05, 3.529110108502209e-05, 3.089939127676189e-05 ], "bp_grad_norms_F": [ 0.001513357157818973, 0.0015594394644722342, 0.0015772230690345168, 0.001489063142798841, 0.0012491336092352867 ], "gamma_dfa": NaN, "acc_eval": 0.5810546875, "loss_eval": 1.1790356636047363, "epoch": 28 }, { "hidden_norms": [ 266.9394836425781, 253.8067169189453, 243.13002014160156, 236.81365966796875, 245.42434692382812 ], "bp_grad_norms_per_sample_med": [ 3.378500332473777e-05, 3.5516346542863175e-05, 3.742165063158609e-05, 3.6865043512079865e-05, 3.170729542034678e-05 ], "bp_grad_norms_F": [ 0.0015557212755084038, 0.0016067115357145667, 0.001632526982575655, 0.0015416526002809405, 0.0012708577560260892 ], "gamma_dfa": NaN, "acc_eval": 0.5888671875, "loss_eval": 1.1785690784454346, "epoch": 29 }, { "hidden_norms": [ 271.3736572265625, 257.6708984375, 246.3377685546875, 240.7875213623047, 248.55162048339844 ], "bp_grad_norms_per_sample_med": [ 3.2452040613861755e-05, 3.456772174104117e-05, 3.550515975803137e-05, 3.530189496814273e-05, 3.098960587522015e-05 ], "bp_grad_norms_F": [ 0.0015420741401612759, 0.0016120158834382892, 0.0016289768973365426, 0.0015373170608654618, 0.0012695658951997757 ], "gamma_dfa": NaN, "acc_eval": 0.57421875, "loss_eval": 1.1686367988586426, "epoch": 30 }, { "hidden_norms": [ 270.6155090332031, 256.5137634277344, 246.4404296875, 238.71493530273438, 245.14651489257812 ], "bp_grad_norms_per_sample_med": [ 3.4225693525513634e-05, 3.6208981327945367e-05, 3.771808042074554e-05, 3.671547892736271e-05, 3.175914389430545e-05 ], "bp_grad_norms_F": [ 0.0016278985422104597, 0.00169221474789083, 0.0017131771892309189, 0.0016123101813718677, 0.001308745937421918 ], "gamma_dfa": NaN, "acc_eval": 0.572265625, "loss_eval": 1.1706045866012573, "epoch": 31 }, { "hidden_norms": [ 271.2703552246094, 258.5479431152344, 247.48568725585938, 241.0449676513672, 248.61419677734375 ], "bp_grad_norms_per_sample_med": [ 3.370125705259852e-05, 3.563391510397196e-05, 3.776583253056742e-05, 3.622193253249861e-05, 3.1177536584436893e-05 ], "bp_grad_norms_F": [ 0.001631051884032786, 0.0016799280419945717, 0.0016939701745286584, 0.001596588990651071, 0.0012989162933081388 ], "gamma_dfa": NaN, "acc_eval": 0.576171875, "loss_eval": 1.1757416725158691, "epoch": 32 }, { "hidden_norms": [ 271.5987854003906, 257.3157043457031, 247.04425048828125, 239.22933959960938, 247.08534240722656 ], "bp_grad_norms_per_sample_med": [ 3.276485949754715e-05, 3.4356282412773e-05, 3.570897752069868e-05, 3.5391843994148076e-05, 3.004215977853164e-05 ], "bp_grad_norms_F": [ 0.0015858211554586887, 0.0016445693327113986, 0.0016775003168731928, 0.0015801271656528115, 0.0012829708866775036 ], "gamma_dfa": NaN, "acc_eval": 0.5947265625, "loss_eval": 1.1316245794296265, "epoch": 33 }, { "hidden_norms": [ 276.85565185546875, 262.14959716796875, 248.80125427246094, 239.6945037841797, 246.55982971191406 ], "bp_grad_norms_per_sample_med": [ 3.424682654440403e-05, 3.617212496465072e-05, 3.731884135049768e-05, 3.583814759622328e-05, 3.1317249522544444e-05 ], "bp_grad_norms_F": [ 0.001694253645837307, 0.0017545269802212715, 0.0017868074355646968, 0.0016729168128222227, 0.0013285611057654023 ], "gamma_dfa": NaN, "acc_eval": 0.599609375, "loss_eval": 1.1637687683105469, "epoch": 34 }, { "hidden_norms": [ 274.4824523925781, 260.23223876953125, 249.41390991210938, 242.22657775878906, 248.33303833007812 ], "bp_grad_norms_per_sample_med": [ 3.4118878829758614e-05, 3.6190944229019806e-05, 3.7162455555517226e-05, 3.6398294469108805e-05, 3.1276995287043974e-05 ], "bp_grad_norms_F": [ 0.0016947221010923386, 0.0017584856832399964, 0.0017846780829131603, 0.0016663862625136971, 0.0013457784662023187 ], "gamma_dfa": NaN, "acc_eval": 0.5830078125, "loss_eval": 1.1625440120697021, "epoch": 35 }, { "hidden_norms": [ 279.3048095703125, 263.830810546875, 250.07839965820312, 242.9677276611328, 248.742431640625 ], "bp_grad_norms_per_sample_med": [ 3.378376641194336e-05, 3.623673183028586e-05, 3.8036723708501086e-05, 3.8026879337849095e-05, 3.20856343023479e-05 ], "bp_grad_norms_F": [ 0.0016582749085500836, 0.001725532696582377, 0.0017548021860420704, 0.0016622358234599233, 0.0013314742827787995 ], "gamma_dfa": NaN, "acc_eval": 0.58203125, "loss_eval": 1.1663323640823364, "epoch": 36 }, { "hidden_norms": [ 277.88153076171875, 263.3263244628906, 254.0471954345703, 246.00294494628906, 251.6592559814453 ], "bp_grad_norms_per_sample_med": [ 3.402382935746573e-05, 3.644815296866e-05, 3.812061549979262e-05, 3.8299189327517524e-05, 3.244871550123207e-05 ], "bp_grad_norms_F": [ 0.0016575837507843971, 0.001726161572150886, 0.0017651193775236607, 0.001658888068050146, 0.001325216144323349 ], "gamma_dfa": NaN, "acc_eval": 0.5849609375, "loss_eval": 1.1578618288040161, "epoch": 37 }, { "hidden_norms": [ 278.96038818359375, 264.09832763671875, 252.11532592773438, 243.7300567626953, 250.29537963867188 ], "bp_grad_norms_per_sample_med": [ 3.398891203687526e-05, 3.60828016710002e-05, 3.8209349440876395e-05, 3.6874149373034015e-05, 3.130899858660996e-05 ], "bp_grad_norms_F": [ 0.0016938851913437247, 0.0017578925471752882, 0.0017999019473791122, 0.0016839306335896254, 0.0013463495997712016 ], "gamma_dfa": NaN, "acc_eval": 0.59375, "loss_eval": 1.1660709381103516, "epoch": 38 }, { "hidden_norms": [ 279.11102294921875, 262.8247375488281, 250.32635498046875, 241.73477172851562, 246.8911590576172 ], "bp_grad_norms_per_sample_med": [ 3.476023630355485e-05, 3.673156606964767e-05, 3.8200654671527445e-05, 3.745179856196046e-05, 3.111823389190249e-05 ], "bp_grad_norms_F": [ 0.0017367384862154722, 0.001807119813747704, 0.0018404393922537565, 0.0017188042402267456, 0.0013523433590307832 ], "gamma_dfa": NaN, "acc_eval": 0.58984375, "loss_eval": 1.1548914909362793, "epoch": 39 }, { "hidden_norms": [ 278.79083251953125, 263.49237060546875, 252.0679931640625, 243.65948486328125, 249.34564208984375 ], "bp_grad_norms_per_sample_med": [ 3.3709933632053435e-05, 3.595885937102139e-05, 3.795271186390892e-05, 3.70899579138495e-05, 3.1362116715172306e-05 ], "bp_grad_norms_F": [ 0.0017184949247166514, 0.0017862631939351559, 0.0018348938319832087, 0.0017180118011310697, 0.0013606568099930882 ], "gamma_dfa": NaN, "acc_eval": 0.591796875, "loss_eval": 1.159794569015503, "epoch": 40 }, { "hidden_norms": [ 281.3595886230469, 263.4467468261719, 250.73536682128906, 243.140380859375, 247.22425842285156 ], "bp_grad_norms_per_sample_med": [ 3.411353100091219e-05, 3.656598346424289e-05, 3.8585232687182724e-05, 3.752345946850255e-05, 3.1474613933824e-05 ], "bp_grad_norms_F": [ 0.0017623946769163013, 0.0018276257906109095, 0.0018694576574489474, 0.0017436364432796836, 0.0013814391568303108 ], "gamma_dfa": NaN, "acc_eval": 0.5888671875, "loss_eval": 1.153226375579834, "epoch": 41 }, { "hidden_norms": [ 279.79888916015625, 263.5989685058594, 252.2397918701172, 243.49703979492188, 248.86973571777344 ], "bp_grad_norms_per_sample_med": [ 3.528413435560651e-05, 3.805026790359989e-05, 4.0152310248231515e-05, 3.962377377320081e-05, 3.250985173508525e-05 ], "bp_grad_norms_F": [ 0.0017320383340120316, 0.0018105976050719619, 0.001847731531597674, 0.0017405269900336862, 0.0013762396993115544 ], "gamma_dfa": NaN, "acc_eval": 0.58984375, "loss_eval": 1.1387929916381836, "epoch": 42 }, { "hidden_norms": [ 280.80633544921875, 263.2684326171875, 251.36338806152344, 242.25201416015625, 245.46954345703125 ], "bp_grad_norms_per_sample_med": [ 3.463789835222997e-05, 3.694587940117344e-05, 3.909278166247532e-05, 3.8173999200807884e-05, 3.152083809254691e-05 ], "bp_grad_norms_F": [ 0.001763346022926271, 0.0018382675480097532, 0.0018745084526017308, 0.0017674838891252875, 0.0013920797500759363 ], "gamma_dfa": NaN, "acc_eval": 0.5986328125, "loss_eval": 1.1115086078643799, "epoch": 43 }, { "hidden_norms": [ 278.4877624511719, 261.4671630859375, 247.66079711914062, 240.21690368652344, 244.1111602783203 ], "bp_grad_norms_per_sample_med": [ 3.559369361028075e-05, 3.895946065313183e-05, 4.048463233630173e-05, 3.892362292390317e-05, 3.229418143746443e-05 ], "bp_grad_norms_F": [ 0.0018469772767275572, 0.0019197544315829873, 0.001963041489943862, 0.0018302135867998004, 0.001429378753527999 ], "gamma_dfa": NaN, "acc_eval": 0.6025390625, "loss_eval": 1.16768217086792, "epoch": 44 }, { "hidden_norms": [ 280.8171691894531, 263.16705322265625, 251.45835876464844, 243.88563537597656, 246.92945861816406 ], "bp_grad_norms_per_sample_med": [ 3.3486583561170846e-05, 3.533214839990251e-05, 3.789112452068366e-05, 3.651758743217215e-05, 3.081141403526999e-05 ], "bp_grad_norms_F": [ 0.0017694556154310703, 0.0018461478175595403, 0.0018877091351896524, 0.001781664090231061, 0.0014001834206283092 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1236202716827393, "epoch": 45 }, { "hidden_norms": [ 280.0203552246094, 261.3996887207031, 248.5751953125, 240.40728759765625, 243.84178161621094 ], "bp_grad_norms_per_sample_med": [ 3.66695094271563e-05, 3.912827742169611e-05, 4.0782215364743024e-05, 3.97856165363919e-05, 3.258495053160004e-05 ], "bp_grad_norms_F": [ 0.0018954386468976736, 0.0019765326287597418, 0.0020179273560643196, 0.0018787897424772382, 0.0014408754650503397 ], "gamma_dfa": NaN, "acc_eval": 0.5947265625, "loss_eval": 1.142503261566162, "epoch": 46 }, { "hidden_norms": [ 278.37445068359375, 260.7147521972656, 247.63418579101562, 239.64564514160156, 241.75396728515625 ], "bp_grad_norms_per_sample_med": [ 3.824803570751101e-05, 4.062152947881259e-05, 4.1070070437854156e-05, 4.01996003347449e-05, 3.288290827185847e-05 ], "bp_grad_norms_F": [ 0.001872657099738717, 0.0019627343863248825, 0.002008425537496805, 0.0018816223600879312, 0.001456336583942175 ], "gamma_dfa": NaN, "acc_eval": 0.6064453125, "loss_eval": 1.137413740158081, "epoch": 47 }, { "hidden_norms": [ 281.14813232421875, 263.6340637207031, 250.13082885742188, 242.0965118408203, 244.81060791015625 ], "bp_grad_norms_per_sample_med": [ 3.531872062012553e-05, 3.7883237382629886e-05, 4.0227863792097196e-05, 3.96844552597031e-05, 3.296942304586992e-05 ], "bp_grad_norms_F": [ 0.0018434273079037666, 0.0019304269226267934, 0.0019746439065784216, 0.0018603875068947673, 0.0014465745771303773 ], "gamma_dfa": NaN, "acc_eval": 0.6025390625, "loss_eval": 1.1396205425262451, "epoch": 48 }, { "hidden_norms": [ 281.31280517578125, 262.5829772949219, 247.9232940673828, 239.8461456298828, 242.20977783203125 ], "bp_grad_norms_per_sample_med": [ 3.71285859728232e-05, 3.963968629250303e-05, 4.135111521463841e-05, 4.0518349123885855e-05, 3.323471173644066e-05 ], "bp_grad_norms_F": [ 0.00189371092710644, 0.0019808171782642603, 0.002019244944676757, 0.001904282602481544, 0.0014800610952079296 ], "gamma_dfa": NaN, "acc_eval": 0.59375, "loss_eval": 1.1411675214767456, "epoch": 49 }, { "hidden_norms": [ 278.64208984375, 260.1700744628906, 246.7251434326172, 239.43145751953125, 240.350830078125 ], "bp_grad_norms_per_sample_med": [ 3.6054647353012115e-05, 3.858766285702586e-05, 4.05439204769209e-05, 4.046479079988785e-05, 3.3791853638831526e-05 ], "bp_grad_norms_F": [ 0.0018870895728468895, 0.00198533502407372, 0.0020502021070569754, 0.001929490827023983, 0.0014933926286175847 ], "gamma_dfa": NaN, "acc_eval": 0.59375, "loss_eval": 1.1310430765151978, "epoch": 50 }, { "hidden_norms": [ 281.7696533203125, 261.5150451660156, 247.67295837402344, 239.7654266357422, 240.27789306640625 ], "bp_grad_norms_per_sample_med": [ 3.671262675197795e-05, 3.92102992918808e-05, 4.1406125092180446e-05, 4.029196497867815e-05, 3.32514064211864e-05 ], "bp_grad_norms_F": [ 0.001880357856862247, 0.001981948269531131, 0.0020440546795725822, 0.0019350070506334305, 0.0014877711655572057 ], "gamma_dfa": NaN, "acc_eval": 0.60546875, "loss_eval": 1.1188440322875977, "epoch": 51 }, { "hidden_norms": [ 279.01318359375, 259.6091003417969, 244.6603240966797, 235.1455535888672, 237.438232421875 ], "bp_grad_norms_per_sample_med": [ 4.0185608668252826e-05, 4.309232099330984e-05, 4.5118234993424267e-05, 4.371534669189714e-05, 3.5620210837805644e-05 ], "bp_grad_norms_F": [ 0.0020104716531932354, 0.002107330597937107, 0.002167000202462077, 0.0020260754972696304, 0.0015411453787237406 ], "gamma_dfa": NaN, "acc_eval": 0.603515625, "loss_eval": 1.1525764465332031, "epoch": 52 }, { "hidden_norms": [ 278.2245178222656, 257.14617919921875, 243.9732666015625, 234.4013214111328, 236.68521118164062 ], "bp_grad_norms_per_sample_med": [ 3.85418206860777e-05, 4.142443503951654e-05, 4.363177140476182e-05, 4.2996281990781426e-05, 3.424972965149209e-05 ], "bp_grad_norms_F": [ 0.0020445864647626877, 0.002142493613064289, 0.0022005243226885796, 0.002054274780675769, 0.0015541499014943838 ], "gamma_dfa": NaN, "acc_eval": 0.59765625, "loss_eval": 1.162191390991211, "epoch": 53 }, { "hidden_norms": [ 278.7825622558594, 258.4292297363281, 243.01690673828125, 234.15765380859375, 235.1446533203125 ], "bp_grad_norms_per_sample_med": [ 3.855194881907664e-05, 4.1293307731393725e-05, 4.296215047361329e-05, 4.1900369978975505e-05, 3.372962964931503e-05 ], "bp_grad_norms_F": [ 0.002041360829025507, 0.0021457262337207794, 0.0021996963769197464, 0.0020641626324504614, 0.001561368815600872 ], "gamma_dfa": NaN, "acc_eval": 0.6171875, "loss_eval": 1.130479335784912, "epoch": 54 }, { "hidden_norms": [ 275.3794860839844, 256.83026123046875, 242.16006469726562, 231.49655151367188, 232.30279541015625 ], "bp_grad_norms_per_sample_med": [ 4.011294731753878e-05, 4.240096313878894e-05, 4.396942676976323e-05, 4.347893627709709e-05, 3.485888009890914e-05 ], "bp_grad_norms_F": [ 0.0021268154960125685, 0.002230642130598426, 0.0022892621345818043, 0.002145433332771063, 0.0016037407331168652 ], "gamma_dfa": NaN, "acc_eval": 0.6005859375, "loss_eval": 1.1599653959274292, "epoch": 55 }, { "hidden_norms": [ 277.5028076171875, 257.1715087890625, 241.6505584716797, 234.09323120117188, 233.63377380371094 ], "bp_grad_norms_per_sample_med": [ 3.876453047269024e-05, 4.156330396654084e-05, 4.3727923184633255e-05, 4.2131912778131664e-05, 3.510245369398035e-05 ], "bp_grad_norms_F": [ 0.002074806485325098, 0.002173666376620531, 0.002245684852823615, 0.0021073734387755394, 0.0015908328350633383 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.144984245300293, "epoch": 56 }, { "hidden_norms": [ 276.0826416015625, 255.17193603515625, 239.51519775390625, 231.28643798828125, 230.85292053222656 ], "bp_grad_norms_per_sample_med": [ 3.960869798902422e-05, 4.2907246097456664e-05, 4.45116929768119e-05, 4.3612952140392736e-05, 3.500159073155373e-05 ], "bp_grad_norms_F": [ 0.0021277335472404957, 0.0022348251659423113, 0.0022981096990406513, 0.002155488822609186, 0.001618923619389534 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.1534931659698486, "epoch": 57 }, { "hidden_norms": [ 275.6867370605469, 254.65744018554688, 238.1124267578125, 229.36215209960938, 227.90867614746094 ], "bp_grad_norms_per_sample_med": [ 3.966662916354835e-05, 4.33680324931629e-05, 4.5270633563632146e-05, 4.528860517893918e-05, 3.5298704460728914e-05 ], "bp_grad_norms_F": [ 0.002194908680394292, 0.002305977512151003, 0.0023776311427354813, 0.002223761286586523, 0.001651395345106721 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1494864225387573, "epoch": 58 }, { "hidden_norms": [ 274.8414306640625, 253.18215942382812, 238.03150939941406, 228.1765594482422, 229.46058654785156 ], "bp_grad_norms_per_sample_med": [ 4.132632238906808e-05, 4.4773249101126567e-05, 4.6669130824739113e-05, 4.591346441884525e-05, 3.6523833841783926e-05 ], "bp_grad_norms_F": [ 0.0022293017245829105, 0.002341218525543809, 0.002405093051493168, 0.0022504546213895082, 0.0016715668607503176 ], "gamma_dfa": NaN, "acc_eval": 0.5927734375, "loss_eval": 1.1698435544967651, "epoch": 59 }, { "hidden_norms": [ 273.4884338378906, 251.2228240966797, 236.2550048828125, 226.7325439453125, 225.68386840820312 ], "bp_grad_norms_per_sample_med": [ 4.192883352516219e-05, 4.3471976823639125e-05, 4.7195244405884296e-05, 4.490713035920635e-05, 3.646116965683177e-05 ], "bp_grad_norms_F": [ 0.0022312228102236986, 0.002349371323361993, 0.0024164437782019377, 0.002271530916914344, 0.0016918154433369637 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.1560128927230835, "epoch": 60 }, { "hidden_norms": [ 273.4084777832031, 250.5165557861328, 236.19557189941406, 227.0643768310547, 226.594970703125 ], "bp_grad_norms_per_sample_med": [ 4.2211744585074484e-05, 4.488111881073564e-05, 4.760283627547324e-05, 4.589638047036715e-05, 3.658623973024078e-05 ], "bp_grad_norms_F": [ 0.0022313676308840513, 0.002337696962058544, 0.0024093035608530045, 0.002264693146571517, 0.0016880000475794077 ], "gamma_dfa": NaN, "acc_eval": 0.6044921875, "loss_eval": 1.1498074531555176, "epoch": 61 }, { "hidden_norms": [ 273.1318664550781, 249.35223388671875, 234.15737915039062, 223.48074340820312, 223.0059356689453 ], "bp_grad_norms_per_sample_med": [ 4.4729218643624336e-05, 4.768320650327951e-05, 4.822494520340115e-05, 4.791786341229454e-05, 3.7625926779583097e-05 ], "bp_grad_norms_F": [ 0.0023362624924629927, 0.0024679312482476234, 0.0025367215275764465, 0.0023599599953740835, 0.0017239096341654658 ], "gamma_dfa": NaN, "acc_eval": 0.603515625, "loss_eval": 1.1377537250518799, "epoch": 62 }, { "hidden_norms": [ 270.9543762207031, 249.6943817138672, 234.0796356201172, 223.80093383789062, 222.75062561035156 ], "bp_grad_norms_per_sample_med": [ 4.4321575842332095e-05, 4.7786033974261954e-05, 4.9388974730391055e-05, 4.749266372527927e-05, 3.7502803024835885e-05 ], "bp_grad_norms_F": [ 0.0023458057548850775, 0.0024719720240682364, 0.0025427823420614004, 0.0023789280094206333, 0.0017488099401816726 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.1472076177597046, "epoch": 63 }, { "hidden_norms": [ 270.6864318847656, 249.71315002441406, 233.9838409423828, 223.17515563964844, 222.17759704589844 ], "bp_grad_norms_per_sample_med": [ 4.36245281889569e-05, 4.725098915514536e-05, 4.936556069878861e-05, 4.7286572225857526e-05, 3.7781614082632586e-05 ], "bp_grad_norms_F": [ 0.0023510511964559555, 0.0024691869039088488, 0.0025394195690751076, 0.0023858139757066965, 0.0017493697814643383 ], "gamma_dfa": NaN, "acc_eval": 0.5986328125, "loss_eval": 1.1437795162200928, "epoch": 64 }, { "hidden_norms": [ 269.1813659667969, 247.57632446289062, 231.57135009765625, 220.31541442871094, 220.33135986328125 ], "bp_grad_norms_per_sample_med": [ 4.363871266832575e-05, 4.776224886882119e-05, 4.8712514399085194e-05, 4.777491994900629e-05, 3.733497578650713e-05 ], "bp_grad_norms_F": [ 0.0023870510049164295, 0.0025214161723852158, 0.0025991688016802073, 0.0024342697579413652, 0.0017686353530734777 ], "gamma_dfa": NaN, "acc_eval": 0.6123046875, "loss_eval": 1.138253927230835, "epoch": 65 }, { "hidden_norms": [ 268.92877197265625, 245.84384155273438, 230.63307189941406, 220.8726806640625, 219.60350036621094 ], "bp_grad_norms_per_sample_med": [ 4.505042306846008e-05, 4.780786548508331e-05, 5.067480378784239e-05, 4.878537220065482e-05, 3.842872683890164e-05 ], "bp_grad_norms_F": [ 0.00237255753017962, 0.002493572887033224, 0.0025717453099787235, 0.0024270617868751287, 0.0017787005053833127 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1350346803665161, "epoch": 66 }, { "hidden_norms": [ 268.9022521972656, 244.85621643066406, 229.2279510498047, 218.72445678710938, 217.325439453125 ], "bp_grad_norms_per_sample_med": [ 4.515323234954849e-05, 4.8419675295008346e-05, 5.0062186346622184e-05, 4.777919821208343e-05, 3.962183836847544e-05 ], "bp_grad_norms_F": [ 0.0024519655853509903, 0.002586368238553405, 0.00266969739459455, 0.0024983694311231375, 0.001813769806176424 ], "gamma_dfa": NaN, "acc_eval": 0.58984375, "loss_eval": 1.143377661705017, "epoch": 67 }, { "hidden_norms": [ 267.7603454589844, 245.58932495117188, 229.04205322265625, 219.0813446044922, 217.887939453125 ], "bp_grad_norms_per_sample_med": [ 4.398225064505823e-05, 4.6881206799298525e-05, 4.986919157090597e-05, 4.9659283831715584e-05, 3.928233854821883e-05 ], "bp_grad_norms_F": [ 0.0024525129701942205, 0.0025901535991579294, 0.002675000112503767, 0.0025050004478543997, 0.0018165758810937405 ], "gamma_dfa": NaN, "acc_eval": 0.6083984375, "loss_eval": 1.1445319652557373, "epoch": 68 }, { "hidden_norms": [ 267.32110595703125, 244.51095581054688, 228.1964569091797, 217.7543182373047, 215.99093627929688 ], "bp_grad_norms_per_sample_med": [ 4.567872019833885e-05, 4.9028451030608267e-05, 5.0534836191218346e-05, 4.8578112910036e-05, 3.865628605126403e-05 ], "bp_grad_norms_F": [ 0.002467149868607521, 0.0026051453314721584, 0.0026927595026791096, 0.002530105412006378, 0.0018421142594888806 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.143081545829773, "epoch": 69 }, { "hidden_norms": [ 266.6060791015625, 242.973388671875, 227.23739624023438, 216.60504150390625, 213.26922607421875 ], "bp_grad_norms_per_sample_med": [ 4.524671021499671e-05, 4.8752917791716754e-05, 5.0053116865456104e-05, 4.897990220342763e-05, 3.949753590859473e-05 ], "bp_grad_norms_F": [ 0.002536450745537877, 0.002682002494111657, 0.002782325493171811, 0.002600395353510976, 0.0018774428172037005 ], "gamma_dfa": NaN, "acc_eval": 0.607421875, "loss_eval": 1.1569209098815918, "epoch": 70 }, { "hidden_norms": [ 265.7056579589844, 243.6046142578125, 226.88746643066406, 217.55291748046875, 213.99151611328125 ], "bp_grad_norms_per_sample_med": [ 4.667519897338934e-05, 4.9728132580639794e-05, 5.27437987329904e-05, 5.151727600605227e-05, 4.0550570702180266e-05 ], "bp_grad_norms_F": [ 0.002509700832888484, 0.0026521242689341307, 0.0027410376351326704, 0.002574845217168331, 0.001871992484666407 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.1381304264068604, "epoch": 71 }, { "hidden_norms": [ 264.63116455078125, 241.50344848632812, 225.20465087890625, 214.67364501953125, 212.77584838867188 ], "bp_grad_norms_per_sample_med": [ 4.526918928604573e-05, 5.0124705012422055e-05, 5.2680206863442436e-05, 5.1697836170205846e-05, 3.9593822293682024e-05 ], "bp_grad_norms_F": [ 0.0025687876623123884, 0.0027084490284323692, 0.0027945584151893854, 0.0026290949899703264, 0.0018978636944666505 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.149982213973999, "epoch": 72 }, { "hidden_norms": [ 264.168701171875, 241.78074645996094, 224.8336944580078, 214.45762634277344, 212.4181671142578 ], "bp_grad_norms_per_sample_med": [ 4.745498517877422e-05, 5.042303018854e-05, 5.3622185077983886e-05, 5.276402589515783e-05, 4.0586572140455246e-05 ], "bp_grad_norms_F": [ 0.0026231552474200726, 0.002779489615932107, 0.002866284688934684, 0.00268669705837965, 0.0019228557357564569 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.158836007118225, "epoch": 73 }, { "hidden_norms": [ 263.89593505859375, 240.3160858154297, 223.6101531982422, 212.4967803955078, 210.63546752929688 ], "bp_grad_norms_per_sample_med": [ 4.678544428315945e-05, 5.029747626394965e-05, 5.3069161367602646e-05, 5.2157745813019574e-05, 4.0450311644235626e-05 ], "bp_grad_norms_F": [ 0.0026451845187693834, 0.002798875328153372, 0.0028935885056853294, 0.0027081011794507504, 0.001933218096382916 ], "gamma_dfa": NaN, "acc_eval": 0.607421875, "loss_eval": 1.1447510719299316, "epoch": 74 }, { "hidden_norms": [ 262.4220275878906, 239.43899536132812, 223.32151794433594, 212.5982666015625, 209.80105590820312 ], "bp_grad_norms_per_sample_med": [ 4.713214002549648e-05, 5.087011959403753e-05, 5.283053906168789e-05, 5.280825644149445e-05, 4.054068267578259e-05 ], "bp_grad_norms_F": [ 0.002688886132091284, 0.002841175301000476, 0.002931408118456602, 0.0027343749534338713, 0.001953375292941928 ], "gamma_dfa": NaN, "acc_eval": 0.6201171875, "loss_eval": 1.1561517715454102, "epoch": 75 }, { "hidden_norms": [ 262.65814208984375, 240.0749969482422, 223.0806121826172, 212.08688354492188, 209.22561645507812 ], "bp_grad_norms_per_sample_med": [ 4.8153047828236595e-05, 5.145415343577042e-05, 5.4130876378621906e-05, 5.3563955589197576e-05, 4.1630475607234985e-05 ], "bp_grad_norms_F": [ 0.0026582488790154457, 0.0028067713137716055, 0.00290639977902174, 0.0027312941383570433, 0.0019485733937472105 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.1465811729431152, "epoch": 76 }, { "hidden_norms": [ 262.0201721191406, 239.08547973632812, 222.36146545410156, 211.62014770507812, 208.1699676513672 ], "bp_grad_norms_per_sample_med": [ 4.763290053233504e-05, 5.171096199774183e-05, 5.4121221182867885e-05, 5.251873881206848e-05, 4.096185875823721e-05 ], "bp_grad_norms_F": [ 0.0027110630180686712, 0.002856222679838538, 0.002954155672341585, 0.0027671835850924253, 0.001963438233360648 ], "gamma_dfa": NaN, "acc_eval": 0.6142578125, "loss_eval": 1.140420913696289, "epoch": 77 }, { "hidden_norms": [ 261.04132080078125, 238.44912719726562, 221.8912353515625, 210.62893676757812, 207.68223571777344 ], "bp_grad_norms_per_sample_med": [ 4.7598918172298e-05, 5.09894234710373e-05, 5.384815813158639e-05, 5.2337087254272774e-05, 4.065291432198137e-05 ], "bp_grad_norms_F": [ 0.00274560390971601, 0.0029035566840320826, 0.0030046424362808466, 0.0028060651384294033, 0.001984622096642852 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.1556674242019653, "epoch": 78 }, { "hidden_norms": [ 260.81304931640625, 237.52015686035156, 221.12814331054688, 210.04925537109375, 206.80441284179688 ], "bp_grad_norms_per_sample_med": [ 4.8430883907712996e-05, 5.440305176307447e-05, 5.596410119323991e-05, 5.4586391343036667e-05, 4.195213477942161e-05 ], "bp_grad_norms_F": [ 0.002767855068668723, 0.002925564767792821, 0.003015928901731968, 0.002823467366397381, 0.0020000736694782972 ], "gamma_dfa": NaN, "acc_eval": 0.599609375, "loss_eval": 1.155595302581787, "epoch": 79 }, { "hidden_norms": [ 260.0649108886719, 236.74310302734375, 220.48731994628906, 209.0772247314453, 205.55821228027344 ], "bp_grad_norms_per_sample_med": [ 4.8615416744723916e-05, 5.309982589096762e-05, 5.548154513235204e-05, 5.3888015827396885e-05, 4.1955223423428833e-05 ], "bp_grad_norms_F": [ 0.0028222037944942713, 0.0029849831480532885, 0.003080391325056553, 0.0028690374456346035, 0.002019484294578433 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.151352882385254, "epoch": 80 }, { "hidden_norms": [ 259.8204650878906, 236.13253784179688, 219.08865356445312, 207.6793975830078, 205.0387725830078 ], "bp_grad_norms_per_sample_med": [ 4.734982212539762e-05, 5.1937022362835705e-05, 5.472155680763535e-05, 5.394391337176785e-05, 4.0832986996974796e-05 ], "bp_grad_norms_F": [ 0.00282403570599854, 0.0029848285485059023, 0.0030928945634514093, 0.002879998181015253, 0.0020237534772604704 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.153958797454834, "epoch": 81 }, { "hidden_norms": [ 259.70703125, 235.5811767578125, 218.87939453125, 207.87005615234375, 204.21360778808594 ], "bp_grad_norms_per_sample_med": [ 4.972740134689957e-05, 5.442327164928429e-05, 5.538179539144039e-05, 5.4411018936662003e-05, 4.185390207567252e-05 ], "bp_grad_norms_F": [ 0.002822998445481062, 0.00298913661390543, 0.0030840388499200344, 0.0028817548882216215, 0.0020279802847653627 ], "gamma_dfa": NaN, "acc_eval": 0.6201171875, "loss_eval": 1.153503656387329, "epoch": 82 }, { "hidden_norms": [ 258.22747802734375, 235.3745880126953, 218.20066833496094, 206.82144165039062, 203.41139221191406 ], "bp_grad_norms_per_sample_med": [ 5.077639434603043e-05, 5.5536078434670344e-05, 5.664999844157137e-05, 5.608425635728054e-05, 4.293184611015022e-05 ], "bp_grad_norms_F": [ 0.002843277994543314, 0.0030130224768072367, 0.0031098793260753155, 0.00290561281144619, 0.0020425335969775915 ], "gamma_dfa": NaN, "acc_eval": 0.603515625, "loss_eval": 1.1597235202789307, "epoch": 83 }, { "hidden_norms": [ 258.78253173828125, 234.73965454101562, 217.91439819335938, 207.1282958984375, 203.4480743408203 ], "bp_grad_norms_per_sample_med": [ 4.941036968375556e-05, 5.3143365221330896e-05, 5.529402187676169e-05, 5.3718889830634e-05, 4.207601887173951e-05 ], "bp_grad_norms_F": [ 0.0028217420913279057, 0.0029905554838478565, 0.0030917164403945208, 0.002896753139793873, 0.00204362440854311 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1545956134796143, "epoch": 84 }, { "hidden_norms": [ 258.10736083984375, 234.35299682617188, 217.81224060058594, 206.38864135742188, 202.70126342773438 ], "bp_grad_norms_per_sample_med": [ 4.899106716038659e-05, 5.2254512411309406e-05, 5.481128755491227e-05, 5.298088217386976e-05, 4.121303936699405e-05 ], "bp_grad_norms_F": [ 0.002849399344995618, 0.0030259499326348305, 0.0031236386857926846, 0.002921136561781168, 0.0020506957080215216 ], "gamma_dfa": NaN, "acc_eval": 0.615234375, "loss_eval": 1.150564193725586, "epoch": 85 }, { "hidden_norms": [ 258.50750732421875, 234.4120330810547, 217.49217224121094, 205.7490692138672, 202.62380981445312 ], "bp_grad_norms_per_sample_med": [ 4.976892887498252e-05, 5.383255484048277e-05, 5.497025267686695e-05, 5.391201557358727e-05, 4.2558931454550475e-05 ], "bp_grad_norms_F": [ 0.0028686418663710356, 0.003045660676434636, 0.0031442255713045597, 0.002935740165412426, 0.0020568587351590395 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.152902603149414, "epoch": 86 }, { "hidden_norms": [ 258.063720703125, 233.87294006347656, 217.34030151367188, 205.4007110595703, 202.4425506591797 ], "bp_grad_norms_per_sample_med": [ 5.047345257480629e-05, 5.492625859915279e-05, 5.640966628561728e-05, 5.587706982623786e-05, 4.286773400963284e-05 ], "bp_grad_norms_F": [ 0.002875820267945528, 0.003056521760299802, 0.0031533341389149427, 0.002944495528936386, 0.0020668748766183853 ], "gamma_dfa": NaN, "acc_eval": 0.6083984375, "loss_eval": 1.152883529663086, "epoch": 87 }, { "hidden_norms": [ 258.1524353027344, 234.54095458984375, 216.9737548828125, 205.64048767089844, 202.26617431640625 ], "bp_grad_norms_per_sample_med": [ 4.9309845053358003e-05, 5.373455860535614e-05, 5.6388864322798327e-05, 5.448140291264281e-05, 4.2345352994743735e-05 ], "bp_grad_norms_F": [ 0.0028876049909740686, 0.0030658405739814043, 0.0031632501631975174, 0.002954283496364951, 0.0020715948194265366 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.155066967010498, "epoch": 88 }, { "hidden_norms": [ 257.7385559082031, 233.87037658691406, 216.7277069091797, 205.37454223632812, 202.0509033203125 ], "bp_grad_norms_per_sample_med": [ 5.0028131227009e-05, 5.394254549173638e-05, 5.677127046510577e-05, 5.581674486165866e-05, 4.2508807382546365e-05 ], "bp_grad_norms_F": [ 0.0028917219024151564, 0.0030712694860994816, 0.0031723883002996445, 0.0029576809611171484, 0.0020730902906507254 ], "gamma_dfa": NaN, "acc_eval": 0.6083984375, "loss_eval": 1.1531357765197754, "epoch": 89 }, { "hidden_norms": [ 257.52423095703125, 233.51254272460938, 216.73731994628906, 205.52561950683594, 202.19493103027344 ], "bp_grad_norms_per_sample_med": [ 4.9573794967727736e-05, 5.4153944802237675e-05, 5.742486973758787e-05, 5.468217204906978e-05, 4.2126855987589806e-05 ], "bp_grad_norms_F": [ 0.0029005431570112705, 0.0030793119221925735, 0.003179334569722414, 0.0029661250300705433, 0.002075627911835909 ], "gamma_dfa": NaN, "acc_eval": 0.603515625, "loss_eval": 1.155139684677124, "epoch": 90 }, { "hidden_norms": [ 257.5526428222656, 233.24456787109375, 216.63601684570312, 205.40318298339844, 201.8704376220703 ], "bp_grad_norms_per_sample_med": [ 4.996290954295546e-05, 5.331254214979708e-05, 5.576194598688744e-05, 5.50017248315271e-05, 4.1135557694360614e-05 ], "bp_grad_norms_F": [ 0.002902554115280509, 0.003083745948970318, 0.0031855429988354445, 0.0029742431361228228, 0.002079661935567856 ], "gamma_dfa": NaN, "acc_eval": 0.611328125, "loss_eval": 1.15346360206604, "epoch": 91 }, { "hidden_norms": [ 257.3648681640625, 233.42010498046875, 216.6300506591797, 204.97442626953125, 201.4558868408203 ], "bp_grad_norms_per_sample_med": [ 5.06279211549554e-05, 5.411348683992401e-05, 5.6813423725543544e-05, 5.523188519873656e-05, 4.197460293653421e-05 ], "bp_grad_norms_F": [ 0.0029165328014642, 0.003098647342994809, 0.00319958315230906, 0.002985388273373246, 0.002088340697810054 ], "gamma_dfa": NaN, "acc_eval": 0.6015625, "loss_eval": 1.155455470085144, "epoch": 92 }, { "hidden_norms": [ 257.30535888671875, 233.4147491455078, 216.60826110839844, 205.0714874267578, 201.24066162109375 ], "bp_grad_norms_per_sample_med": [ 5.053050699643791e-05, 5.4108801123220474e-05, 5.702309499611147e-05, 5.574637179961428e-05, 4.271106809028424e-05 ], "bp_grad_norms_F": [ 0.002917014993727207, 0.0030978922732174397, 0.0031987964175641537, 0.0029851715080440044, 0.0020893686451017857 ], "gamma_dfa": NaN, "acc_eval": 0.6103515625, "loss_eval": 1.1536216735839844, "epoch": 93 }, { "hidden_norms": [ 257.18878173828125, 232.8798370361328, 216.17039489746094, 204.66229248046875, 201.07859802246094 ], "bp_grad_norms_per_sample_med": [ 5.010717359255068e-05, 5.397907079895958e-05, 5.614722249447368e-05, 5.553716255235486e-05, 4.292877929401584e-05 ], "bp_grad_norms_F": [ 0.0029321948532015085, 0.003115386702120304, 0.0032163059804588556, 0.002997474977746606, 0.002096242969855666 ], "gamma_dfa": NaN, "acc_eval": 0.6123046875, "loss_eval": 1.1570696830749512, "epoch": 94 }, { "hidden_norms": [ 257.0701904296875, 232.91481018066406, 216.06378173828125, 204.648681640625, 201.00148010253906 ], "bp_grad_norms_per_sample_med": [ 4.9896454584086314e-05, 5.386451448430307e-05, 5.5900127335917205e-05, 5.5407243053196e-05, 4.247200922691263e-05 ], "bp_grad_norms_F": [ 0.0029298008885234594, 0.0031122476793825626, 0.0032105366699397564, 0.0029950770549476147, 0.0020956522785127163 ], "gamma_dfa": NaN, "acc_eval": 0.6083984375, "loss_eval": 1.1554739475250244, "epoch": 95 }, { "hidden_norms": [ 257.0519104003906, 232.83355712890625, 216.1780242919922, 204.67999267578125, 201.0236358642578 ], "bp_grad_norms_per_sample_med": [ 5.054255234426819e-05, 5.421326932264492e-05, 5.641246752929874e-05, 5.574019087362103e-05, 4.288824857212603e-05 ], "bp_grad_norms_F": [ 0.0029319566674530506, 0.0031146046239882708, 0.003213704563677311, 0.002997281262651086, 0.0020963428542017937 ], "gamma_dfa": NaN, "acc_eval": 0.607421875, "loss_eval": 1.1545898914337158, "epoch": 96 }, { "hidden_norms": [ 257.1473388671875, 232.85020446777344, 216.2519989013672, 204.68023681640625, 200.93080139160156 ], "bp_grad_norms_per_sample_med": [ 5.0549009756650776e-05, 5.3789182857144624e-05, 5.673874693457037e-05, 5.580837023444474e-05, 4.2498151742620394e-05 ], "bp_grad_norms_F": [ 0.0029327664524316788, 0.0031159960199147463, 0.003215631702914834, 0.002998515497893095, 0.0020966045558452606 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.1546047925949097, "epoch": 97 }, { "hidden_norms": [ 257.09906005859375, 232.74813842773438, 216.1462860107422, 204.6047821044922, 200.89031982421875 ], "bp_grad_norms_per_sample_med": [ 5.086465898784809e-05, 5.3742358431918547e-05, 5.673644773196429e-05, 5.5752621847204864e-05, 4.2624127672752365e-05 ], "bp_grad_norms_F": [ 0.0029341024346649647, 0.003117120126262307, 0.0032170764170587063, 0.0029998423997312784, 0.002097061835229397 ], "gamma_dfa": NaN, "acc_eval": 0.6083984375, "loss_eval": 1.1545934677124023, "epoch": 98 }, { "hidden_norms": [ 257.09326171875, 232.7879638671875, 216.1444091796875, 204.5867919921875, 200.89596557617188 ], "bp_grad_norms_per_sample_med": [ 5.078025787952356e-05, 5.40847031516023e-05, 5.667618097504601e-05, 5.571893780143e-05, 4.271125726518221e-05 ], "bp_grad_norms_F": [ 0.0029357182793319225, 0.0031186225824058056, 0.003218533471226692, 0.0030010156333446503, 0.002097515854984522 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.154747486114502, "epoch": 99 }, { "hidden_norms": [ 257.0869140625, 232.78091430664062, 216.12852478027344, 204.58143615722656, 200.87417602539062 ], "bp_grad_norms_per_sample_med": [ 5.08715384057723e-05, 5.4204192565521225e-05, 5.669457823387347e-05, 5.573080852627754e-05, 4.275495302863419e-05 ], "bp_grad_norms_F": [ 0.002935809548944235, 0.003118706401437521, 0.0032186671160161495, 0.003001126926392317, 0.0020975489169359207 ], "gamma_dfa": NaN, "acc_eval": 0.609375, "loss_eval": 1.1547397375106812, "epoch": 100 } ], "dfa_log": [ { "hidden_norms": [ 8.718070030212402, 8.780964851379395, 8.812002182006836, 8.828720092773438, 8.893179893493652 ], "bp_grad_norms_per_sample_med": [ 0.0010068593546748161, 0.000997236929833889, 0.0009934091940522194, 0.0009870644425973296, 0.0009829498594626784 ], "bp_grad_norms_F": [ 0.03544403985142708, 0.03507080301642418, 0.03477022796869278, 0.03443896397948265, 0.03407429903745651 ], "gamma_dfa": 0.007406219025142491, "acc_eval": 0.115234375, "loss_eval": 2.383650302886963, "epoch": 0 }, { "hidden_norms": [ 802.1658935546875, 3058.3173828125, 4910.8408203125, 6491.31494140625, 7304.1533203125 ], "bp_grad_norms_per_sample_med": [ 2.526000798752648e-06, 1.3625027577290894e-06, 1.3747999219049234e-06, 1.378283172925876e-06, 1.3869492931917193e-06 ], "bp_grad_norms_F": [ 0.00013306058826856315, 7.476000610040501e-05, 7.328101492021233e-05, 7.293069211300462e-05, 7.309897773666307e-05 ], "gamma_dfa": 0.08989996102172881, "acc_eval": 0.310546875, "loss_eval": 1.9283097982406616, "epoch": 1 }, { "hidden_norms": [ 1580.1480712890625, 13320.0517578125, 22793.435546875, 32440.041015625, 37758.640625 ], "bp_grad_norms_per_sample_med": [ 1.1427439403632889e-06, 3.0901847480890865e-07, 3.1107475706448895e-07, 3.1377521736430936e-07, 3.1722706239634135e-07 ], "bp_grad_norms_F": [ 6.523138290503994e-05, 2.3476462956750765e-05, 2.0436000340851024e-05, 1.96047385543352e-05, 1.9654715288197622e-05 ], "gamma_dfa": 0.0858152944711037, "acc_eval": 0.2880859375, "loss_eval": 1.9359606504440308, "epoch": 2 }, { "hidden_norms": [ 2343.090576171875, 32438.32421875, 58119.84375, 87185.09375, 104586.15625 ], "bp_grad_norms_per_sample_med": [ 8.229510513046989e-07, 1.3056541092737461e-07, 1.2754330214193033e-07, 1.2950138739142858e-07, 1.2936459370394005e-07 ], "bp_grad_norms_F": [ 0.0001579313538968563, 2.960947858809959e-05, 1.2371615412121173e-05, 8.468440682918299e-06, 7.067524620651966e-06 ], "gamma_dfa": 0.08629915304481983, "acc_eval": 0.3017578125, "loss_eval": 1.9288904666900635, "epoch": 3 }, { "hidden_norms": [ 3129.4423828125, 62780.5, 117608.9375, 182640.09375, 223504.390625 ], "bp_grad_norms_per_sample_med": [ 6.484323762379063e-07, 7.041825256237644e-08, 6.729855783760286e-08, 6.816127040565334e-08, 6.818439857170233e-08 ], "bp_grad_norms_F": [ 2.9993034331710078e-05, 2.8730657959386008e-06, 2.3409718323819106e-06, 2.367017486903933e-06, 2.3597553990839515e-06 ], "gamma_dfa": 0.08862219587899745, "acc_eval": 0.3076171875, "loss_eval": 1.926429033279419, "epoch": 4 }, { "hidden_norms": [ 3942.00390625, 109015.7890625, 203168.390625, 329067.625, 404167.84375 ], "bp_grad_norms_per_sample_med": [ 5.148021386958135e-07, 4.3746137379230277e-08, 4.211498705330996e-08, 4.271550579915129e-08, 4.2616289164243426e-08 ], "bp_grad_norms_F": [ 2.426102219033055e-05, 1.769960135789006e-06, 1.4341048881760798e-06, 1.45279318530811e-06, 1.44924592859752e-06 ], "gamma_dfa": 0.0876110177487135, "acc_eval": 0.328125, "loss_eval": 1.9219281673431396, "epoch": 5 }, { "hidden_norms": [ 4737.880859375, 173361.203125, 331121.75, 547707.8125, 677363.375 ], "bp_grad_norms_per_sample_med": [ 4.4596529846785415e-07, 2.929639286719521e-08, 2.8080462399771022e-08, 2.8515311001342525e-08, 2.847208158129888e-08 ], "bp_grad_norms_F": [ 2.1308444047463126e-05, 1.213497625940363e-06, 9.622256129659945e-07, 9.734020522955689e-07, 9.715020041767275e-07 ], "gamma_dfa": 0.08417161786928773, "acc_eval": 0.2919921875, "loss_eval": 1.942756175994873, "epoch": 6 }, { "hidden_norms": [ 5535.86865234375, 258337.40625, 501117.59375, 823776.9375, 1026549.875 ], "bp_grad_norms_per_sample_med": [ 3.856409307445574e-07, 2.2078769035260848e-08, 2.0866384176088104e-08, 2.09813144635973e-08, 2.1003458527957264e-08 ], "bp_grad_norms_F": [ 1.847265775722917e-05, 8.849666528476519e-07, 7.187628057181428e-07, 7.262269718921743e-07, 7.249743703141576e-07 ], "gamma_dfa": 0.08587896963581443, "acc_eval": 0.2919921875, "loss_eval": 1.9307396411895752, "epoch": 7 }, { "hidden_norms": [ 6304.064453125, 367445.5625, 717525.125, 1200281.0, 1512872.125 ], "bp_grad_norms_per_sample_med": [ 3.410295903449878e-07, 1.670872862291617e-08, 1.5770844186135946e-08, 1.5891666649281433e-08, 1.588542275499094e-08 ], "bp_grad_norms_F": [ 1.6556636182940565e-05, 6.716044254062581e-07, 5.55544488634041e-07, 5.606318040918268e-07, 5.59783927656099e-07 ], "gamma_dfa": 0.08515941491350532, "acc_eval": 0.306640625, "loss_eval": 1.9279191493988037, "epoch": 8 }, { "hidden_norms": [ 7086.48388671875, 505478.71875, 997925.8125, 1708849.375, 2150479.25 ], "bp_grad_norms_per_sample_med": [ 3.013988703060022e-07, 1.3297809964285534e-08, 1.2481795153007624e-08, 1.262175253202713e-08, 1.2595491760691857e-08 ], "bp_grad_norms_F": [ 1.4646101590187754e-05, 5.195778953748231e-07, 4.4164838186588895e-07, 4.451969459751126e-07, 4.4467057591646153e-07 ], "gamma_dfa": 0.08757842611521482, "acc_eval": 0.318359375, "loss_eval": 1.9144790172576904, "epoch": 9 }, { "hidden_norms": [ 7891.7685546875, 675713.625, 1320934.25, 2319375.25, 2933561.75 ], "bp_grad_norms_per_sample_med": [ 2.7613364750322944e-07, 1.1096022767276281e-08, 1.0442049891423721e-08, 1.0500828651061056e-08, 1.0485931234427426e-08 ], "bp_grad_norms_F": [ 1.3369051885092631e-05, 4.295688142974541e-07, 3.6954631355001766e-07, 3.72132660686475e-07, 3.718281220699282e-07 ], "gamma_dfa": 0.08759273961186409, "acc_eval": 0.3037109375, "loss_eval": 1.928476095199585, "epoch": 10 }, { "hidden_norms": [ 8605.7783203125, 881309.9375, 1719981.25, 3048018.25, 3848896.25 ], "bp_grad_norms_per_sample_med": [ 2.546977952988527e-07, 9.457612470953336e-09, 8.959561981214392e-09, 8.996098976865596e-09, 8.995014511015142e-09 ], "bp_grad_norms_F": [ 1.2278720532776788e-05, 3.6486676435742993e-07, 3.18511354180373e-07, 3.204301890491479e-07, 3.2022188634073245e-07 ], "gamma_dfa": 0.08920952118933201, "acc_eval": 0.3017578125, "loss_eval": 1.9193304777145386, "epoch": 11 }, { "hidden_norms": [ 9378.4287109375, 1120098.75, 2197340.0, 3930402.25, 4945595.0 ], "bp_grad_norms_per_sample_med": [ 2.424853278171213e-07, 8.285154784459792e-09, 7.84627474104127e-09, 7.900293752527432e-09, 7.906582943917329e-09 ], "bp_grad_norms_F": [ 1.1596725016715936e-05, 3.161075028401683e-07, 2.796709850372281e-07, 2.81156104620095e-07, 2.810372734529665e-07 ], "gamma_dfa": 0.09209982817992568, "acc_eval": 0.287109375, "loss_eval": 1.927558422088623, "epoch": 12 }, { "hidden_norms": [ 10124.396484375, 1412441.875, 2752346.75, 5010036.0, 6325289.5 ], "bp_grad_norms_per_sample_med": [ 2.236940588318248e-07, 7.092171738776187e-09, 6.815563668993718e-09, 6.8297678623707725e-09, 6.830232379684276e-09 ], "bp_grad_norms_F": [ 1.0770681910798885e-05, 2.7517026524037647e-07, 2.434409793750092e-07, 2.4456548430862313e-07, 2.445065661049739e-07 ], "gamma_dfa": 0.0919318727683276, "acc_eval": 0.2900390625, "loss_eval": 1.9280297756195068, "epoch": 13 }, { "hidden_norms": [ 10873.9169921875, 1726814.125, 3365165.0, 6225292.5, 7941070.5 ], "bp_grad_norms_per_sample_med": [ 2.0750607632180618e-07, 6.175024491739123e-09, 5.938003866390318e-09, 5.979505779407646e-09, 5.979241990416995e-09 ], "bp_grad_norms_F": [ 9.84854341368191e-06, 2.3993459308258025e-07, 2.1497004354387172e-07, 2.1585482556929492e-07, 2.1582005160780682e-07 ], "gamma_dfa": 0.09486197168007493, "acc_eval": 0.2978515625, "loss_eval": 1.9190003871917725, "epoch": 14 }, { "hidden_norms": [ 11534.0087890625, 2084976.25, 4091674.75, 7667605.5, 9821730.0 ], "bp_grad_norms_per_sample_med": [ 1.9337822720899567e-07, 5.5730837722478554e-09, 5.387873702744628e-09, 5.409793057964407e-09, 5.415522696949893e-09 ], "bp_grad_norms_F": [ 9.290296475228388e-06, 2.1226249202754843e-07, 1.9121620198347955e-07, 1.9190700584204023e-07, 1.9189823774468096e-07 ], "gamma_dfa": 0.09578572702594101, "acc_eval": 0.28515625, "loss_eval": 1.9317920207977295, "epoch": 15 }, { "hidden_norms": [ 12231.0380859375, 2494592.5, 4969235.5, 9387796.0, 12017026.0 ], "bp_grad_norms_per_sample_med": [ 1.7950755193396617e-07, 4.997119606997558e-09, 4.8298063326512874e-09, 4.8657629037052175e-09, 4.859395552614387e-09 ], "bp_grad_norms_F": [ 8.774502930464223e-06, 1.8752842834146577e-07, 1.7071489821773866e-07, 1.7126839679804107e-07, 1.7126781415299774e-07 ], "gamma_dfa": 0.09745451644994318, "acc_eval": 0.2978515625, "loss_eval": 1.927154541015625, "epoch": 16 }, { "hidden_norms": [ 12895.0341796875, 2937750.0, 5861416.5, 11095317.0, 14303387.0 ], "bp_grad_norms_per_sample_med": [ 1.7269709928768862e-07, 4.551929055907067e-09, 4.4097947515808755e-09, 4.41813474694186e-09, 4.416958798714177e-09 ], "bp_grad_norms_F": [ 8.354931196663529e-06, 1.7010511044190935e-07, 1.556661288759642e-07, 1.5612842219070444e-07, 1.5612160098044114e-07 ], "gamma_dfa": 0.09986255329567939, "acc_eval": 0.3115234375, "loss_eval": 1.9158110618591309, "epoch": 17 }, { "hidden_norms": [ 13624.58984375, 3430302.75, 6892795.0, 13179784.0, 16997646.0 ], "bp_grad_norms_per_sample_med": [ 1.642013387481711e-07, 4.094950600830316e-09, 4.012986831725129e-09, 4.022568500516854e-09, 4.023625876925507e-09 ], "bp_grad_norms_F": [ 7.884121259849053e-06, 1.54415545239317e-07, 1.407240830531009e-07, 1.411058434541701e-07, 1.4110656820776057e-07 ], "gamma_dfa": 0.09882167540490627, "acc_eval": 0.296875, "loss_eval": 1.9182151556015015, "epoch": 18 }, { "hidden_norms": [ 14323.6708984375, 3985548.0, 8076905.5, 15465362.0, 20015594.0 ], "bp_grad_norms_per_sample_med": [ 1.551940442823252e-07, 3.79724474086629e-09, 3.6876826037257615e-09, 3.700401984829682e-09, 3.6983835993709135e-09 ], "bp_grad_norms_F": [ 7.607863608427579e-06, 1.393282218487002e-07, 1.283839452526081e-07, 1.2869591614617093e-07, 1.2869809040694236e-07 ], "gamma_dfa": 0.1002046266803518, "acc_eval": 0.294921875, "loss_eval": 1.9388974905014038, "epoch": 19 }, { "hidden_norms": [ 14955.4462890625, 4541631.5, 9327444.0, 17893654.0, 23108114.0 ], "bp_grad_norms_per_sample_med": [ 1.4713883444983367e-07, 3.464018405452407e-09, 3.3744134153579353e-09, 3.379040602879968e-09, 3.381670721225305e-09 ], "bp_grad_norms_F": [ 7.235442353703547e-06, 1.2747574373861426e-07, 1.1753004969250469e-07, 1.1780696951291247e-07, 1.1780796427274254e-07 ], "gamma_dfa": 0.10065551439765841, "acc_eval": 0.30859375, "loss_eval": 1.9343281984329224, "epoch": 20 }, { "hidden_norms": [ 15583.8564453125, 5145675.5, 10628445.0, 20547210.0, 26561584.0 ], "bp_grad_norms_per_sample_med": [ 1.4314694851691456e-07, 3.170894435911009e-09, 3.083378885548882e-09, 3.0910656256821767e-09, 3.0932543193529227e-09 ], "bp_grad_norms_F": [ 6.938716524018673e-06, 1.1743370009753562e-07, 1.0794892091325892e-07, 1.0819184126376058e-07, 1.0819199047773509e-07 ], "gamma_dfa": 0.10184943513013422, "acc_eval": 0.3154296875, "loss_eval": 1.9154099225997925, "epoch": 21 }, { "hidden_norms": [ 16234.9208984375, 5839592.5, 12062968.0, 23496628.0, 30428386.0 ], "bp_grad_norms_per_sample_med": [ 1.379862197836701e-07, 2.91886981251821e-09, 2.8514124394973805e-09, 2.8584146161136914e-09, 2.860225389866855e-09 ], "bp_grad_norms_F": [ 6.72459282213822e-06, 1.0762735769276333e-07, 9.920048427147776e-08, 9.94118352082296e-08, 9.941232548271728e-08 ], "gamma_dfa": 0.1024534439202398, "acc_eval": 0.3095703125, "loss_eval": 1.9225246906280518, "epoch": 22 }, { "hidden_norms": [ 16833.765625, 6566770.0, 13630788.0, 26729236.0, 34665300.0 ], "bp_grad_norms_per_sample_med": [ 1.331996628550769e-07, 2.688527622751735e-09, 2.6381341555747895e-09, 2.6441848710589966e-09, 2.644968466469777e-09 ], "bp_grad_norms_F": [ 6.5681074374879245e-06, 9.902939268613409e-08, 9.131563416531208e-08, 9.149899682370233e-08, 9.149922419737777e-08 ], "gamma_dfa": 0.10199526121141389, "acc_eval": 0.30859375, "loss_eval": 1.9233064651489258, "epoch": 23 }, { "hidden_norms": [ 17456.634765625, 7337101.0, 15401232.0, 30171576.0, 39161244.0 ], "bp_grad_norms_per_sample_med": [ 1.2747005939672817e-07, 2.4809998500074926e-09, 2.4282977850731413e-09, 2.432346990488554e-09, 2.431272960734532e-09 ], "bp_grad_norms_F": [ 6.5036538217100315e-06, 9.14754565428666e-08, 8.484188640522916e-08, 8.500099824004792e-08, 8.500632731056612e-08 ], "gamma_dfa": 0.10456769005395472, "acc_eval": 0.30078125, "loss_eval": 1.9299731254577637, "epoch": 24 }, { "hidden_norms": [ 18049.205078125, 8139419.5, 17132936.0, 33801196.0, 43890588.0 ], "bp_grad_norms_per_sample_med": [ 1.2153788020441425e-07, 2.2737314253618024e-09, 2.2332342641817604e-09, 2.232388940370811e-09, 2.237900753598865e-09 ], "bp_grad_norms_F": [ 6.099615802668268e-06, 8.523231542767462e-08, 7.842250226985925e-08, 7.855853567662052e-08, 7.856372263859157e-08 ], "gamma_dfa": 0.10287670505931601, "acc_eval": 0.3232421875, "loss_eval": 1.923604965209961, "epoch": 25 }, { "hidden_norms": [ 18644.9375, 9035569.0, 19136636.0, 37813052.0, 49194300.0 ], "bp_grad_norms_per_sample_med": [ 1.212478508705317e-07, 2.0938955014315752e-09, 2.0560451119422396e-09, 2.058360148993188e-09, 2.061209425363586e-09 ], "bp_grad_norms_F": [ 5.810702987218974e-06, 7.886949049407121e-08, 7.294480752761956e-08, 7.307144755941408e-08, 7.307325233796291e-08 ], "gamma_dfa": 0.10249267728067935, "acc_eval": 0.3037109375, "loss_eval": 1.9200568199157715, "epoch": 26 }, { "hidden_norms": [ 19280.703125, 9952065.0, 21071430.0, 41963900.0, 54690120.0 ], "bp_grad_norms_per_sample_med": [ 1.1414142875310063e-07, 1.9668882078605066e-09, 1.928355919389446e-09, 1.9296169107008154e-09, 1.929810311551705e-09 ], "bp_grad_norms_F": [ 5.566818344959756e-06, 7.357547104902551e-08, 6.781976935599232e-08, 6.792832607516175e-08, 6.79302942785398e-08 ], "gamma_dfa": 0.10335587273584679, "acc_eval": 0.310546875, "loss_eval": 1.92685067653656, "epoch": 27 }, { "hidden_norms": [ 19887.205078125, 10899353.0, 23080260.0, 46142640.0, 60105148.0 ], "bp_grad_norms_per_sample_med": [ 1.1361055385350483e-07, 1.8462845696731733e-09, 1.815088412904231e-09, 1.8113950339682106e-09, 1.8156832704008252e-09 ], "bp_grad_norms_F": [ 5.398809662437998e-06, 6.89453401037099e-08, 6.4051612014282e-08, 6.414857267600382e-08, 6.415204012455433e-08 ], "gamma_dfa": 0.10455695656128228, "acc_eval": 0.302734375, "loss_eval": 1.923227310180664, "epoch": 28 }, { "hidden_norms": [ 20438.587890625, 11953376.0, 25259200.0, 50259240.0, 65732368.0 ], "bp_grad_norms_per_sample_med": [ 1.1073134231764925e-07, 1.7497674420496878e-09, 1.7245866956727696e-09, 1.7265968654811559e-09, 1.727246901062074e-09 ], "bp_grad_norms_F": [ 5.281461653794395e-06, 6.489771209317041e-08, 6.026093046784808e-08, 6.034837696233808e-08, 6.035197941400838e-08 ], "gamma_dfa": 0.10511547370697372, "acc_eval": 0.326171875, "loss_eval": 1.9300421476364136, "epoch": 29 }, { "hidden_norms": [ 20991.0234375, 13017462.0, 27475572.0, 54971628.0, 71927184.0 ], "bp_grad_norms_per_sample_med": [ 1.0625635837868685e-07, 1.6529324575742521e-09, 1.6255721213553898e-09, 1.6247864165208625e-09, 1.6244732226056158e-09 ], "bp_grad_norms_F": [ 5.098012934467988e-06, 6.077872427567854e-08, 5.674080227890954e-08, 5.681971870785674e-08, 5.6821534144546604e-08 ], "gamma_dfa": 0.10590779440826736, "acc_eval": 0.3017578125, "loss_eval": 1.9211739301681519, "epoch": 30 }, { "hidden_norms": [ 21617.34765625, 14125094.0, 29881326.0, 59926964.0, 78189832.0 ], "bp_grad_norms_per_sample_med": [ 1.0433515029717455e-07, 1.5471924852406005e-09, 1.5234034034250499e-09, 1.5246930384904545e-09, 1.5239296491387222e-09 ], "bp_grad_norms_F": [ 4.977115622750716e-06, 5.780140810429657e-08, 5.362210941939338e-08, 5.3694908075385683e-08, 5.369727773540944e-08 ], "gamma_dfa": 0.10481705865822732, "acc_eval": 0.3212890625, "loss_eval": 1.9209015369415283, "epoch": 31 }, { "hidden_norms": [ 22126.13671875, 15300531.0, 32579362.0, 65167536.0, 85083400.0 ], "bp_grad_norms_per_sample_med": [ 1.0149238249823611e-07, 1.4551810867402537e-09, 1.4291762218121562e-09, 1.432274854273885e-09, 1.4318950469771607e-09 ], "bp_grad_norms_F": [ 4.9215527724300046e-06, 5.434217342781267e-08, 5.088266163966182e-08, 5.094950239481477e-08, 5.0953229191463834e-08 ], "gamma_dfa": 0.10599250381346792, "acc_eval": 0.30859375, "loss_eval": 1.9330241680145264, "epoch": 32 }, { "hidden_norms": [ 22662.396484375, 16481282.0, 35263600.0, 70793304.0, 92166136.0 ], "bp_grad_norms_per_sample_med": [ 9.882934648430819e-08, 1.3810197430075277e-09, 1.3668104426045602e-09, 1.3675354182396404e-09, 1.366150526038723e-09 ], "bp_grad_norms_F": [ 4.6740801735722926e-06, 5.137474090588512e-08, 4.796589792022132e-08, 4.802501862855024e-08, 4.8027377630432966e-08 ], "gamma_dfa": 0.10529429838061333, "acc_eval": 0.3115234375, "loss_eval": 1.9205418825149536, "epoch": 33 }, { "hidden_norms": [ 23192.3125, 17779744.0, 38108720.0, 76522688.0, 99643120.0 ], "bp_grad_norms_per_sample_med": [ 9.530750588737646e-08, 1.3089170858293642e-09, 1.2901538726239892e-09, 1.2906937740808644e-09, 1.2914372904404559e-09 ], "bp_grad_norms_F": [ 4.669429472414777e-06, 4.88593805414439e-08, 4.5740907950175824e-08, 4.579441181817856e-08, 4.5798362435789386e-08 ], "gamma_dfa": 0.1058788642694708, "acc_eval": 0.30078125, "loss_eval": 1.9393997192382812, "epoch": 34 }, { "hidden_norms": [ 23683.251953125, 18992256.0, 40936536.0, 82030200.0, 106929248.0 ], "bp_grad_norms_per_sample_med": [ 9.458356942104729e-08, 1.2407530558533608e-09, 1.2231146095942336e-09, 1.2233244417458877e-09, 1.2247586278490985e-09 ], "bp_grad_norms_F": [ 4.483116299525136e-06, 4.651869289773458e-08, 4.358627236911161e-08, 4.363666050721804e-08, 4.3638891611408326e-08 ], "gamma_dfa": 0.10620562738040462, "acc_eval": 0.3251953125, "loss_eval": 1.9221802949905396, "epoch": 35 }, { "hidden_norms": [ 24223.7265625, 20421224.0, 43883308.0, 87849264.0, 114523200.0 ], "bp_grad_norms_per_sample_med": [ 9.247051480087976e-08, 1.182353992490448e-09, 1.1679496259020539e-09, 1.169668362166476e-09, 1.1697178781133744e-09 ], "bp_grad_norms_F": [ 4.388592969917227e-06, 4.4431864409943955e-08, 4.157495325785021e-08, 4.162143696362364e-08, 4.16235543809762e-08 ], "gamma_dfa": 0.10484841075958684, "acc_eval": 0.2998046875, "loss_eval": 1.9306102991104126, "epoch": 36 }, { "hidden_norms": [ 24732.05078125, 21765008.0, 46887340.0, 93818392.0, 122372552.0 ], "bp_grad_norms_per_sample_med": [ 9.012441637423763e-08, 1.1452657711075176e-09, 1.1280866241136778e-09, 1.1283430856323662e-09, 1.1287816237270931e-09 ], "bp_grad_norms_F": [ 4.297942268749466e-06, 4.29258228962226e-08, 3.9989565436826524e-08, 4.003141995667647e-08, 4.003394948881578e-08 ], "gamma_dfa": 0.10523941312567331, "acc_eval": 0.302734375, "loss_eval": 1.9360214471817017, "epoch": 37 }, { "hidden_norms": [ 25179.26953125, 23094218.0, 50076040.0, 100053064.0, 130605352.0 ], "bp_grad_norms_per_sample_med": [ 8.80345041309738e-08, 1.0831726626747695e-09, 1.0690409668612233e-09, 1.0700328401114234e-09, 1.0692404739387484e-09 ], "bp_grad_norms_F": [ 4.235343567415839e-06, 4.072955306355652e-08, 3.817867622046833e-08, 3.8218924913735464e-08, 3.822109917450689e-08 ], "gamma_dfa": 0.10568258634884842, "acc_eval": 0.3193359375, "loss_eval": 1.927825689315796, "epoch": 38 }, { "hidden_norms": [ 25586.23828125, 24470240.0, 53013036.0, 105981368.0, 138543408.0 ], "bp_grad_norms_per_sample_med": [ 8.783595717432036e-08, 1.0381262516290235e-09, 1.0265919225815878e-09, 1.0273364381419015e-09, 1.0274008310773297e-09 ], "bp_grad_norms_F": [ 4.177269602223532e-06, 3.924894187434802e-08, 3.684685978555535e-08, 3.688498040332888e-08, 3.688741045948518e-08 ], "gamma_dfa": 0.10561428684741259, "acc_eval": 0.302734375, "loss_eval": 1.9321579933166504, "epoch": 39 }, { "hidden_norms": [ 26049.974609375, 25812240.0, 56223324.0, 112200904.0, 146978224.0 ], "bp_grad_norms_per_sample_med": [ 8.555475972116255e-08, 9.982903392824483e-10, 9.87055215340149e-10, 9.8631947054173e-10, 9.876408579856388e-10 ], "bp_grad_norms_F": [ 4.088252808287507e-06, 3.767732792425704e-08, 3.5331073178213046e-08, 3.536514370239274e-08, 3.5367978767908426e-08 ], "gamma_dfa": 0.10579964506905526, "acc_eval": 0.318359375, "loss_eval": 1.930686116218567, "epoch": 40 }, { "hidden_norms": [ 26467.328125, 27200558.0, 59437036.0, 118688848.0, 155514592.0 ], "bp_grad_norms_per_sample_med": [ 8.46039256430231e-08, 9.647596055373242e-10, 9.512606258255119e-10, 9.511659238015113e-10, 9.522146404705722e-10 ], "bp_grad_norms_F": [ 4.015588729089359e-06, 3.636354861669133e-08, 3.413835614196614e-08, 3.417060767674229e-08, 3.417307326003538e-08 ], "gamma_dfa": 0.10565257369307801, "acc_eval": 0.314453125, "loss_eval": 1.9317667484283447, "epoch": 41 }, { "hidden_norms": [ 26919.3671875, 28678974.0, 62716300.0, 125549296.0, 163974208.0 ], "bp_grad_norms_per_sample_med": [ 8.232915860162393e-08, 9.29719468079071e-10, 9.197844152986079e-10, 9.194760508535182e-10, 9.196678418810222e-10 ], "bp_grad_norms_F": [ 3.951602138840826e-06, 3.508949220076829e-08, 3.2971975372220186e-08, 3.3001178678659926e-08, 3.300409190387654e-08 ], "gamma_dfa": 0.10566475696396083, "acc_eval": 0.3056640625, "loss_eval": 1.9284584522247314, "epoch": 42 }, { "hidden_norms": [ 27317.033203125, 30078810.0, 66046968.0, 132107504.0, 172659440.0 ], "bp_grad_norms_per_sample_med": [ 8.130339068657122e-08, 9.03509489447174e-10, 8.925334360476711e-10, 8.917908633776506e-10, 8.925368222278962e-10 ], "bp_grad_norms_F": [ 3.9174719859147444e-06, 3.398368519924588e-08, 3.1965900149089066e-08, 3.199273024279137e-08, 3.199540898890518e-08 ], "gamma_dfa": 0.10646540904417634, "acc_eval": 0.3115234375, "loss_eval": 1.9241154193878174, "epoch": 43 }, { "hidden_norms": [ 27715.529296875, 31383778.0, 69356640.0, 138681856.0, 181338928.0 ], "bp_grad_norms_per_sample_med": [ 8.031172171740764e-08, 8.735605017129444e-10, 8.597746958827202e-10, 8.612066615398817e-10, 8.621173774869817e-10 ], "bp_grad_norms_F": [ 3.837071290035965e-06, 3.286310601424702e-08, 3.101721191001161e-08, 3.104238288642591e-08, 3.104513979224066e-08 ], "gamma_dfa": 0.10568622383289039, "acc_eval": 0.2939453125, "loss_eval": 1.938409447669983, "epoch": 44 }, { "hidden_norms": [ 28149.3203125, 32840858.0, 72848112.0, 145667440.0, 190265088.0 ], "bp_grad_norms_per_sample_med": [ 7.894184506085367e-08, 8.401777051858517e-10, 8.299890774665641e-10, 8.304122944835512e-10, 8.303523979513727e-10 ], "bp_grad_norms_F": [ 3.798121497311513e-06, 3.184389640864538e-08, 3.004597459721481e-08, 3.0069060130699654e-08, 3.007191295978373e-08 ], "gamma_dfa": 0.10558789351489395, "acc_eval": 0.3037109375, "loss_eval": 1.9300565719604492, "epoch": 45 }, { "hidden_norms": [ 28522.55078125, 34358040.0, 76134080.0, 152412848.0, 198973936.0 ], "bp_grad_norms_per_sample_med": [ 7.830858095303483e-08, 8.109956595170331e-10, 8.036356025087343e-10, 8.033995135825478e-10, 8.031720843959533e-10 ], "bp_grad_norms_F": [ 3.7768336369481403e-06, 3.096561229654071e-08, 2.9296373327269976e-08, 2.9317961391939207e-08, 2.9320871064442144e-08 ], "gamma_dfa": 0.10623026502435096, "acc_eval": 0.3115234375, "loss_eval": 1.930029273033142, "epoch": 46 }, { "hidden_norms": [ 28924.912109375, 35808620.0, 79629336.0, 159269824.0, 208087264.0 ], "bp_grad_norms_per_sample_med": [ 7.754207587140627e-08, 7.940589297206202e-10, 7.852188899093449e-10, 7.844204730211857e-10, 7.861447048895798e-10 ], "bp_grad_norms_F": [ 3.695072564369184e-06, 3.0030403053160626e-08, 2.8479737679276695e-08, 2.849986913133762e-08, 2.8502654458861798e-08 ], "gamma_dfa": 0.1059467513114214, "acc_eval": 0.30078125, "loss_eval": 1.9284684658050537, "epoch": 47 }, { "hidden_norms": [ 29289.236328125, 37312204.0, 83049256.0, 165977216.0, 216710016.0 ], "bp_grad_norms_per_sample_med": [ 7.562951509498816e-08, 7.782112176890621e-10, 7.675478586044449e-10, 7.666810519779688e-10, 7.681388303204528e-10 ], "bp_grad_norms_F": [ 3.6269300380809e-06, 2.9297559933638695e-08, 2.782604902051844e-08, 2.7844757610751003e-08, 2.7847393724300673e-08 ], "gamma_dfa": 0.10581977141555399, "acc_eval": 0.3037109375, "loss_eval": 1.9282777309417725, "epoch": 48 }, { "hidden_norms": [ 29638.296875, 38754036.0, 86627536.0, 172893504.0, 225686464.0 ], "bp_grad_norms_per_sample_med": [ 7.50456763398688e-08, 7.526539391733422e-10, 7.443530236628249e-10, 7.439299176681402e-10, 7.444729277494844e-10 ], "bp_grad_norms_F": [ 3.6355218071548734e-06, 2.845291824371543e-08, 2.7127033064289208e-08, 2.714476821097378e-08, 2.7147471826083347e-08 ], "gamma_dfa": 0.1066790189652238, "acc_eval": 0.3056640625, "loss_eval": 1.925389051437378, "epoch": 49 }, { "hidden_norms": [ 29950.615234375, 40150236.0, 90007640.0, 179977856.0, 235206976.0 ], "bp_grad_norms_per_sample_med": [ 7.382724476201474e-08, 7.370593024802474e-10, 7.280710478951846e-10, 7.283330605289962e-10, 7.279294389483937e-10 ], "bp_grad_norms_F": [ 3.5918935736845015e-06, 2.7770946431360244e-08, 2.6450262424759785e-08, 2.6465910352158062e-08, 2.6468752523101102e-08 ], "gamma_dfa": 0.10654840966162737, "acc_eval": 0.3076171875, "loss_eval": 1.929931402206421, "epoch": 50 }, { "hidden_norms": [ 30266.310546875, 41604512.0, 93401064.0, 187075808.0, 244203616.0 ], "bp_grad_norms_per_sample_med": [ 7.343555097349963e-08, 7.144400626657443e-10, 7.057154305378788e-10, 7.05836944447924e-10, 7.073042707084198e-10 ], "bp_grad_norms_F": [ 3.5134323752572527e-06, 2.7063506990998576e-08, 2.580901536930469e-08, 2.582418012764265e-08, 2.582707381293403e-08 ], "gamma_dfa": 0.10640880587743595, "acc_eval": 0.314453125, "loss_eval": 1.9268465042114258, "epoch": 51 }, { "hidden_norms": [ 30588.291015625, 43073320.0, 96898208.0, 193783280.0, 253267328.0 ], "bp_grad_norms_per_sample_med": [ 7.257300893570573e-08, 6.925075513031231e-10, 6.871804236752155e-10, 6.855109813130866e-10, 6.860176871015256e-10 ], "bp_grad_norms_F": [ 3.4990612221008632e-06, 2.652852693074692e-08, 2.5297810068991566e-08, 2.5311907236869047e-08, 2.531497678148753e-08 ], "gamma_dfa": 0.10629434209840838, "acc_eval": 0.3125, "loss_eval": 1.932523488998413, "epoch": 52 }, { "hidden_norms": [ 30898.34765625, 44412940.0, 100019336.0, 199966816.0, 261667760.0 ], "bp_grad_norms_per_sample_med": [ 7.140450719589353e-08, 6.861456958162648e-10, 6.789319106914604e-10, 6.784582895491553e-10, 6.785109696316738e-10 ], "bp_grad_norms_F": [ 3.470987167020212e-06, 2.5969489669819268e-08, 2.478421379237261e-08, 2.479695204726795e-08, 2.4800137055080995e-08 ], "gamma_dfa": 0.1070190458704019, "acc_eval": 0.310546875, "loss_eval": 1.932159662246704, "epoch": 53 }, { "hidden_norms": [ 31188.375, 45820600.0, 103429992.0, 206547120.0, 270181600.0 ], "bp_grad_norms_per_sample_med": [ 7.079076169702603e-08, 6.688025688816879e-10, 6.633480986728557e-10, 6.629659043966285e-10, 6.630911930649575e-10 ], "bp_grad_norms_F": [ 3.4183981370006222e-06, 2.540217280966317e-08, 2.4278467236626966e-08, 2.4290830680229192e-08, 2.429379897250783e-08 ], "gamma_dfa": 0.10550818023330066, "acc_eval": 0.2998046875, "loss_eval": 1.9357173442840576, "epoch": 54 }, { "hidden_norms": [ 31478.2109375, 47178892.0, 107044784.0, 213196560.0, 278895232.0 ], "bp_grad_norms_per_sample_med": [ 7.016877390242371e-08, 6.609012226377331e-10, 6.520708972779232e-10, 6.519841333485488e-10, 6.530669338644657e-10 ], "bp_grad_norms_F": [ 3.405668167033582e-06, 2.4965938649756936e-08, 2.3893584000234114e-08, 2.390493669679472e-08, 2.390810749375305e-08 ], "gamma_dfa": 0.10673638083972037, "acc_eval": 0.294921875, "loss_eval": 1.9359304904937744, "epoch": 55 }, { "hidden_norms": [ 31753.5859375, 48563264.0, 110454832.0, 219550528.0, 287320896.0 ], "bp_grad_norms_per_sample_med": [ 7.007908919831607e-08, 6.483197867446222e-10, 6.408613084651904e-10, 6.410805775125539e-10, 6.409432429244077e-10 ], "bp_grad_norms_F": [ 3.369002797626308e-06, 2.447991498399915e-08, 2.3494733270013057e-08, 2.350535943662635e-08, 2.350850003551841e-08 ], "gamma_dfa": 0.10726616549072787, "acc_eval": 0.3076171875, "loss_eval": 1.9281866550445557, "epoch": 56 }, { "hidden_norms": [ 32002.76953125, 49866268.0, 113724368.0, 225759120.0, 295231328.0 ], "bp_grad_norms_per_sample_med": [ 6.914736161434121e-08, 6.332004365283694e-10, 6.232644400583354e-10, 6.233273341926804e-10, 6.240686856173738e-10 ], "bp_grad_norms_F": [ 3.3845158213807736e-06, 2.415495181651295e-08, 2.3192731291032942e-08, 2.3202973764568924e-08, 2.3206132127029377e-08 ], "gamma_dfa": 0.10715722179156728, "acc_eval": 0.3095703125, "loss_eval": 1.9343407154083252, "epoch": 57 }, { "hidden_norms": [ 32277.291015625, 51206064.0, 116617608.0, 231756352.0, 303064864.0 ], "bp_grad_norms_per_sample_med": [ 6.926612172719615e-08, 6.240719607752965e-10, 6.182420131395361e-10, 6.17405682135086e-10, 6.178215161689593e-10 ], "bp_grad_norms_F": [ 3.317889877507696e-06, 2.3704412654979024e-08, 2.2745311412109004e-08, 2.2754765183208292e-08, 2.2757769002623718e-08 ], "gamma_dfa": 0.10657632350921631, "acc_eval": 0.302734375, "loss_eval": 1.9305057525634766, "epoch": 58 }, { "hidden_norms": [ 32521.890625, 52538716.0, 119605040.0, 237773904.0, 310920672.0 ], "bp_grad_norms_per_sample_med": [ 6.805787933217289e-08, 6.190028489783117e-10, 6.10553496649402e-10, 6.107545580391616e-10, 6.10922701316241e-10 ], "bp_grad_norms_F": [ 3.2823897981870687e-06, 2.3313557306892108e-08, 2.2385792775025948e-08, 2.239448981811165e-08, 2.239757002087117e-08 ], "gamma_dfa": 0.10671919275773689, "acc_eval": 0.302734375, "loss_eval": 1.9269468784332275, "epoch": 59 }, { "hidden_norms": [ 32717.80859375, 53698120.0, 122676120.0, 243745136.0, 318772768.0 ], "bp_grad_norms_per_sample_med": [ 6.75130422678194e-08, 6.033377686343044e-10, 5.948920800413759e-10, 5.949861159315617e-10, 5.951407144877408e-10 ], "bp_grad_norms_F": [ 3.2588357044005534e-06, 2.2926835541170476e-08, 2.205681148836902e-08, 2.206508220581327e-08, 2.2068283200837868e-08 ], "gamma_dfa": 0.10711025857017376, "acc_eval": 0.314453125, "loss_eval": 1.9273767471313477, "epoch": 60 }, { "hidden_norms": [ 32950.74609375, 54885932.0, 125689616.0, 249312240.0, 326217856.0 ], "bp_grad_norms_per_sample_med": [ 6.673791119737871e-08, 5.923626589243725e-10, 5.863842189590684e-10, 5.866296337586618e-10, 5.870876007563197e-10 ], "bp_grad_norms_F": [ 3.2307948458765168e-06, 2.2597017590442192e-08, 2.1738133071380616e-08, 2.1745805156569986e-08, 2.1749071876797643e-08 ], "gamma_dfa": 0.10673619594308548, "acc_eval": 0.31640625, "loss_eval": 1.9271256923675537, "epoch": 61 }, { "hidden_norms": [ 33148.1328125, 55976648.0, 128534072.0, 254655232.0, 333162784.0 ], "bp_grad_norms_per_sample_med": [ 6.663199769718631e-08, 5.852057172184288e-10, 5.787633705622852e-10, 5.792484825128952e-10, 5.793157620281875e-10 ], "bp_grad_norms_F": [ 3.197097157681128e-06, 2.2320827852695402e-08, 2.1484760637235922e-08, 2.149219824332249e-08, 2.1495376145708178e-08 ], "gamma_dfa": 0.10659754439257085, "acc_eval": 0.310546875, "loss_eval": 1.9244905710220337, "epoch": 62 }, { "hidden_norms": [ 33369.18359375, 57164716.0, 131352720.0, 259876736.0, 339964160.0 ], "bp_grad_norms_per_sample_med": [ 6.583201184184873e-08, 5.737598174349046e-10, 5.67273561458137e-10, 5.66656666034504e-10, 5.665773961105458e-10 ], "bp_grad_norms_F": [ 3.2037539767770795e-06, 2.2096731555620863e-08, 2.127841902677119e-08, 2.1285371687440602e-08, 2.1288625973170383e-08 ], "gamma_dfa": 0.10679806087864563, "acc_eval": 0.3154296875, "loss_eval": 1.9308257102966309, "epoch": 63 }, { "hidden_norms": [ 33540.88671875, 58301528.0, 133722112.0, 264798368.0, 346396256.0 ], "bp_grad_norms_per_sample_med": [ 6.606099844930213e-08, 5.686319748399171e-10, 5.629098853709991e-10, 5.619399945366865e-10, 5.626447086015673e-10 ], "bp_grad_norms_F": [ 3.1530219075648347e-06, 2.1766210167584177e-08, 2.0992644067518995e-08, 2.0999330274662498e-08, 2.1002534822400776e-08 ], "gamma_dfa": 0.10647483140928671, "acc_eval": 0.3115234375, "loss_eval": 1.925765037536621, "epoch": 64 }, { "hidden_norms": [ 33728.984375, 59420104.0, 136277376.0, 270265568.0, 353408672.0 ], "bp_grad_norms_per_sample_med": [ 6.57889458466343e-08, 5.627094901150542e-10, 5.575621631059846e-10, 5.567652450189087e-10, 5.571588745922895e-10 ], "bp_grad_norms_F": [ 3.138873807984055e-06, 2.1483266721133987e-08, 2.0736742101234995e-08, 2.0742897177683517e-08, 2.0746110607205992e-08 ], "gamma_dfa": 0.10677585859230021, "acc_eval": 0.3154296875, "loss_eval": 1.9289934635162354, "epoch": 65 }, { "hidden_norms": [ 33919.515625, 60492864.0, 138846208.0, 275456896.0, 359821632.0 ], "bp_grad_norms_per_sample_med": [ 6.451340084367985e-08, 5.607461717183071e-10, 5.556192728128906e-10, 5.553609239150603e-10, 5.557289628477236e-10 ], "bp_grad_norms_F": [ 3.125772991552367e-06, 2.1269308092541905e-08, 2.0518179155715188e-08, 2.052397540808215e-08, 2.0527094690692138e-08 ], "gamma_dfa": 0.10671760967670707, "acc_eval": 0.3125, "loss_eval": 1.9296305179595947, "epoch": 66 }, { "hidden_norms": [ 34098.5, 61508056.0, 141295472.0, 280204000.0, 365860768.0 ], "bp_grad_norms_per_sample_med": [ 6.474934366451635e-08, 5.519530943409734e-10, 5.459506735583375e-10, 5.446967876743258e-10, 5.452004958605983e-10 ], "bp_grad_norms_F": [ 3.1189638320938684e-06, 2.1083655710185667e-08, 2.0349753881987453e-08, 2.0355370722313637e-08, 2.0358520202989894e-08 ], "gamma_dfa": 0.10652847628807649, "acc_eval": 0.3046875, "loss_eval": 1.9298161268234253, "epoch": 67 }, { "hidden_norms": [ 34267.96875, 62529272.0, 143621744.0, 284772064.0, 371754336.0 ], "bp_grad_norms_per_sample_med": [ 6.392743046035321e-08, 5.466314068058864e-10, 5.412825743178473e-10, 5.413390846698007e-10, 5.416116999334974e-10 ], "bp_grad_norms_F": [ 3.0790877190156607e-06, 2.0871810946232472e-08, 2.0159163227617682e-08, 2.0164401703937074e-08, 2.0167590264463797e-08 ], "gamma_dfa": 0.10652959482831648, "acc_eval": 0.298828125, "loss_eval": 1.926388144493103, "epoch": 68 }, { "hidden_norms": [ 34420.42578125, 63473892.0, 145906128.0, 289224256.0, 377581856.0 ], "bp_grad_norms_per_sample_med": [ 6.427427479138714e-08, 5.377295275721394e-10, 5.307561612433176e-10, 5.305922923248829e-10, 5.308011252758149e-10 ], "bp_grad_norms_F": [ 3.096157115578535e-06, 2.067219107004803e-08, 2.0005694878477698e-08, 2.001087118230771e-08, 2.001400645212925e-08 ], "gamma_dfa": 0.10710431921324925, "acc_eval": 0.310546875, "loss_eval": 1.9277684688568115, "epoch": 69 }, { "hidden_norms": [ 34573.87890625, 64328388.0, 148036320.0, 293257856.0, 382751104.0 ], "bp_grad_norms_per_sample_med": [ 6.389419127117435e-08, 5.373848033229933e-10, 5.314943485323909e-10, 5.314927387090052e-10, 5.31539035009132e-10 ], "bp_grad_norms_F": [ 3.072862682529376e-06, 2.049388392322271e-08, 1.98319511923728e-08, 1.9836669196138246e-08, 1.9840014076066836e-08 ], "gamma_dfa": 0.10700461147644091, "acc_eval": 0.3076171875, "loss_eval": 1.9307092428207397, "epoch": 70 }, { "hidden_norms": [ 34690.74609375, 65142160.0, 150006800.0, 297046144.0, 387685792.0 ], "bp_grad_norms_per_sample_med": [ 6.348407310952098e-08, 5.322000062868426e-10, 5.271332259582096e-10, 5.264539360005926e-10, 5.263872671079639e-10 ], "bp_grad_norms_F": [ 3.055365141335642e-06, 2.0346906381973895e-08, 1.9688986441224188e-08, 1.969357477094036e-08, 1.969680063496071e-08 ], "gamma_dfa": 0.10688555391971022, "acc_eval": 0.314453125, "loss_eval": 1.9277830123901367, "epoch": 71 }, { "hidden_norms": [ 34818.79296875, 65891160.0, 151813680.0, 300644832.0, 392342848.0 ], "bp_grad_norms_per_sample_med": [ 6.302482802311715e-08, 5.310150652526602e-10, 5.265936020570905e-10, 5.26124921407245e-10, 5.26482579754628e-10 ], "bp_grad_norms_F": [ 3.027237426067586e-06, 2.0201985861945104e-08, 1.9550000729395833e-08, 1.955433681644081e-08, 1.9557578667672715e-08 ], "gamma_dfa": 0.10652808679151349, "acc_eval": 0.2998046875, "loss_eval": 1.9273805618286133, "epoch": 72 }, { "hidden_norms": [ 34951.515625, 66590476.0, 153730848.0, 304118720.0, 396925408.0 ], "bp_grad_norms_per_sample_med": [ 6.403244157127119e-08, 5.26472032635894e-10, 5.205495479110311e-10, 5.201504782448296e-10, 5.20502474454787e-10 ], "bp_grad_norms_F": [ 3.0631524623458972e-06, 2.0121730059941e-08, 1.9494045488954725e-08, 1.9498189729461046e-08, 1.950143335704979e-08 ], "gamma_dfa": 0.1070192107144976, "acc_eval": 0.3017578125, "loss_eval": 1.934456467628479, "epoch": 73 }, { "hidden_norms": [ 35056.31640625, 67311408.0, 155368816.0, 307494752.0, 401124448.0 ], "bp_grad_norms_per_sample_med": [ 6.303329769252741e-08, 5.209726539057158e-10, 5.160313842900166e-10, 5.156270965755994e-10, 5.161130411934778e-10 ], "bp_grad_norms_F": [ 3.0127189347695094e-06, 1.993531562050066e-08, 1.93110221147208e-08, 1.9314887467203334e-08, 1.9318180832783582e-08 ], "gamma_dfa": 0.10658633662387729, "acc_eval": 0.3076171875, "loss_eval": 1.9260145425796509, "epoch": 74 }, { "hidden_norms": [ 35158.68359375, 67933192.0, 157091536.0, 310654048.0, 405321344.0 ], "bp_grad_norms_per_sample_med": [ 6.339039515523837e-08, 5.170803230036825e-10, 5.107546607874269e-10, 5.104218714357955e-10, 5.108970468903351e-10 ], "bp_grad_norms_F": [ 3.0164017061906634e-06, 1.9819051289005074e-08, 1.921591774589615e-08, 1.921967651696832e-08, 1.9223040936822144e-08 ], "gamma_dfa": 0.10703902837121859, "acc_eval": 0.3095703125, "loss_eval": 1.927987813949585, "epoch": 75 }, { "hidden_norms": [ 35270.68359375, 68510120.0, 158496816.0, 313641408.0, 409130592.0 ], "bp_grad_norms_per_sample_med": [ 6.246813200050383e-08, 5.133981018090594e-10, 5.070178166199923e-10, 5.070903141835004e-10, 5.071925657240683e-10 ], "bp_grad_norms_F": [ 3.004009158757981e-06, 1.970923690919335e-08, 1.910464320076244e-08, 1.9108172821802327e-08, 1.9111526583515115e-08 ], "gamma_dfa": 0.1070477613247931, "acc_eval": 0.3193359375, "loss_eval": 1.9260926246643066, "epoch": 76 }, { "hidden_norms": [ 35364.3125, 69078320.0, 159830400.0, 316294976.0, 412518496.0 ], "bp_grad_norms_per_sample_med": [ 6.217867820623724e-08, 5.12098419225282e-10, 5.052269158589695e-10, 5.058938268298618e-10, 5.053178431246863e-10 ], "bp_grad_norms_F": [ 2.9913805974501884e-06, 1.9599063705300068e-08, 1.900307999846973e-08, 1.9006522578024487e-08, 1.9009846141671005e-08 ], "gamma_dfa": 0.10688473540358245, "acc_eval": 0.3076171875, "loss_eval": 1.926918864250183, "epoch": 77 }, { "hidden_norms": [ 35441.375, 69602704.0, 161117808.0, 318818240.0, 415766208.0 ], "bp_grad_norms_per_sample_med": [ 6.249013040360296e-08, 5.102671063461628e-10, 5.039960671027188e-10, 5.038492956188634e-10, 5.034740402365401e-10 ], "bp_grad_norms_F": [ 2.9863124382245587e-06, 1.9512324200832154e-08, 1.8926254341522508e-08, 1.8929529943534362e-08, 1.8932860612608238e-08 ], "gamma_dfa": 0.10701000291737728, "acc_eval": 0.306640625, "loss_eval": 1.9271972179412842, "epoch": 78 }, { "hidden_norms": [ 35514.78125, 70081152.0, 162190624.0, 321009312.0, 418699392.0 ], "bp_grad_norms_per_sample_med": [ 6.149930698029493e-08, 5.099357047733122e-10, 5.055039165036135e-10, 5.048302331722709e-10, 5.054044960317583e-10 ], "bp_grad_norms_F": [ 2.969128445329261e-06, 1.9427163877594467e-08, 1.883810085701043e-08, 1.884115441441736e-08, 1.884450639977331e-08 ], "gamma_dfa": 0.10680000087450026, "acc_eval": 0.3017578125, "loss_eval": 1.9285144805908203, "epoch": 79 }, { "hidden_norms": [ 35582.9765625, 70499392.0, 163284976.0, 323095264.0, 421363552.0 ], "bp_grad_norms_per_sample_med": [ 6.187113399391819e-08, 5.05410657769545e-10, 4.990756696798826e-10, 4.979930912085706e-10, 4.985904467069702e-10 ], "bp_grad_norms_F": [ 2.9715449727518717e-06, 1.9354965630213883e-08, 1.877567434860339e-08, 1.8778711918798763e-08, 1.8782076338652587e-08 ], "gamma_dfa": 0.10694103027344681, "acc_eval": 0.310546875, "loss_eval": 1.92802095413208, "epoch": 80 }, { "hidden_norms": [ 35639.56640625, 70899536.0, 164253712.0, 324923200.0, 423745824.0 ], "bp_grad_norms_per_sample_med": [ 6.238182237439105e-08, 5.018311322046998e-10, 4.970572842211141e-10, 4.953790155859394e-10, 4.961450694729308e-10 ], "bp_grad_norms_F": [ 2.971921048811055e-06, 1.9296171771543413e-08, 1.872837351868384e-08, 1.8731368456315067e-08, 1.873476662694884e-08 ], "gamma_dfa": 0.10704115682892734, "acc_eval": 0.3076171875, "loss_eval": 1.926428198814392, "epoch": 81 }, { "hidden_norms": [ 35689.78515625, 71256024.0, 165127008.0, 326618208.0, 425949792.0 ], "bp_grad_norms_per_sample_med": [ 6.238117578050151e-08, 4.972192657604069e-10, 4.926972718699574e-10, 4.921834606541609e-10, 4.923969565417963e-10 ], "bp_grad_norms_F": [ 2.9655700473085744e-06, 1.9235280035445612e-08, 1.8671270751724478e-08, 1.8674217727721043e-08, 1.8677596358429582e-08 ], "gamma_dfa": 0.10696214074414456, "acc_eval": 0.3056640625, "loss_eval": 1.924986481666565, "epoch": 82 }, { "hidden_norms": [ 35742.58984375, 71595640.0, 165912336.0, 328130016.0, 427838752.0 ], "bp_grad_norms_per_sample_med": [ 6.213700487478491e-08, 4.983659041002397e-10, 4.936055453264032e-10, 4.941617670617404e-10, 4.939196274200697e-10 ], "bp_grad_norms_F": [ 2.951217993540922e-06, 1.919361736213432e-08, 1.863161003257119e-08, 1.8634468190725784e-08, 1.8637845045077484e-08 ], "gamma_dfa": 0.10690056857129093, "acc_eval": 0.3046875, "loss_eval": 1.9250625371932983, "epoch": 83 }, { "hidden_norms": [ 35784.6640625, 71885704.0, 166691376.0, 329546848.0, 429668704.0 ], "bp_grad_norms_per_sample_med": [ 6.175997668833588e-08, 4.971995593017198e-10, 4.919967211414189e-10, 4.91977791838849e-10, 4.926699603835516e-10 ], "bp_grad_norms_F": [ 2.9550594717875356e-06, 1.9144454910247077e-08, 1.8583381944381472e-08, 1.858614595562358e-08, 1.8589524586332118e-08 ], "gamma_dfa": 0.10689649073174223, "acc_eval": 0.3076171875, "loss_eval": 1.926330327987671, "epoch": 84 }, { "hidden_norms": [ 35822.33984375, 72122744.0, 167344016.0, 330816224.0, 431313312.0 ], "bp_grad_norms_per_sample_med": [ 6.139300978702522e-08, 4.980582613001161e-10, 4.935602482269985e-10, 4.934832542602408e-10, 4.934415098745148e-10 ], "bp_grad_norms_F": [ 2.9577784061984858e-06, 1.9112555094125128e-08, 1.8551357783280764e-08, 1.8553992120473595e-08, 1.8557404501962083e-08 ], "gamma_dfa": 0.10689723303948995, "acc_eval": 0.3056640625, "loss_eval": 1.9307332038879395, "epoch": 85 }, { "hidden_norms": [ 35859.390625, 72358304.0, 167947920.0, 331984992.0, 432823232.0 ], "bp_grad_norms_per_sample_med": [ 6.135296359843778e-08, 4.947317000514317e-10, 4.903184525062443e-10, 4.896648087004962e-10, 4.905649775288623e-10 ], "bp_grad_norms_F": [ 2.9511427328543505e-06, 1.906450464161935e-08, 1.8504644927475056e-08, 1.8507259724742653e-08, 1.8510663224446944e-08 ], "gamma_dfa": 0.10684622721601045, "acc_eval": 0.314453125, "loss_eval": 1.9271869659423828, "epoch": 86 }, { "hidden_norms": [ 35888.20703125, 72553136.0, 168401376.0, 332911328.0, 434057600.0 ], "bp_grad_norms_per_sample_med": [ 6.163116239576993e-08, 4.935953312745767e-10, 4.904400219274407e-10, 4.890517990574494e-10, 4.891231308867816e-10 ], "bp_grad_norms_F": [ 2.9438597266562283e-06, 1.902795432329185e-08, 1.8475304841558682e-08, 1.8477877006262133e-08, 1.848129471682114e-08 ], "gamma_dfa": 0.10682923735294025, "acc_eval": 0.30859375, "loss_eval": 1.9263050556182861, "epoch": 87 }, { "hidden_norms": [ 35914.35546875, 72735848.0, 168823680.0, 333752736.0, 435137376.0 ], "bp_grad_norms_per_sample_med": [ 6.153870657499283e-08, 4.920966967247864e-10, 4.894144534084433e-10, 4.876969939004994e-10, 4.884483928435657e-10 ], "bp_grad_norms_F": [ 2.9408777209027903e-06, 1.8999060102942167e-08, 1.8450597494279464e-08, 1.8453114591920894e-08, 1.84565323024799e-08 ], "gamma_dfa": 0.10694600266288035, "acc_eval": 0.3115234375, "loss_eval": 1.9252078533172607, "epoch": 88 }, { "hidden_norms": [ 35936.5546875, 72887360.0, 169178624.0, 334467840.0, 436061952.0 ], "bp_grad_norms_per_sample_med": [ 6.168602340039797e-08, 4.908231043820876e-10, 4.854965318656923e-10, 4.846267276370497e-10, 4.847209300606892e-10 ], "bp_grad_norms_F": [ 2.945510459539946e-06, 1.8982424521141184e-08, 1.8438125692910035e-08, 1.844062857969675e-08, 1.8444072935608347e-08 ], "gamma_dfa": 0.10697454003093299, "acc_eval": 0.3134765625, "loss_eval": 1.9264906644821167, "epoch": 89 }, { "hidden_norms": [ 35955.3671875, 73005808.0, 169498240.0, 335085920.0, 436862656.0 ], "bp_grad_norms_per_sample_med": [ 6.152810527737529e-08, 4.922047214250824e-10, 4.872572900715966e-10, 4.873856318532432e-10, 4.87353157829773e-10 ], "bp_grad_norms_F": [ 2.9327068205020623e-06, 1.8955052638602865e-08, 1.8409036073308016e-08, 1.8411496327530585e-08, 1.841491403808959e-08 ], "gamma_dfa": 0.10689280136284651, "acc_eval": 0.3095703125, "loss_eval": 1.9255037307739258, "epoch": 90 }, { "hidden_norms": [ 35973.34375, 73111368.0, 169770208.0, 335584768.0, 437507744.0 ], "bp_grad_norms_per_sample_med": [ 6.107820382794671e-08, 4.92519802719471e-10, 4.876242187812352e-10, 4.871342773604681e-10, 4.873002001914983e-10 ], "bp_grad_norms_F": [ 2.9368579816946294e-06, 1.8944499302619988e-08, 1.839602603581625e-08, 1.8398441881117833e-08, 1.8401848933535803e-08 ], "gamma_dfa": 0.10685028225998394, "acc_eval": 0.306640625, "loss_eval": 1.9265596866607666, "epoch": 91 }, { "hidden_norms": [ 35985.046875, 73193336.0, 169984976.0, 335981920.0, 438037376.0 ], "bp_grad_norms_per_sample_med": [ 6.100844984757714e-08, 4.92902163529152e-10, 4.862484304091197e-10, 4.871591463562197e-10, 4.871424374996991e-10 ], "bp_grad_norms_F": [ 2.930574055426405e-06, 1.8926412437281215e-08, 1.8379486377284593e-08, 1.8381888011731462e-08, 1.8385312827717826e-08 ], "gamma_dfa": 0.106783474504482, "acc_eval": 0.30859375, "loss_eval": 1.9269328117370605, "epoch": 92 }, { "hidden_norms": [ 35994.07421875, 73256784.0, 170148048.0, 336300032.0, 438460544.0 ], "bp_grad_norms_per_sample_med": [ 6.113810968599864e-08, 4.918689899824358e-10, 4.860293834063611e-10, 4.857191315821296e-10, 4.859731506101639e-10 ], "bp_grad_norms_F": [ 2.9313273444131482e-06, 1.8918141719836967e-08, 1.8372302790226058e-08, 1.837469731924557e-08, 1.8378123911588773e-08 ], "gamma_dfa": 0.10685011067107553, "acc_eval": 0.3095703125, "loss_eval": 1.9262909889221191, "epoch": 93 }, { "hidden_norms": [ 36002.55078125, 73308792.0, 170289472.0, 336572864.0, 438812896.0 ], "bp_grad_norms_per_sample_med": [ 6.121508988599089e-08, 4.917221074762779e-10, 4.853899504553283e-10, 4.847242052186118e-10, 4.849394219519354e-10 ], "bp_grad_norms_F": [ 2.933722271336592e-06, 1.8911242349872737e-08, 1.8366764109600808e-08, 1.836915508590664e-08, 1.8372583454606684e-08 ], "gamma_dfa": 0.10693995938345324, "acc_eval": 0.3076171875, "loss_eval": 1.9261877536773682, "epoch": 94 }, { "hidden_norms": [ 36008.01953125, 73348264.0, 170386624.0, 336761248.0, 439049248.0 ], "bp_grad_norms_per_sample_med": [ 6.123732987362018e-08, 4.916126949972011e-10, 4.860848945575924e-10, 4.87389184566922e-10, 4.868180303319036e-10 ], "bp_grad_norms_F": [ 2.9306668238859857e-06, 1.8901717524499873e-08, 1.835805107930355e-08, 1.8360427844754668e-08, 1.836385976616839e-08 ], "gamma_dfa": 0.10689331469620811, "acc_eval": 0.30859375, "loss_eval": 1.9260027408599854, "epoch": 95 }, { "hidden_norms": [ 36011.9296875, 73372720.0, 170447072.0, 336878464.0, 439192800.0 ], "bp_grad_norms_per_sample_med": [ 6.115104156378948e-08, 4.911633877391353e-10, 4.862875657707377e-10, 4.868677128122556e-10, 4.867456437906981e-10 ], "bp_grad_norms_F": [ 2.9297382297954755e-06, 1.889710254943111e-08, 1.8353631503487122e-08, 1.835600293986772e-08, 1.8359434861281443e-08 ], "gamma_dfa": 0.1068731502891751, "acc_eval": 0.306640625, "loss_eval": 1.9261021614074707, "epoch": 96 }, { "hidden_norms": [ 36014.109375, 73385416.0, 170481184.0, 336945120.0, 439280128.0 ], "bp_grad_norms_per_sample_med": [ 6.12362214269524e-08, 4.916780316222003e-10, 4.858832225451692e-10, 4.867402036978774e-10, 4.862423241824843e-10 ], "bp_grad_norms_F": [ 2.930293021563557e-06, 1.8895260467388653e-08, 1.8352444897118403e-08, 1.835481810985584e-08, 1.8358248254912723e-08 ], "gamma_dfa": 0.10688256371940952, "acc_eval": 0.3095703125, "loss_eval": 1.926184892654419, "epoch": 97 }, { "hidden_norms": [ 36015.9375, 73396752.0, 170510784.0, 337001056.0, 439352832.0 ], "bp_grad_norms_per_sample_med": [ 6.120947659837839e-08, 4.916590468084792e-10, 4.857179658479538e-10, 4.86417739420375e-10, 4.85919415815772e-10 ], "bp_grad_norms_F": [ 2.930209348050994e-06, 1.889360845552801e-08, 1.835070939648631e-08, 1.8353080832866908e-08, 1.835651275428063e-08 ], "gamma_dfa": 0.10688149025372695, "acc_eval": 0.306640625, "loss_eval": 1.9262256622314453, "epoch": 98 }, { "hidden_norms": [ 36016.734375, 73401888.0, 170523312.0, 337026592.0, 439384864.0 ], "bp_grad_norms_per_sample_med": [ 6.119820028516187e-08, 4.917350415745148e-10, 4.857160784688119e-10, 4.860361002556601e-10, 4.855379431845108e-10 ], "bp_grad_norms_F": [ 2.9303794235602254e-06, 1.8893027586841526e-08, 1.835026353091962e-08, 1.835263319094338e-08, 1.83560651123571e-08 ], "gamma_dfa": 0.10688879482768243, "acc_eval": 0.3076171875, "loss_eval": 1.926223874092102, "epoch": 99 }, { "hidden_norms": [ 36016.7734375, 73401992.0, 170523904.0, 337027392.0, 439386048.0 ], "bp_grad_norms_per_sample_med": [ 6.120198747794348e-08, 4.91758134213427e-10, 4.857037549932386e-10, 4.860785107752008e-10, 4.855802981929003e-10 ], "bp_grad_norms_F": [ 2.9303721476026112e-06, 1.8893056008550957e-08, 1.8350315045267962e-08, 1.8352682928934883e-08, 1.8356114850348604e-08 ], "gamma_dfa": 0.1068887785077095, "acc_eval": 0.3076171875, "loss_eval": 1.926220417022705, "epoch": 100 } ] }