diff options
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_evolution_s42.json')
| -rw-r--r-- | results/snapshot_evolution_v2/snapshot_evolution_s42.json | 5473 |
1 files changed, 5473 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s42.json b/results/snapshot_evolution_v2/snapshot_evolution_s42.json new file mode 100644 index 0000000..fb4a73e --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_evolution_s42.json @@ -0,0 +1,5473 @@ +{ + "config": { + "output_dir": "results/snapshot_evolution_v2", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1 + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": NaN, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 77.06888580322266, + 79.12034606933594, + 82.7389144897461, + 87.31297302246094, + 93.80765533447266 + ], + "bp_grad_norms_per_sample_med": [ + 5.941955532762222e-05, + 5.619435978587717e-05, + 5.499917097040452e-05, + 5.5899512517498806e-05, + 5.7389137509744614e-05 + ], + "bp_grad_norms_F": [ + 0.0026216788683086634, + 0.0023027872666716576, + 0.002111479640007019, + 0.002080164849758148, + 0.0021061261650174856 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3798828125, + "loss_eval": 1.6751981973648071, + "epoch": 1 + }, + { + "hidden_norms": [ + 98.86981201171875, + 98.9476089477539, + 102.55016326904297, + 106.3559341430664, + 112.6939697265625 + ], + "bp_grad_norms_per_sample_med": [ + 4.658113539335318e-05, + 4.402571721584536e-05, + 4.2862800910370424e-05, + 4.381770850159228e-05, + 4.3870313675142825e-05 + ], + "bp_grad_norms_F": [ + 0.00196655560284853, + 0.0018041934818029404, + 0.0016866555670276284, + 0.0016513779992237687, + 0.0016559252981096506 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4541015625, + "loss_eval": 1.5228025913238525, + "epoch": 2 + }, + { + "hidden_norms": [ + 110.40647888183594, + 112.07202911376953, + 114.70049285888672, + 117.17343139648438, + 124.54205322265625 + ], + "bp_grad_norms_per_sample_med": [ + 4.4490061554824933e-05, + 4.3751915654866025e-05, + 4.270448334864341e-05, + 4.182140401098877e-05, + 4.151134271523915e-05 + ], + "bp_grad_norms_F": [ + 0.0019047901732847095, + 0.0017693191766738892, + 0.0016821600729599595, + 0.0016251102788373828, + 0.0015800207620486617 + ], + "gamma_dfa": NaN, + "acc_eval": 0.4697265625, + "loss_eval": 1.4416429996490479, + "epoch": 3 + }, + { + "hidden_norms": [ + 125.09136199951172, + 126.65565490722656, + 128.4573974609375, + 130.39990234375, + 138.1091766357422 + ], + "bp_grad_norms_per_sample_med": [ + 4.1048842831514776e-05, + 4.0168823034036905e-05, + 3.916600326192565e-05, + 3.953508348786272e-05, + 3.938759255106561e-05 + ], + "bp_grad_norms_F": [ + 0.0017511667683720589, + 0.001639657886698842, + 0.0015659942291676998, + 0.0015107291983440518, + 0.0014574137749150395 + ], + "gamma_dfa": NaN, + "acc_eval": 0.50390625, + "loss_eval": 1.3718887567520142, + "epoch": 4 + }, + { + "hidden_norms": [ + 139.76705932617188, + 139.05606079101562, + 139.5422821044922, + 141.0078582763672, + 148.9493865966797 + ], + "bp_grad_norms_per_sample_med": [ + 3.957379158237018e-05, + 4.0101109334500507e-05, + 3.9158370782388374e-05, + 3.927717261831276e-05, + 3.796629243879579e-05 + ], + "bp_grad_norms_F": [ + 0.0017042789841070771, + 0.001630594371818006, + 0.0015700262738391757, + 0.0015037605771794915, + 0.0014294973807409406 + ], + "gamma_dfa": NaN, + "acc_eval": 0.498046875, + "loss_eval": 1.367867112159729, + "epoch": 5 + }, + { + "hidden_norms": [ + 147.73207092285156, + 148.01638793945312, + 148.1798553466797, + 149.07754516601562, + 156.61810302734375 + ], + "bp_grad_norms_per_sample_med": [ + 3.987981835962273e-05, + 3.9670325350016356e-05, + 3.970034231315367e-05, + 3.8273319660220295e-05, + 3.6929654015693814e-05 + ], + "bp_grad_norms_F": [ + 0.0017687880899757147, + 0.001693942816928029, + 0.0016310750506818295, + 0.0015193652361631393, + 0.0014129421906545758 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5234375, + "loss_eval": 1.3461639881134033, + "epoch": 6 + }, + { + "hidden_norms": [ + 159.30731201171875, + 158.4180450439453, + 158.36903381347656, + 158.61819458007812, + 165.9392547607422 + ], + "bp_grad_norms_per_sample_med": [ + 3.744649075088091e-05, + 3.805281448876485e-05, + 3.727989678736776e-05, + 3.5814937291434035e-05, + 3.422912777750753e-05 + ], + "bp_grad_norms_F": [ + 0.0017357978504151106, + 0.0016663926653563976, + 0.0016097063198685646, + 0.0014966910239309072, + 0.001379394088871777 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5283203125, + "loss_eval": 1.3227663040161133, + "epoch": 7 + }, + { + "hidden_norms": [ + 171.02230834960938, + 169.76348876953125, + 168.44949340820312, + 168.26429748535156, + 176.89520263671875 + ], + "bp_grad_norms_per_sample_med": [ + 3.716369246831164e-05, + 3.8349648093571886e-05, + 3.801397542702034e-05, + 3.6082456063013524e-05, + 3.359258334967308e-05 + ], + "bp_grad_norms_F": [ + 0.0016445739893242717, + 0.001604317338205874, + 0.0015634173760190606, + 0.0014586447505280375, + 0.0013399318559095263 + ], + "gamma_dfa": NaN, + "acc_eval": 0.541015625, + "loss_eval": 1.2933616638183594, + "epoch": 8 + }, + { + "hidden_norms": [ + 177.41796875, + 177.29603576660156, + 175.89486694335938, + 175.0777587890625, + 181.38400268554688 + ], + "bp_grad_norms_per_sample_med": [ + 3.602267679525539e-05, + 3.6796918720938265e-05, + 3.648500933195464e-05, + 3.566688246792182e-05, + 3.4070406400132924e-05 + ], + "bp_grad_norms_F": [ + 0.0015903833555057645, + 0.0015696624759584665, + 0.0015270623844116926, + 0.0014402325032278895, + 0.0013178731314837933 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5478515625, + "loss_eval": 1.2806801795959473, + "epoch": 9 + }, + { + "hidden_norms": [ + 187.4056854248047, + 186.72698974609375, + 186.21583557128906, + 185.0518035888672, + 193.2371063232422 + ], + "bp_grad_norms_per_sample_med": [ + 3.3276784961344674e-05, + 3.436602492001839e-05, + 3.432494486332871e-05, + 3.371347702341154e-05, + 3.1834206311032176e-05 + ], + "bp_grad_norms_F": [ + 0.0014970082556828856, + 0.0014613966923207045, + 0.001435543643310666, + 0.001374539453536272, + 0.0012561712646856904 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2740942239761353, + "epoch": 10 + }, + { + "hidden_norms": [ + 194.4965057373047, + 191.25531005859375, + 189.80703735351562, + 188.18850708007812, + 195.7776336669922 + ], + "bp_grad_norms_per_sample_med": [ + 3.298965748399496e-05, + 3.40789083566051e-05, + 3.381206624908373e-05, + 3.3352327591273934e-05, + 3.1442876206710935e-05 + ], + "bp_grad_norms_F": [ + 0.0015152172418311238, + 0.001501554623246193, + 0.0014814225723966956, + 0.001403055852279067, + 0.001272345893085003 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.265188455581665, + "epoch": 11 + }, + { + "hidden_norms": [ + 200.5504913330078, + 197.28366088867188, + 195.27011108398438, + 192.64669799804688, + 200.8507843017578 + ], + "bp_grad_norms_per_sample_med": [ + 3.453825775068253e-05, + 3.5414250305620953e-05, + 3.575523442123085e-05, + 3.455601472523995e-05, + 3.2858857593964785e-05 + ], + "bp_grad_norms_F": [ + 0.001518857548944652, + 0.001502488274127245, + 0.0014838415663689375, + 0.001404650043696165, + 0.0012748484732583165 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5458984375, + "loss_eval": 1.2733395099639893, + "epoch": 12 + }, + { + "hidden_norms": [ + 207.21469116210938, + 202.24969482421875, + 198.8241424560547, + 197.5497283935547, + 207.32147216796875 + ], + "bp_grad_norms_per_sample_med": [ + 3.2123080018209293e-05, + 3.345572258695029e-05, + 3.3888838515849784e-05, + 3.344774086144753e-05, + 3.095310239586979e-05 + ], + "bp_grad_norms_F": [ + 0.0014620382571592927, + 0.0014708929229527712, + 0.0014657732099294662, + 0.0013834136771038175, + 0.0012381445849314332 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2357412576675415, + "epoch": 13 + }, + { + "hidden_norms": [ + 214.6268310546875, + 208.3655242919922, + 205.5032501220703, + 202.8442840576172, + 211.64646911621094 + ], + "bp_grad_norms_per_sample_med": [ + 3.207657573511824e-05, + 3.362155257491395e-05, + 3.38435493176803e-05, + 3.330525942146778e-05, + 3.142434434266761e-05 + ], + "bp_grad_norms_F": [ + 0.0014900992391631007, + 0.0015044353203848004, + 0.001489310641773045, + 0.0014063691487535834, + 0.0012448005145415664 + ], + "gamma_dfa": NaN, + "acc_eval": 0.56640625, + "loss_eval": 1.2451550960540771, + "epoch": 14 + }, + { + "hidden_norms": [ + 220.40109252929688, + 213.53439331054688, + 209.3384552001953, + 206.62062072753906, + 213.82391357421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.227095294278115e-05, + 3.415472019696608e-05, + 3.4918764868052676e-05, + 3.409514465602115e-05, + 3.082074908888899e-05 + ], + "bp_grad_norms_F": [ + 0.0015189005061984062, + 0.001544533297419548, + 0.0015320393722504377, + 0.0014468894805759192, + 0.0012609416153281927 + ], + "gamma_dfa": NaN, + "acc_eval": 0.564453125, + "loss_eval": 1.248854398727417, + "epoch": 15 + }, + { + "hidden_norms": [ + 226.32350158691406, + 219.70506286621094, + 213.84132385253906, + 210.67050170898438, + 219.11776733398438 + ], + "bp_grad_norms_per_sample_med": [ + 3.360298796906136e-05, + 3.4720324038062245e-05, + 3.473780452623032e-05, + 3.412307341932319e-05, + 3.0327399144880474e-05 + ], + "bp_grad_norms_F": [ + 0.0014919604873284698, + 0.0015073713148012757, + 0.001499581034295261, + 0.001411686884239316, + 0.0012323390692472458 + ], + "gamma_dfa": NaN, + "acc_eval": 0.57421875, + "loss_eval": 1.2207037210464478, + "epoch": 16 + }, + { + "hidden_norms": [ + 230.78538513183594, + 223.432373046875, + 216.73037719726562, + 212.86383056640625, + 220.8701171875 + ], + "bp_grad_norms_per_sample_med": [ + 3.253064278396778e-05, + 3.3939610148081556e-05, + 3.490943709039129e-05, + 3.4084565413650125e-05, + 3.0307599445222877e-05 + ], + "bp_grad_norms_F": [ + 0.0015068502398207784, + 0.0015421892749145627, + 0.0015326113207265735, + 0.0014369196724146605, + 0.0012492147507146 + ], + "gamma_dfa": NaN, + "acc_eval": 0.560546875, + "loss_eval": 1.216906189918518, + "epoch": 17 + }, + { + "hidden_norms": [ + 234.5084991455078, + 225.73875427246094, + 219.08822631835938, + 214.42320251464844, + 222.92369079589844 + ], + "bp_grad_norms_per_sample_med": [ + 3.451363227213733e-05, + 3.6047003959538415e-05, + 3.654924512375146e-05, + 3.617065158323385e-05, + 3.275999551988207e-05 + ], + "bp_grad_norms_F": [ + 0.001566705177538097, + 0.0015968933003023267, + 0.0015981856267899275, + 0.0014931216137483716, + 0.0012800253462046385 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5556640625, + "loss_eval": 1.2483153343200684, + "epoch": 18 + }, + { + "hidden_norms": [ + 238.0281219482422, + 229.677734375, + 223.0265350341797, + 217.872314453125, + 225.45947265625 + ], + "bp_grad_norms_per_sample_med": [ + 3.4922632039524615e-05, + 3.6500507121672854e-05, + 3.762893902603537e-05, + 3.615105015342124e-05, + 3.2680742151569575e-05 + ], + "bp_grad_norms_F": [ + 0.0015319561352953315, + 0.001577642629854381, + 0.001574998372234404, + 0.0014754259027540684, + 0.0012637749314308167 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5576171875, + "loss_eval": 1.2469550371170044, + "epoch": 19 + }, + { + "hidden_norms": [ + 241.45298767089844, + 233.28753662109375, + 226.9265899658203, + 222.43453979492188, + 229.83859252929688 + ], + "bp_grad_norms_per_sample_med": [ + 3.368386751390062e-05, + 3.570445187506266e-05, + 3.622082658694126e-05, + 3.5024619137402624e-05, + 3.180970816174522e-05 + ], + "bp_grad_norms_F": [ + 0.0015120706520974636, + 0.0015433274675160646, + 0.0015402185963466763, + 0.0014465245185419917, + 0.001252179266884923 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5634765625, + "loss_eval": 1.2113828659057617, + "epoch": 20 + }, + { + "hidden_norms": [ + 246.53602600097656, + 236.25527954101562, + 231.07940673828125, + 227.7357940673828, + 235.99017333984375 + ], + "bp_grad_norms_per_sample_med": [ + 3.2015348551794887e-05, + 3.388321783859283e-05, + 3.521092003211379e-05, + 3.46749002346769e-05, + 3.079533780692145e-05 + ], + "bp_grad_norms_F": [ + 0.0014757646713405848, + 0.001517578144557774, + 0.0015156606677919626, + 0.00144051609095186, + 0.0012491638772189617 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.2042850255966187, + "epoch": 21 + }, + { + "hidden_norms": [ + 250.74209594726562, + 241.11993408203125, + 232.76829528808594, + 228.410400390625, + 237.100341796875 + ], + "bp_grad_norms_per_sample_med": [ + 3.173810910084285e-05, + 3.328004459035583e-05, + 3.405071402085014e-05, + 3.34872274834197e-05, + 3.07901827909518e-05 + ], + "bp_grad_norms_F": [ + 0.0014801323413848877, + 0.0015176001470535994, + 0.0015198889886960387, + 0.0014302636263892055, + 0.001232756651006639 + ], + "gamma_dfa": NaN, + "acc_eval": 0.587890625, + "loss_eval": 1.1819555759429932, + "epoch": 22 + }, + { + "hidden_norms": [ + 251.96310424804688, + 242.98260498046875, + 235.83056640625, + 229.86978149414062, + 238.271240234375 + ], + "bp_grad_norms_per_sample_med": [ + 3.078249574173242e-05, + 3.301461765659042e-05, + 3.3559550502104685e-05, + 3.2682331948308274e-05, + 2.9418402846204117e-05 + ], + "bp_grad_norms_F": [ + 0.00149905972648412, + 0.0015357647789642215, + 0.0015457755653187633, + 0.0014610268408432603, + 0.0012446421897038817 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5732421875, + "loss_eval": 1.1770297288894653, + "epoch": 23 + }, + { + "hidden_norms": [ + 255.878662109375, + 244.79376220703125, + 236.5006561279297, + 233.29434204101562, + 239.50732421875 + ], + "bp_grad_norms_per_sample_med": [ + 3.191530049662106e-05, + 3.370656486367807e-05, + 3.539594035828486e-05, + 3.486185596557334e-05, + 3.131559424218722e-05 + ], + "bp_grad_norms_F": [ + 0.001507170731201768, + 0.0015490618534386158, + 0.0015714912442490458, + 0.0014840371441096067, + 0.0012607484823092818 + ], + "gamma_dfa": NaN, + "acc_eval": 0.572265625, + "loss_eval": 1.2011631727218628, + "epoch": 24 + }, + { + "hidden_norms": [ + 256.66448974609375, + 244.18772888183594, + 236.46058654785156, + 231.88583374023438, + 238.06246948242188 + ], + "bp_grad_norms_per_sample_med": [ + 3.2962809200398624e-05, + 3.441200897214003e-05, + 3.570063927327283e-05, + 3.488562651909888e-05, + 3.0770879675401375e-05 + ], + "bp_grad_norms_F": [ + 0.0015825299778953195, + 0.0016350955702364445, + 0.0016404123743996024, + 0.0015316286589950323, + 0.0012829666957259178 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5703125, + "loss_eval": 1.192138433456421, + "epoch": 25 + }, + { + "hidden_norms": [ + 259.5942687988281, + 247.43173217773438, + 239.85533142089844, + 233.21835327148438, + 241.53346252441406 + ], + "bp_grad_norms_per_sample_med": [ + 3.1691903132013977e-05, + 3.34988217218779e-05, + 3.45351618307177e-05, + 3.441058288444765e-05, + 3.0752617021789774e-05 + ], + "bp_grad_norms_F": [ + 0.0015797498635947704, + 0.0016322932206094265, + 0.001641901326365769, + 0.0015325341373682022, + 0.0012732355389744043 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5791015625, + "loss_eval": 1.1775751113891602, + "epoch": 26 + }, + { + "hidden_norms": [ + 260.6902770996094, + 249.26528930664062, + 240.86239624023438, + 235.91477966308594, + 242.1553497314453 + ], + "bp_grad_norms_per_sample_med": [ + 3.32598174281884e-05, + 3.471180752967484e-05, + 3.609888517530635e-05, + 3.496996214380488e-05, + 3.091244798270054e-05 + ], + "bp_grad_norms_F": [ + 0.0015408779727295041, + 0.001589508610777557, + 0.0016157848294824362, + 0.0015165223740041256, + 0.0012689991854131222 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5859375, + "loss_eval": 1.1941479444503784, + "epoch": 27 + }, + { + "hidden_norms": [ + 265.0726623535156, + 253.6020050048828, + 244.876953125, + 239.7056427001953, + 248.2157440185547 + ], + "bp_grad_norms_per_sample_med": [ + 3.255613773944788e-05, + 3.457435013842769e-05, + 3.5964570997748524e-05, + 3.529110108502209e-05, + 3.089939127676189e-05 + ], + "bp_grad_norms_F": [ + 0.001513357157818973, + 0.0015594394644722342, + 0.0015772230690345168, + 0.001489063142798841, + 0.0012491336092352867 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5810546875, + "loss_eval": 1.1790356636047363, + "epoch": 28 + }, + { + "hidden_norms": [ + 266.9394836425781, + 253.8067169189453, + 243.13002014160156, + 236.81365966796875, + 245.42434692382812 + ], + "bp_grad_norms_per_sample_med": [ + 3.378500332473777e-05, + 3.5516346542863175e-05, + 3.742165063158609e-05, + 3.6865043512079865e-05, + 3.170729542034678e-05 + ], + "bp_grad_norms_F": [ + 0.0015557212755084038, + 0.0016067115357145667, + 0.001632526982575655, + 0.0015416526002809405, + 0.0012708577560260892 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.1785690784454346, + "epoch": 29 + }, + { + "hidden_norms": [ + 271.3736572265625, + 257.6708984375, + 246.3377685546875, + 240.7875213623047, + 248.55162048339844 + ], + "bp_grad_norms_per_sample_med": [ + 3.2452040613861755e-05, + 3.456772174104117e-05, + 3.550515975803137e-05, + 3.530189496814273e-05, + 3.098960587522015e-05 + ], + "bp_grad_norms_F": [ + 0.0015420741401612759, + 0.0016120158834382892, + 0.0016289768973365426, + 0.0015373170608654618, + 0.0012695658951997757 + ], + "gamma_dfa": NaN, + "acc_eval": 0.57421875, + "loss_eval": 1.1686367988586426, + "epoch": 30 + }, + { + "hidden_norms": [ + 270.6155090332031, + 256.5137634277344, + 246.4404296875, + 238.71493530273438, + 245.14651489257812 + ], + "bp_grad_norms_per_sample_med": [ + 3.4225693525513634e-05, + 3.6208981327945367e-05, + 3.771808042074554e-05, + 3.671547892736271e-05, + 3.175914389430545e-05 + ], + "bp_grad_norms_F": [ + 0.0016278985422104597, + 0.00169221474789083, + 0.0017131771892309189, + 0.0016123101813718677, + 0.001308745937421918 + ], + "gamma_dfa": NaN, + "acc_eval": 0.572265625, + "loss_eval": 1.1706045866012573, + "epoch": 31 + }, + { + "hidden_norms": [ + 271.2703552246094, + 258.5479431152344, + 247.48568725585938, + 241.0449676513672, + 248.61419677734375 + ], + "bp_grad_norms_per_sample_med": [ + 3.370125705259852e-05, + 3.563391510397196e-05, + 3.776583253056742e-05, + 3.622193253249861e-05, + 3.1177536584436893e-05 + ], + "bp_grad_norms_F": [ + 0.001631051884032786, + 0.0016799280419945717, + 0.0016939701745286584, + 0.001596588990651071, + 0.0012989162933081388 + ], + "gamma_dfa": NaN, + "acc_eval": 0.576171875, + "loss_eval": 1.1757416725158691, + "epoch": 32 + }, + { + "hidden_norms": [ + 271.5987854003906, + 257.3157043457031, + 247.04425048828125, + 239.22933959960938, + 247.08534240722656 + ], + "bp_grad_norms_per_sample_med": [ + 3.276485949754715e-05, + 3.4356282412773e-05, + 3.570897752069868e-05, + 3.5391843994148076e-05, + 3.004215977853164e-05 + ], + "bp_grad_norms_F": [ + 0.0015858211554586887, + 0.0016445693327113986, + 0.0016775003168731928, + 0.0015801271656528115, + 0.0012829708866775036 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5947265625, + "loss_eval": 1.1316245794296265, + "epoch": 33 + }, + { + "hidden_norms": [ + 276.85565185546875, + 262.14959716796875, + 248.80125427246094, + 239.6945037841797, + 246.55982971191406 + ], + "bp_grad_norms_per_sample_med": [ + 3.424682654440403e-05, + 3.617212496465072e-05, + 3.731884135049768e-05, + 3.583814759622328e-05, + 3.1317249522544444e-05 + ], + "bp_grad_norms_F": [ + 0.001694253645837307, + 0.0017545269802212715, + 0.0017868074355646968, + 0.0016729168128222227, + 0.0013285611057654023 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.1637687683105469, + "epoch": 34 + }, + { + "hidden_norms": [ + 274.4824523925781, + 260.23223876953125, + 249.41390991210938, + 242.22657775878906, + 248.33303833007812 + ], + "bp_grad_norms_per_sample_med": [ + 3.4118878829758614e-05, + 3.6190944229019806e-05, + 3.7162455555517226e-05, + 3.6398294469108805e-05, + 3.1276995287043974e-05 + ], + "bp_grad_norms_F": [ + 0.0016947221010923386, + 0.0017584856832399964, + 0.0017846780829131603, + 0.0016663862625136971, + 0.0013457784662023187 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5830078125, + "loss_eval": 1.1625440120697021, + "epoch": 35 + }, + { + "hidden_norms": [ + 279.3048095703125, + 263.830810546875, + 250.07839965820312, + 242.9677276611328, + 248.742431640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.378376641194336e-05, + 3.623673183028586e-05, + 3.8036723708501086e-05, + 3.8026879337849095e-05, + 3.20856343023479e-05 + ], + "bp_grad_norms_F": [ + 0.0016582749085500836, + 0.001725532696582377, + 0.0017548021860420704, + 0.0016622358234599233, + 0.0013314742827787995 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58203125, + "loss_eval": 1.1663323640823364, + "epoch": 36 + }, + { + "hidden_norms": [ + 277.88153076171875, + 263.3263244628906, + 254.0471954345703, + 246.00294494628906, + 251.6592559814453 + ], + "bp_grad_norms_per_sample_med": [ + 3.402382935746573e-05, + 3.644815296866e-05, + 3.812061549979262e-05, + 3.8299189327517524e-05, + 3.244871550123207e-05 + ], + "bp_grad_norms_F": [ + 0.0016575837507843971, + 0.001726161572150886, + 0.0017651193775236607, + 0.001658888068050146, + 0.001325216144323349 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5849609375, + "loss_eval": 1.1578618288040161, + "epoch": 37 + }, + { + "hidden_norms": [ + 278.96038818359375, + 264.09832763671875, + 252.11532592773438, + 243.7300567626953, + 250.29537963867188 + ], + "bp_grad_norms_per_sample_med": [ + 3.398891203687526e-05, + 3.60828016710002e-05, + 3.8209349440876395e-05, + 3.6874149373034015e-05, + 3.130899858660996e-05 + ], + "bp_grad_norms_F": [ + 0.0016938851913437247, + 0.0017578925471752882, + 0.0017999019473791122, + 0.0016839306335896254, + 0.0013463495997712016 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1660709381103516, + "epoch": 38 + }, + { + "hidden_norms": [ + 279.11102294921875, + 262.8247375488281, + 250.32635498046875, + 241.73477172851562, + 246.8911590576172 + ], + "bp_grad_norms_per_sample_med": [ + 3.476023630355485e-05, + 3.673156606964767e-05, + 3.8200654671527445e-05, + 3.745179856196046e-05, + 3.111823389190249e-05 + ], + "bp_grad_norms_F": [ + 0.0017367384862154722, + 0.001807119813747704, + 0.0018404393922537565, + 0.0017188042402267456, + 0.0013523433590307832 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.1548914909362793, + "epoch": 39 + }, + { + "hidden_norms": [ + 278.79083251953125, + 263.49237060546875, + 252.0679931640625, + 243.65948486328125, + 249.34564208984375 + ], + "bp_grad_norms_per_sample_med": [ + 3.3709933632053435e-05, + 3.595885937102139e-05, + 3.795271186390892e-05, + 3.70899579138495e-05, + 3.1362116715172306e-05 + ], + "bp_grad_norms_F": [ + 0.0017184949247166514, + 0.0017862631939351559, + 0.0018348938319832087, + 0.0017180118011310697, + 0.0013606568099930882 + ], + "gamma_dfa": NaN, + "acc_eval": 0.591796875, + "loss_eval": 1.159794569015503, + "epoch": 40 + }, + { + "hidden_norms": [ + 281.3595886230469, + 263.4467468261719, + 250.73536682128906, + 243.140380859375, + 247.22425842285156 + ], + "bp_grad_norms_per_sample_med": [ + 3.411353100091219e-05, + 3.656598346424289e-05, + 3.8585232687182724e-05, + 3.752345946850255e-05, + 3.1474613933824e-05 + ], + "bp_grad_norms_F": [ + 0.0017623946769163013, + 0.0018276257906109095, + 0.0018694576574489474, + 0.0017436364432796836, + 0.0013814391568303108 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5888671875, + "loss_eval": 1.153226375579834, + "epoch": 41 + }, + { + "hidden_norms": [ + 279.79888916015625, + 263.5989685058594, + 252.2397918701172, + 243.49703979492188, + 248.86973571777344 + ], + "bp_grad_norms_per_sample_med": [ + 3.528413435560651e-05, + 3.805026790359989e-05, + 4.0152310248231515e-05, + 3.962377377320081e-05, + 3.250985173508525e-05 + ], + "bp_grad_norms_F": [ + 0.0017320383340120316, + 0.0018105976050719619, + 0.001847731531597674, + 0.0017405269900336862, + 0.0013762396993115544 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.1387929916381836, + "epoch": 42 + }, + { + "hidden_norms": [ + 280.80633544921875, + 263.2684326171875, + 251.36338806152344, + 242.25201416015625, + 245.46954345703125 + ], + "bp_grad_norms_per_sample_med": [ + 3.463789835222997e-05, + 3.694587940117344e-05, + 3.909278166247532e-05, + 3.8173999200807884e-05, + 3.152083809254691e-05 + ], + "bp_grad_norms_F": [ + 0.001763346022926271, + 0.0018382675480097532, + 0.0018745084526017308, + 0.0017674838891252875, + 0.0013920797500759363 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1115086078643799, + "epoch": 43 + }, + { + "hidden_norms": [ + 278.4877624511719, + 261.4671630859375, + 247.66079711914062, + 240.21690368652344, + 244.1111602783203 + ], + "bp_grad_norms_per_sample_med": [ + 3.559369361028075e-05, + 3.895946065313183e-05, + 4.048463233630173e-05, + 3.892362292390317e-05, + 3.229418143746443e-05 + ], + "bp_grad_norms_F": [ + 0.0018469772767275572, + 0.0019197544315829873, + 0.001963041489943862, + 0.0018302135867998004, + 0.001429378753527999 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.16768217086792, + "epoch": 44 + }, + { + "hidden_norms": [ + 280.8171691894531, + 263.16705322265625, + 251.45835876464844, + 243.88563537597656, + 246.92945861816406 + ], + "bp_grad_norms_per_sample_med": [ + 3.3486583561170846e-05, + 3.533214839990251e-05, + 3.789112452068366e-05, + 3.651758743217215e-05, + 3.081141403526999e-05 + ], + "bp_grad_norms_F": [ + 0.0017694556154310703, + 0.0018461478175595403, + 0.0018877091351896524, + 0.001781664090231061, + 0.0014001834206283092 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1236202716827393, + "epoch": 45 + }, + { + "hidden_norms": [ + 280.0203552246094, + 261.3996887207031, + 248.5751953125, + 240.40728759765625, + 243.84178161621094 + ], + "bp_grad_norms_per_sample_med": [ + 3.66695094271563e-05, + 3.912827742169611e-05, + 4.0782215364743024e-05, + 3.97856165363919e-05, + 3.258495053160004e-05 + ], + "bp_grad_norms_F": [ + 0.0018954386468976736, + 0.0019765326287597418, + 0.0020179273560643196, + 0.0018787897424772382, + 0.0014408754650503397 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5947265625, + "loss_eval": 1.142503261566162, + "epoch": 46 + }, + { + "hidden_norms": [ + 278.37445068359375, + 260.7147521972656, + 247.63418579101562, + 239.64564514160156, + 241.75396728515625 + ], + "bp_grad_norms_per_sample_med": [ + 3.824803570751101e-05, + 4.062152947881259e-05, + 4.1070070437854156e-05, + 4.01996003347449e-05, + 3.288290827185847e-05 + ], + "bp_grad_norms_F": [ + 0.001872657099738717, + 0.0019627343863248825, + 0.002008425537496805, + 0.0018816223600879312, + 0.001456336583942175 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6064453125, + "loss_eval": 1.137413740158081, + "epoch": 47 + }, + { + "hidden_norms": [ + 281.14813232421875, + 263.6340637207031, + 250.13082885742188, + 242.0965118408203, + 244.81060791015625 + ], + "bp_grad_norms_per_sample_med": [ + 3.531872062012553e-05, + 3.7883237382629886e-05, + 4.0227863792097196e-05, + 3.96844552597031e-05, + 3.296942304586992e-05 + ], + "bp_grad_norms_F": [ + 0.0018434273079037666, + 0.0019304269226267934, + 0.0019746439065784216, + 0.0018603875068947673, + 0.0014465745771303773 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6025390625, + "loss_eval": 1.1396205425262451, + "epoch": 48 + }, + { + "hidden_norms": [ + 281.31280517578125, + 262.5829772949219, + 247.9232940673828, + 239.8461456298828, + 242.20977783203125 + ], + "bp_grad_norms_per_sample_med": [ + 3.71285859728232e-05, + 3.963968629250303e-05, + 4.135111521463841e-05, + 4.0518349123885855e-05, + 3.323471173644066e-05 + ], + "bp_grad_norms_F": [ + 0.00189371092710644, + 0.0019808171782642603, + 0.002019244944676757, + 0.001904282602481544, + 0.0014800610952079296 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1411675214767456, + "epoch": 49 + }, + { + "hidden_norms": [ + 278.64208984375, + 260.1700744628906, + 246.7251434326172, + 239.43145751953125, + 240.350830078125 + ], + "bp_grad_norms_per_sample_med": [ + 3.6054647353012115e-05, + 3.858766285702586e-05, + 4.05439204769209e-05, + 4.046479079988785e-05, + 3.3791853638831526e-05 + ], + "bp_grad_norms_F": [ + 0.0018870895728468895, + 0.00198533502407372, + 0.0020502021070569754, + 0.001929490827023983, + 0.0014933926286175847 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59375, + "loss_eval": 1.1310430765151978, + "epoch": 50 + }, + { + "hidden_norms": [ + 281.7696533203125, + 261.5150451660156, + 247.67295837402344, + 239.7654266357422, + 240.27789306640625 + ], + "bp_grad_norms_per_sample_med": [ + 3.671262675197795e-05, + 3.92102992918808e-05, + 4.1406125092180446e-05, + 4.029196497867815e-05, + 3.32514064211864e-05 + ], + "bp_grad_norms_F": [ + 0.001880357856862247, + 0.001981948269531131, + 0.0020440546795725822, + 0.0019350070506334305, + 0.0014877711655572057 + ], + "gamma_dfa": NaN, + "acc_eval": 0.60546875, + "loss_eval": 1.1188440322875977, + "epoch": 51 + }, + { + "hidden_norms": [ + 279.01318359375, + 259.6091003417969, + 244.6603240966797, + 235.1455535888672, + 237.438232421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.0185608668252826e-05, + 4.309232099330984e-05, + 4.5118234993424267e-05, + 4.371534669189714e-05, + 3.5620210837805644e-05 + ], + "bp_grad_norms_F": [ + 0.0020104716531932354, + 0.002107330597937107, + 0.002167000202462077, + 0.0020260754972696304, + 0.0015411453787237406 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.1525764465332031, + "epoch": 52 + }, + { + "hidden_norms": [ + 278.2245178222656, + 257.14617919921875, + 243.9732666015625, + 234.4013214111328, + 236.68521118164062 + ], + "bp_grad_norms_per_sample_med": [ + 3.85418206860777e-05, + 4.142443503951654e-05, + 4.363177140476182e-05, + 4.2996281990781426e-05, + 3.424972965149209e-05 + ], + "bp_grad_norms_F": [ + 0.0020445864647626877, + 0.002142493613064289, + 0.0022005243226885796, + 0.002054274780675769, + 0.0015541499014943838 + ], + "gamma_dfa": NaN, + "acc_eval": 0.59765625, + "loss_eval": 1.162191390991211, + "epoch": 53 + }, + { + "hidden_norms": [ + 278.7825622558594, + 258.4292297363281, + 243.01690673828125, + 234.15765380859375, + 235.1446533203125 + ], + "bp_grad_norms_per_sample_med": [ + 3.855194881907664e-05, + 4.1293307731393725e-05, + 4.296215047361329e-05, + 4.1900369978975505e-05, + 3.372962964931503e-05 + ], + "bp_grad_norms_F": [ + 0.002041360829025507, + 0.0021457262337207794, + 0.0021996963769197464, + 0.0020641626324504614, + 0.001561368815600872 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6171875, + "loss_eval": 1.130479335784912, + "epoch": 54 + }, + { + "hidden_norms": [ + 275.3794860839844, + 256.83026123046875, + 242.16006469726562, + 231.49655151367188, + 232.30279541015625 + ], + "bp_grad_norms_per_sample_med": [ + 4.011294731753878e-05, + 4.240096313878894e-05, + 4.396942676976323e-05, + 4.347893627709709e-05, + 3.485888009890914e-05 + ], + "bp_grad_norms_F": [ + 0.0021268154960125685, + 0.002230642130598426, + 0.0022892621345818043, + 0.002145433332771063, + 0.0016037407331168652 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6005859375, + "loss_eval": 1.1599653959274292, + "epoch": 55 + }, + { + "hidden_norms": [ + 277.5028076171875, + 257.1715087890625, + 241.6505584716797, + 234.09323120117188, + 233.63377380371094 + ], + "bp_grad_norms_per_sample_med": [ + 3.876453047269024e-05, + 4.156330396654084e-05, + 4.3727923184633255e-05, + 4.2131912778131664e-05, + 3.510245369398035e-05 + ], + "bp_grad_norms_F": [ + 0.002074806485325098, + 0.002173666376620531, + 0.002245684852823615, + 0.0021073734387755394, + 0.0015908328350633383 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.144984245300293, + "epoch": 56 + }, + { + "hidden_norms": [ + 276.0826416015625, + 255.17193603515625, + 239.51519775390625, + 231.28643798828125, + 230.85292053222656 + ], + "bp_grad_norms_per_sample_med": [ + 3.960869798902422e-05, + 4.2907246097456664e-05, + 4.45116929768119e-05, + 4.3612952140392736e-05, + 3.500159073155373e-05 + ], + "bp_grad_norms_F": [ + 0.0021277335472404957, + 0.0022348251659423113, + 0.0022981096990406513, + 0.002155488822609186, + 0.001618923619389534 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.1534931659698486, + "epoch": 57 + }, + { + "hidden_norms": [ + 275.6867370605469, + 254.65744018554688, + 238.1124267578125, + 229.36215209960938, + 227.90867614746094 + ], + "bp_grad_norms_per_sample_med": [ + 3.966662916354835e-05, + 4.33680324931629e-05, + 4.5270633563632146e-05, + 4.528860517893918e-05, + 3.5298704460728914e-05 + ], + "bp_grad_norms_F": [ + 0.002194908680394292, + 0.002305977512151003, + 0.0023776311427354813, + 0.002223761286586523, + 0.001651395345106721 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1494864225387573, + "epoch": 58 + }, + { + "hidden_norms": [ + 274.8414306640625, + 253.18215942382812, + 238.03150939941406, + 228.1765594482422, + 229.46058654785156 + ], + "bp_grad_norms_per_sample_med": [ + 4.132632238906808e-05, + 4.4773249101126567e-05, + 4.6669130824739113e-05, + 4.591346441884525e-05, + 3.6523833841783926e-05 + ], + "bp_grad_norms_F": [ + 0.0022293017245829105, + 0.002341218525543809, + 0.002405093051493168, + 0.0022504546213895082, + 0.0016715668607503176 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5927734375, + "loss_eval": 1.1698435544967651, + "epoch": 59 + }, + { + "hidden_norms": [ + 273.4884338378906, + 251.2228240966797, + 236.2550048828125, + 226.7325439453125, + 225.68386840820312 + ], + "bp_grad_norms_per_sample_med": [ + 4.192883352516219e-05, + 4.3471976823639125e-05, + 4.7195244405884296e-05, + 4.490713035920635e-05, + 3.646116965683177e-05 + ], + "bp_grad_norms_F": [ + 0.0022312228102236986, + 0.002349371323361993, + 0.0024164437782019377, + 0.002271530916914344, + 0.0016918154433369637 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1560128927230835, + "epoch": 60 + }, + { + "hidden_norms": [ + 273.4084777832031, + 250.5165557861328, + 236.19557189941406, + 227.0643768310547, + 226.594970703125 + ], + "bp_grad_norms_per_sample_med": [ + 4.2211744585074484e-05, + 4.488111881073564e-05, + 4.760283627547324e-05, + 4.589638047036715e-05, + 3.658623973024078e-05 + ], + "bp_grad_norms_F": [ + 0.0022313676308840513, + 0.002337696962058544, + 0.0024093035608530045, + 0.002264693146571517, + 0.0016880000475794077 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6044921875, + "loss_eval": 1.1498074531555176, + "epoch": 61 + }, + { + "hidden_norms": [ + 273.1318664550781, + 249.35223388671875, + 234.15737915039062, + 223.48074340820312, + 223.0059356689453 + ], + "bp_grad_norms_per_sample_med": [ + 4.4729218643624336e-05, + 4.768320650327951e-05, + 4.822494520340115e-05, + 4.791786341229454e-05, + 3.7625926779583097e-05 + ], + "bp_grad_norms_F": [ + 0.0023362624924629927, + 0.0024679312482476234, + 0.0025367215275764465, + 0.0023599599953740835, + 0.0017239096341654658 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.1377537250518799, + "epoch": 62 + }, + { + "hidden_norms": [ + 270.9543762207031, + 249.6943817138672, + 234.0796356201172, + 223.80093383789062, + 222.75062561035156 + ], + "bp_grad_norms_per_sample_med": [ + 4.4321575842332095e-05, + 4.7786033974261954e-05, + 4.9388974730391055e-05, + 4.749266372527927e-05, + 3.7502803024835885e-05 + ], + "bp_grad_norms_F": [ + 0.0023458057548850775, + 0.0024719720240682364, + 0.0025427823420614004, + 0.0023789280094206333, + 0.0017488099401816726 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1472076177597046, + "epoch": 63 + }, + { + "hidden_norms": [ + 270.6864318847656, + 249.71315002441406, + 233.9838409423828, + 223.17515563964844, + 222.17759704589844 + ], + "bp_grad_norms_per_sample_med": [ + 4.36245281889569e-05, + 4.725098915514536e-05, + 4.936556069878861e-05, + 4.7286572225857526e-05, + 3.7781614082632586e-05 + ], + "bp_grad_norms_F": [ + 0.0023510511964559555, + 0.0024691869039088488, + 0.0025394195690751076, + 0.0023858139757066965, + 0.0017493697814643383 + ], + "gamma_dfa": NaN, + "acc_eval": 0.5986328125, + "loss_eval": 1.1437795162200928, + "epoch": 64 + }, + { + "hidden_norms": [ + 269.1813659667969, + 247.57632446289062, + 231.57135009765625, + 220.31541442871094, + 220.33135986328125 + ], + "bp_grad_norms_per_sample_med": [ + 4.363871266832575e-05, + 4.776224886882119e-05, + 4.8712514399085194e-05, + 4.777491994900629e-05, + 3.733497578650713e-05 + ], + "bp_grad_norms_F": [ + 0.0023870510049164295, + 0.0025214161723852158, + 0.0025991688016802073, + 0.0024342697579413652, + 0.0017686353530734777 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6123046875, + "loss_eval": 1.138253927230835, + "epoch": 65 + }, + { + "hidden_norms": [ + 268.92877197265625, + 245.84384155273438, + 230.63307189941406, + 220.8726806640625, + 219.60350036621094 + ], + "bp_grad_norms_per_sample_med": [ + 4.505042306846008e-05, + 4.780786548508331e-05, + 5.067480378784239e-05, + 4.878537220065482e-05, + 3.842872683890164e-05 + ], + "bp_grad_norms_F": [ + 0.00237255753017962, + 0.002493572887033224, + 0.0025717453099787235, + 0.0024270617868751287, + 0.0017787005053833127 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1350346803665161, + "epoch": 66 + }, + { + "hidden_norms": [ + 268.9022521972656, + 244.85621643066406, + 229.2279510498047, + 218.72445678710938, + 217.325439453125 + ], + "bp_grad_norms_per_sample_med": [ + 4.515323234954849e-05, + 4.8419675295008346e-05, + 5.0062186346622184e-05, + 4.777919821208343e-05, + 3.962183836847544e-05 + ], + "bp_grad_norms_F": [ + 0.0024519655853509903, + 0.002586368238553405, + 0.00266969739459455, + 0.0024983694311231375, + 0.001813769806176424 + ], + "gamma_dfa": NaN, + "acc_eval": 0.58984375, + "loss_eval": 1.143377661705017, + "epoch": 67 + }, + { + "hidden_norms": [ + 267.7603454589844, + 245.58932495117188, + 229.04205322265625, + 219.0813446044922, + 217.887939453125 + ], + "bp_grad_norms_per_sample_med": [ + 4.398225064505823e-05, + 4.6881206799298525e-05, + 4.986919157090597e-05, + 4.9659283831715584e-05, + 3.928233854821883e-05 + ], + "bp_grad_norms_F": [ + 0.0024525129701942205, + 0.0025901535991579294, + 0.002675000112503767, + 0.0025050004478543997, + 0.0018165758810937405 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1445319652557373, + "epoch": 68 + }, + { + "hidden_norms": [ + 267.32110595703125, + 244.51095581054688, + 228.1964569091797, + 217.7543182373047, + 215.99093627929688 + ], + "bp_grad_norms_per_sample_med": [ + 4.567872019833885e-05, + 4.9028451030608267e-05, + 5.0534836191218346e-05, + 4.8578112910036e-05, + 3.865628605126403e-05 + ], + "bp_grad_norms_F": [ + 0.002467149868607521, + 0.0026051453314721584, + 0.0026927595026791096, + 0.002530105412006378, + 0.0018421142594888806 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.143081545829773, + "epoch": 69 + }, + { + "hidden_norms": [ + 266.6060791015625, + 242.973388671875, + 227.23739624023438, + 216.60504150390625, + 213.26922607421875 + ], + "bp_grad_norms_per_sample_med": [ + 4.524671021499671e-05, + 4.8752917791716754e-05, + 5.0053116865456104e-05, + 4.897990220342763e-05, + 3.949753590859473e-05 + ], + "bp_grad_norms_F": [ + 0.002536450745537877, + 0.002682002494111657, + 0.002782325493171811, + 0.002600395353510976, + 0.0018774428172037005 + ], + "gamma_dfa": NaN, + "acc_eval": 0.607421875, + "loss_eval": 1.1569209098815918, + "epoch": 70 + }, + { + "hidden_norms": [ + 265.7056579589844, + 243.6046142578125, + 226.88746643066406, + 217.55291748046875, + 213.99151611328125 + ], + "bp_grad_norms_per_sample_med": [ + 4.667519897338934e-05, + 4.9728132580639794e-05, + 5.27437987329904e-05, + 5.151727600605227e-05, + 4.0550570702180266e-05 + ], + "bp_grad_norms_F": [ + 0.002509700832888484, + 0.0026521242689341307, + 0.0027410376351326704, + 0.002574845217168331, + 0.001871992484666407 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.1381304264068604, + "epoch": 71 + }, + { + "hidden_norms": [ + 264.63116455078125, + 241.50344848632812, + 225.20465087890625, + 214.67364501953125, + 212.77584838867188 + ], + "bp_grad_norms_per_sample_med": [ + 4.526918928604573e-05, + 5.0124705012422055e-05, + 5.2680206863442436e-05, + 5.1697836170205846e-05, + 3.9593822293682024e-05 + ], + "bp_grad_norms_F": [ + 0.0025687876623123884, + 0.0027084490284323692, + 0.0027945584151893854, + 0.0026290949899703264, + 0.0018978636944666505 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.149982213973999, + "epoch": 72 + }, + { + "hidden_norms": [ + 264.168701171875, + 241.78074645996094, + 224.8336944580078, + 214.45762634277344, + 212.4181671142578 + ], + "bp_grad_norms_per_sample_med": [ + 4.745498517877422e-05, + 5.042303018854e-05, + 5.3622185077983886e-05, + 5.276402589515783e-05, + 4.0586572140455246e-05 + ], + "bp_grad_norms_F": [ + 0.0026231552474200726, + 0.002779489615932107, + 0.002866284688934684, + 0.00268669705837965, + 0.0019228557357564569 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.158836007118225, + "epoch": 73 + }, + { + "hidden_norms": [ + 263.89593505859375, + 240.3160858154297, + 223.6101531982422, + 212.4967803955078, + 210.63546752929688 + ], + "bp_grad_norms_per_sample_med": [ + 4.678544428315945e-05, + 5.029747626394965e-05, + 5.3069161367602646e-05, + 5.2157745813019574e-05, + 4.0450311644235626e-05 + ], + "bp_grad_norms_F": [ + 0.0026451845187693834, + 0.002798875328153372, + 0.0028935885056853294, + 0.0027081011794507504, + 0.001933218096382916 + ], + "gamma_dfa": NaN, + "acc_eval": 0.607421875, + "loss_eval": 1.1447510719299316, + "epoch": 74 + }, + { + "hidden_norms": [ + 262.4220275878906, + 239.43899536132812, + 223.32151794433594, + 212.5982666015625, + 209.80105590820312 + ], + "bp_grad_norms_per_sample_med": [ + 4.713214002549648e-05, + 5.087011959403753e-05, + 5.283053906168789e-05, + 5.280825644149445e-05, + 4.054068267578259e-05 + ], + "bp_grad_norms_F": [ + 0.002688886132091284, + 0.002841175301000476, + 0.002931408118456602, + 0.0027343749534338713, + 0.001953375292941928 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.1561517715454102, + "epoch": 75 + }, + { + "hidden_norms": [ + 262.65814208984375, + 240.0749969482422, + 223.0806121826172, + 212.08688354492188, + 209.22561645507812 + ], + "bp_grad_norms_per_sample_med": [ + 4.8153047828236595e-05, + 5.145415343577042e-05, + 5.4130876378621906e-05, + 5.3563955589197576e-05, + 4.1630475607234985e-05 + ], + "bp_grad_norms_F": [ + 0.0026582488790154457, + 0.0028067713137716055, + 0.00290639977902174, + 0.0027312941383570433, + 0.0019485733937472105 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1465811729431152, + "epoch": 76 + }, + { + "hidden_norms": [ + 262.0201721191406, + 239.08547973632812, + 222.36146545410156, + 211.62014770507812, + 208.1699676513672 + ], + "bp_grad_norms_per_sample_med": [ + 4.763290053233504e-05, + 5.171096199774183e-05, + 5.4121221182867885e-05, + 5.251873881206848e-05, + 4.096185875823721e-05 + ], + "bp_grad_norms_F": [ + 0.0027110630180686712, + 0.002856222679838538, + 0.002954155672341585, + 0.0027671835850924253, + 0.001963438233360648 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6142578125, + "loss_eval": 1.140420913696289, + "epoch": 77 + }, + { + "hidden_norms": [ + 261.04132080078125, + 238.44912719726562, + 221.8912353515625, + 210.62893676757812, + 207.68223571777344 + ], + "bp_grad_norms_per_sample_med": [ + 4.7598918172298e-05, + 5.09894234710373e-05, + 5.384815813158639e-05, + 5.2337087254272774e-05, + 4.065291432198137e-05 + ], + "bp_grad_norms_F": [ + 0.00274560390971601, + 0.0029035566840320826, + 0.0030046424362808466, + 0.0028060651384294033, + 0.001984622096642852 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.1556674242019653, + "epoch": 78 + }, + { + "hidden_norms": [ + 260.81304931640625, + 237.52015686035156, + 221.12814331054688, + 210.04925537109375, + 206.80441284179688 + ], + "bp_grad_norms_per_sample_med": [ + 4.8430883907712996e-05, + 5.440305176307447e-05, + 5.596410119323991e-05, + 5.4586391343036667e-05, + 4.195213477942161e-05 + ], + "bp_grad_norms_F": [ + 0.002767855068668723, + 0.002925564767792821, + 0.003015928901731968, + 0.002823467366397381, + 0.0020000736694782972 + ], + "gamma_dfa": NaN, + "acc_eval": 0.599609375, + "loss_eval": 1.155595302581787, + "epoch": 79 + }, + { + "hidden_norms": [ + 260.0649108886719, + 236.74310302734375, + 220.48731994628906, + 209.0772247314453, + 205.55821228027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.8615416744723916e-05, + 5.309982589096762e-05, + 5.548154513235204e-05, + 5.3888015827396885e-05, + 4.1955223423428833e-05 + ], + "bp_grad_norms_F": [ + 0.0028222037944942713, + 0.0029849831480532885, + 0.003080391325056553, + 0.0028690374456346035, + 0.002019484294578433 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.151352882385254, + "epoch": 80 + }, + { + "hidden_norms": [ + 259.8204650878906, + 236.13253784179688, + 219.08865356445312, + 207.6793975830078, + 205.0387725830078 + ], + "bp_grad_norms_per_sample_med": [ + 4.734982212539762e-05, + 5.1937022362835705e-05, + 5.472155680763535e-05, + 5.394391337176785e-05, + 4.0832986996974796e-05 + ], + "bp_grad_norms_F": [ + 0.00282403570599854, + 0.0029848285485059023, + 0.0030928945634514093, + 0.002879998181015253, + 0.0020237534772604704 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.153958797454834, + "epoch": 81 + }, + { + "hidden_norms": [ + 259.70703125, + 235.5811767578125, + 218.87939453125, + 207.87005615234375, + 204.21360778808594 + ], + "bp_grad_norms_per_sample_med": [ + 4.972740134689957e-05, + 5.442327164928429e-05, + 5.538179539144039e-05, + 5.4411018936662003e-05, + 4.185390207567252e-05 + ], + "bp_grad_norms_F": [ + 0.002822998445481062, + 0.00298913661390543, + 0.0030840388499200344, + 0.0028817548882216215, + 0.0020279802847653627 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6201171875, + "loss_eval": 1.153503656387329, + "epoch": 82 + }, + { + "hidden_norms": [ + 258.22747802734375, + 235.3745880126953, + 218.20066833496094, + 206.82144165039062, + 203.41139221191406 + ], + "bp_grad_norms_per_sample_med": [ + 5.077639434603043e-05, + 5.5536078434670344e-05, + 5.664999844157137e-05, + 5.608425635728054e-05, + 4.293184611015022e-05 + ], + "bp_grad_norms_F": [ + 0.002843277994543314, + 0.0030130224768072367, + 0.0031098793260753155, + 0.00290561281144619, + 0.0020425335969775915 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.1597235202789307, + "epoch": 83 + }, + { + "hidden_norms": [ + 258.78253173828125, + 234.73965454101562, + 217.91439819335938, + 207.1282958984375, + 203.4480743408203 + ], + "bp_grad_norms_per_sample_med": [ + 4.941036968375556e-05, + 5.3143365221330896e-05, + 5.529402187676169e-05, + 5.3718889830634e-05, + 4.207601887173951e-05 + ], + "bp_grad_norms_F": [ + 0.0028217420913279057, + 0.0029905554838478565, + 0.0030917164403945208, + 0.002896753139793873, + 0.00204362440854311 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1545956134796143, + "epoch": 84 + }, + { + "hidden_norms": [ + 258.10736083984375, + 234.35299682617188, + 217.81224060058594, + 206.38864135742188, + 202.70126342773438 + ], + "bp_grad_norms_per_sample_med": [ + 4.899106716038659e-05, + 5.2254512411309406e-05, + 5.481128755491227e-05, + 5.298088217386976e-05, + 4.121303936699405e-05 + ], + "bp_grad_norms_F": [ + 0.002849399344995618, + 0.0030259499326348305, + 0.0031236386857926846, + 0.002921136561781168, + 0.0020506957080215216 + ], + "gamma_dfa": NaN, + "acc_eval": 0.615234375, + "loss_eval": 1.150564193725586, + "epoch": 85 + }, + { + "hidden_norms": [ + 258.50750732421875, + 234.4120330810547, + 217.49217224121094, + 205.7490692138672, + 202.62380981445312 + ], + "bp_grad_norms_per_sample_med": [ + 4.976892887498252e-05, + 5.383255484048277e-05, + 5.497025267686695e-05, + 5.391201557358727e-05, + 4.2558931454550475e-05 + ], + "bp_grad_norms_F": [ + 0.0028686418663710356, + 0.003045660676434636, + 0.0031442255713045597, + 0.002935740165412426, + 0.0020568587351590395 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.152902603149414, + "epoch": 86 + }, + { + "hidden_norms": [ + 258.063720703125, + 233.87294006347656, + 217.34030151367188, + 205.4007110595703, + 202.4425506591797 + ], + "bp_grad_norms_per_sample_med": [ + 5.047345257480629e-05, + 5.492625859915279e-05, + 5.640966628561728e-05, + 5.587706982623786e-05, + 4.286773400963284e-05 + ], + "bp_grad_norms_F": [ + 0.002875820267945528, + 0.003056521760299802, + 0.0031533341389149427, + 0.002944495528936386, + 0.0020668748766183853 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.152883529663086, + "epoch": 87 + }, + { + "hidden_norms": [ + 258.1524353027344, + 234.54095458984375, + 216.9737548828125, + 205.64048767089844, + 202.26617431640625 + ], + "bp_grad_norms_per_sample_med": [ + 4.9309845053358003e-05, + 5.373455860535614e-05, + 5.6388864322798327e-05, + 5.448140291264281e-05, + 4.2345352994743735e-05 + ], + "bp_grad_norms_F": [ + 0.0028876049909740686, + 0.0030658405739814043, + 0.0031632501631975174, + 0.002954283496364951, + 0.0020715948194265366 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.155066967010498, + "epoch": 88 + }, + { + "hidden_norms": [ + 257.7385559082031, + 233.87037658691406, + 216.7277069091797, + 205.37454223632812, + 202.0509033203125 + ], + "bp_grad_norms_per_sample_med": [ + 5.0028131227009e-05, + 5.394254549173638e-05, + 5.677127046510577e-05, + 5.581674486165866e-05, + 4.2508807382546365e-05 + ], + "bp_grad_norms_F": [ + 0.0028917219024151564, + 0.0030712694860994816, + 0.0031723883002996445, + 0.0029576809611171484, + 0.0020730902906507254 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1531357765197754, + "epoch": 89 + }, + { + "hidden_norms": [ + 257.52423095703125, + 233.51254272460938, + 216.73731994628906, + 205.52561950683594, + 202.19493103027344 + ], + "bp_grad_norms_per_sample_med": [ + 4.9573794967727736e-05, + 5.4153944802237675e-05, + 5.742486973758787e-05, + 5.468217204906978e-05, + 4.2126855987589806e-05 + ], + "bp_grad_norms_F": [ + 0.0029005431570112705, + 0.0030793119221925735, + 0.003179334569722414, + 0.0029661250300705433, + 0.002075627911835909 + ], + "gamma_dfa": NaN, + "acc_eval": 0.603515625, + "loss_eval": 1.155139684677124, + "epoch": 90 + }, + { + "hidden_norms": [ + 257.5526428222656, + 233.24456787109375, + 216.63601684570312, + 205.40318298339844, + 201.8704376220703 + ], + "bp_grad_norms_per_sample_med": [ + 4.996290954295546e-05, + 5.331254214979708e-05, + 5.576194598688744e-05, + 5.50017248315271e-05, + 4.1135557694360614e-05 + ], + "bp_grad_norms_F": [ + 0.002902554115280509, + 0.003083745948970318, + 0.0031855429988354445, + 0.0029742431361228228, + 0.002079661935567856 + ], + "gamma_dfa": NaN, + "acc_eval": 0.611328125, + "loss_eval": 1.15346360206604, + "epoch": 91 + }, + { + "hidden_norms": [ + 257.3648681640625, + 233.42010498046875, + 216.6300506591797, + 204.97442626953125, + 201.4558868408203 + ], + "bp_grad_norms_per_sample_med": [ + 5.06279211549554e-05, + 5.411348683992401e-05, + 5.6813423725543544e-05, + 5.523188519873656e-05, + 4.197460293653421e-05 + ], + "bp_grad_norms_F": [ + 0.0029165328014642, + 0.003098647342994809, + 0.00319958315230906, + 0.002985388273373246, + 0.002088340697810054 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6015625, + "loss_eval": 1.155455470085144, + "epoch": 92 + }, + { + "hidden_norms": [ + 257.30535888671875, + 233.4147491455078, + 216.60826110839844, + 205.0714874267578, + 201.24066162109375 + ], + "bp_grad_norms_per_sample_med": [ + 5.053050699643791e-05, + 5.4108801123220474e-05, + 5.702309499611147e-05, + 5.574637179961428e-05, + 4.271106809028424e-05 + ], + "bp_grad_norms_F": [ + 0.002917014993727207, + 0.0030978922732174397, + 0.0031987964175641537, + 0.0029851715080440044, + 0.0020893686451017857 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6103515625, + "loss_eval": 1.1536216735839844, + "epoch": 93 + }, + { + "hidden_norms": [ + 257.18878173828125, + 232.8798370361328, + 216.17039489746094, + 204.66229248046875, + 201.07859802246094 + ], + "bp_grad_norms_per_sample_med": [ + 5.010717359255068e-05, + 5.397907079895958e-05, + 5.614722249447368e-05, + 5.553716255235486e-05, + 4.292877929401584e-05 + ], + "bp_grad_norms_F": [ + 0.0029321948532015085, + 0.003115386702120304, + 0.0032163059804588556, + 0.002997474977746606, + 0.002096242969855666 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6123046875, + "loss_eval": 1.1570696830749512, + "epoch": 94 + }, + { + "hidden_norms": [ + 257.0701904296875, + 232.91481018066406, + 216.06378173828125, + 204.648681640625, + 201.00148010253906 + ], + "bp_grad_norms_per_sample_med": [ + 4.9896454584086314e-05, + 5.386451448430307e-05, + 5.5900127335917205e-05, + 5.5407243053196e-05, + 4.247200922691263e-05 + ], + "bp_grad_norms_F": [ + 0.0029298008885234594, + 0.0031122476793825626, + 0.0032105366699397564, + 0.0029950770549476147, + 0.0020956522785127163 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1554739475250244, + "epoch": 95 + }, + { + "hidden_norms": [ + 257.0519104003906, + 232.83355712890625, + 216.1780242919922, + 204.67999267578125, + 201.0236358642578 + ], + "bp_grad_norms_per_sample_med": [ + 5.054255234426819e-05, + 5.421326932264492e-05, + 5.641246752929874e-05, + 5.574019087362103e-05, + 4.288824857212603e-05 + ], + "bp_grad_norms_F": [ + 0.0029319566674530506, + 0.0031146046239882708, + 0.003213704563677311, + 0.002997281262651086, + 0.0020963428542017937 + ], + "gamma_dfa": NaN, + "acc_eval": 0.607421875, + "loss_eval": 1.1545898914337158, + "epoch": 96 + }, + { + "hidden_norms": [ + 257.1473388671875, + 232.85020446777344, + 216.2519989013672, + 204.68023681640625, + 200.93080139160156 + ], + "bp_grad_norms_per_sample_med": [ + 5.0549009756650776e-05, + 5.3789182857144624e-05, + 5.673874693457037e-05, + 5.580837023444474e-05, + 4.2498151742620394e-05 + ], + "bp_grad_norms_F": [ + 0.0029327664524316788, + 0.0031159960199147463, + 0.003215631702914834, + 0.002998515497893095, + 0.0020966045558452606 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1546047925949097, + "epoch": 97 + }, + { + "hidden_norms": [ + 257.09906005859375, + 232.74813842773438, + 216.1462860107422, + 204.6047821044922, + 200.89031982421875 + ], + "bp_grad_norms_per_sample_med": [ + 5.086465898784809e-05, + 5.3742358431918547e-05, + 5.673644773196429e-05, + 5.5752621847204864e-05, + 4.2624127672752365e-05 + ], + "bp_grad_norms_F": [ + 0.0029341024346649647, + 0.003117120126262307, + 0.0032170764170587063, + 0.0029998423997312784, + 0.002097061835229397 + ], + "gamma_dfa": NaN, + "acc_eval": 0.6083984375, + "loss_eval": 1.1545934677124023, + "epoch": 98 + }, + { + "hidden_norms": [ + 257.09326171875, + 232.7879638671875, + 216.1444091796875, + 204.5867919921875, + 200.89596557617188 + ], + "bp_grad_norms_per_sample_med": [ + 5.078025787952356e-05, + 5.40847031516023e-05, + 5.667618097504601e-05, + 5.571893780143e-05, + 4.271125726518221e-05 + ], + "bp_grad_norms_F": [ + 0.0029357182793319225, + 0.0031186225824058056, + 0.003218533471226692, + 0.0030010156333446503, + 0.002097515854984522 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.154747486114502, + "epoch": 99 + }, + { + "hidden_norms": [ + 257.0869140625, + 232.78091430664062, + 216.12852478027344, + 204.58143615722656, + 200.87417602539062 + ], + "bp_grad_norms_per_sample_med": [ + 5.08715384057723e-05, + 5.4204192565521225e-05, + 5.669457823387347e-05, + 5.573080852627754e-05, + 4.275495302863419e-05 + ], + "bp_grad_norms_F": [ + 0.002935809548944235, + 0.003118706401437521, + 0.0032186671160161495, + 0.003001126926392317, + 0.0020975489169359207 + ], + "gamma_dfa": NaN, + "acc_eval": 0.609375, + "loss_eval": 1.1547397375106812, + "epoch": 100 + } + ], + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": 0.007406219025142491, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 802.1658935546875, + 3058.3173828125, + 4910.8408203125, + 6491.31494140625, + 7304.1533203125 + ], + "bp_grad_norms_per_sample_med": [ + 2.526000798752648e-06, + 1.3625027577290894e-06, + 1.3747999219049234e-06, + 1.378283172925876e-06, + 1.3869492931917193e-06 + ], + "bp_grad_norms_F": [ + 0.00013306058826856315, + 7.476000610040501e-05, + 7.328101492021233e-05, + 7.293069211300462e-05, + 7.309897773666307e-05 + ], + "gamma_dfa": 0.08989996102172881, + "acc_eval": 0.310546875, + "loss_eval": 1.9283097982406616, + "epoch": 1 + }, + { + "hidden_norms": [ + 1580.1480712890625, + 13320.0517578125, + 22793.435546875, + 32440.041015625, + 37758.640625 + ], + "bp_grad_norms_per_sample_med": [ + 1.1427439403632889e-06, + 3.0901847480890865e-07, + 3.1107475706448895e-07, + 3.1377521736430936e-07, + 3.1722706239634135e-07 + ], + "bp_grad_norms_F": [ + 6.523138290503994e-05, + 2.3476462956750765e-05, + 2.0436000340851024e-05, + 1.96047385543352e-05, + 1.9654715288197622e-05 + ], + "gamma_dfa": 0.0858152944711037, + "acc_eval": 0.2880859375, + "loss_eval": 1.9359606504440308, + "epoch": 2 + }, + { + "hidden_norms": [ + 2343.090576171875, + 32438.32421875, + 58119.84375, + 87185.09375, + 104586.15625 + ], + "bp_grad_norms_per_sample_med": [ + 8.229510513046989e-07, + 1.3056541092737461e-07, + 1.2754330214193033e-07, + 1.2950138739142858e-07, + 1.2936459370394005e-07 + ], + "bp_grad_norms_F": [ + 0.0001579313538968563, + 2.960947858809959e-05, + 1.2371615412121173e-05, + 8.468440682918299e-06, + 7.067524620651966e-06 + ], + "gamma_dfa": 0.08629915304481983, + "acc_eval": 0.3017578125, + "loss_eval": 1.9288904666900635, + "epoch": 3 + }, + { + "hidden_norms": [ + 3129.4423828125, + 62780.5, + 117608.9375, + 182640.09375, + 223504.390625 + ], + "bp_grad_norms_per_sample_med": [ + 6.484323762379063e-07, + 7.041825256237644e-08, + 6.729855783760286e-08, + 6.816127040565334e-08, + 6.818439857170233e-08 + ], + "bp_grad_norms_F": [ + 2.9993034331710078e-05, + 2.8730657959386008e-06, + 2.3409718323819106e-06, + 2.367017486903933e-06, + 2.3597553990839515e-06 + ], + "gamma_dfa": 0.08862219587899745, + "acc_eval": 0.3076171875, + "loss_eval": 1.926429033279419, + "epoch": 4 + }, + { + "hidden_norms": [ + 3942.00390625, + 109015.7890625, + 203168.390625, + 329067.625, + 404167.84375 + ], + "bp_grad_norms_per_sample_med": [ + 5.148021386958135e-07, + 4.3746137379230277e-08, + 4.211498705330996e-08, + 4.271550579915129e-08, + 4.2616289164243426e-08 + ], + "bp_grad_norms_F": [ + 2.426102219033055e-05, + 1.769960135789006e-06, + 1.4341048881760798e-06, + 1.45279318530811e-06, + 1.44924592859752e-06 + ], + "gamma_dfa": 0.0876110177487135, + "acc_eval": 0.328125, + "loss_eval": 1.9219281673431396, + "epoch": 5 + }, + { + "hidden_norms": [ + 4737.880859375, + 173361.203125, + 331121.75, + 547707.8125, + 677363.375 + ], + "bp_grad_norms_per_sample_med": [ + 4.4596529846785415e-07, + 2.929639286719521e-08, + 2.8080462399771022e-08, + 2.8515311001342525e-08, + 2.847208158129888e-08 + ], + "bp_grad_norms_F": [ + 2.1308444047463126e-05, + 1.213497625940363e-06, + 9.622256129659945e-07, + 9.734020522955689e-07, + 9.715020041767275e-07 + ], + "gamma_dfa": 0.08417161786928773, + "acc_eval": 0.2919921875, + "loss_eval": 1.942756175994873, + "epoch": 6 + }, + { + "hidden_norms": [ + 5535.86865234375, + 258337.40625, + 501117.59375, + 823776.9375, + 1026549.875 + ], + "bp_grad_norms_per_sample_med": [ + 3.856409307445574e-07, + 2.2078769035260848e-08, + 2.0866384176088104e-08, + 2.09813144635973e-08, + 2.1003458527957264e-08 + ], + "bp_grad_norms_F": [ + 1.847265775722917e-05, + 8.849666528476519e-07, + 7.187628057181428e-07, + 7.262269718921743e-07, + 7.249743703141576e-07 + ], + "gamma_dfa": 0.08587896963581443, + "acc_eval": 0.2919921875, + "loss_eval": 1.9307396411895752, + "epoch": 7 + }, + { + "hidden_norms": [ + 6304.064453125, + 367445.5625, + 717525.125, + 1200281.0, + 1512872.125 + ], + "bp_grad_norms_per_sample_med": [ + 3.410295903449878e-07, + 1.670872862291617e-08, + 1.5770844186135946e-08, + 1.5891666649281433e-08, + 1.588542275499094e-08 + ], + "bp_grad_norms_F": [ + 1.6556636182940565e-05, + 6.716044254062581e-07, + 5.55544488634041e-07, + 5.606318040918268e-07, + 5.59783927656099e-07 + ], + "gamma_dfa": 0.08515941491350532, + "acc_eval": 0.306640625, + "loss_eval": 1.9279191493988037, + "epoch": 8 + }, + { + "hidden_norms": [ + 7086.48388671875, + 505478.71875, + 997925.8125, + 1708849.375, + 2150479.25 + ], + "bp_grad_norms_per_sample_med": [ + 3.013988703060022e-07, + 1.3297809964285534e-08, + 1.2481795153007624e-08, + 1.262175253202713e-08, + 1.2595491760691857e-08 + ], + "bp_grad_norms_F": [ + 1.4646101590187754e-05, + 5.195778953748231e-07, + 4.4164838186588895e-07, + 4.451969459751126e-07, + 4.4467057591646153e-07 + ], + "gamma_dfa": 0.08757842611521482, + "acc_eval": 0.318359375, + "loss_eval": 1.9144790172576904, + "epoch": 9 + }, + { + "hidden_norms": [ + 7891.7685546875, + 675713.625, + 1320934.25, + 2319375.25, + 2933561.75 + ], + "bp_grad_norms_per_sample_med": [ + 2.7613364750322944e-07, + 1.1096022767276281e-08, + 1.0442049891423721e-08, + 1.0500828651061056e-08, + 1.0485931234427426e-08 + ], + "bp_grad_norms_F": [ + 1.3369051885092631e-05, + 4.295688142974541e-07, + 3.6954631355001766e-07, + 3.72132660686475e-07, + 3.718281220699282e-07 + ], + "gamma_dfa": 0.08759273961186409, + "acc_eval": 0.3037109375, + "loss_eval": 1.928476095199585, + "epoch": 10 + }, + { + "hidden_norms": [ + 8605.7783203125, + 881309.9375, + 1719981.25, + 3048018.25, + 3848896.25 + ], + "bp_grad_norms_per_sample_med": [ + 2.546977952988527e-07, + 9.457612470953336e-09, + 8.959561981214392e-09, + 8.996098976865596e-09, + 8.995014511015142e-09 + ], + "bp_grad_norms_F": [ + 1.2278720532776788e-05, + 3.6486676435742993e-07, + 3.18511354180373e-07, + 3.204301890491479e-07, + 3.2022188634073245e-07 + ], + "gamma_dfa": 0.08920952118933201, + "acc_eval": 0.3017578125, + "loss_eval": 1.9193304777145386, + "epoch": 11 + }, + { + "hidden_norms": [ + 9378.4287109375, + 1120098.75, + 2197340.0, + 3930402.25, + 4945595.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.424853278171213e-07, + 8.285154784459792e-09, + 7.84627474104127e-09, + 7.900293752527432e-09, + 7.906582943917329e-09 + ], + "bp_grad_norms_F": [ + 1.1596725016715936e-05, + 3.161075028401683e-07, + 2.796709850372281e-07, + 2.81156104620095e-07, + 2.810372734529665e-07 + ], + "gamma_dfa": 0.09209982817992568, + "acc_eval": 0.287109375, + "loss_eval": 1.927558422088623, + "epoch": 12 + }, + { + "hidden_norms": [ + 10124.396484375, + 1412441.875, + 2752346.75, + 5010036.0, + 6325289.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.236940588318248e-07, + 7.092171738776187e-09, + 6.815563668993718e-09, + 6.8297678623707725e-09, + 6.830232379684276e-09 + ], + "bp_grad_norms_F": [ + 1.0770681910798885e-05, + 2.7517026524037647e-07, + 2.434409793750092e-07, + 2.4456548430862313e-07, + 2.445065661049739e-07 + ], + "gamma_dfa": 0.0919318727683276, + "acc_eval": 0.2900390625, + "loss_eval": 1.9280297756195068, + "epoch": 13 + }, + { + "hidden_norms": [ + 10873.9169921875, + 1726814.125, + 3365165.0, + 6225292.5, + 7941070.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.0750607632180618e-07, + 6.175024491739123e-09, + 5.938003866390318e-09, + 5.979505779407646e-09, + 5.979241990416995e-09 + ], + "bp_grad_norms_F": [ + 9.84854341368191e-06, + 2.3993459308258025e-07, + 2.1497004354387172e-07, + 2.1585482556929492e-07, + 2.1582005160780682e-07 + ], + "gamma_dfa": 0.09486197168007493, + "acc_eval": 0.2978515625, + "loss_eval": 1.9190003871917725, + "epoch": 14 + }, + { + "hidden_norms": [ + 11534.0087890625, + 2084976.25, + 4091674.75, + 7667605.5, + 9821730.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.9337822720899567e-07, + 5.5730837722478554e-09, + 5.387873702744628e-09, + 5.409793057964407e-09, + 5.415522696949893e-09 + ], + "bp_grad_norms_F": [ + 9.290296475228388e-06, + 2.1226249202754843e-07, + 1.9121620198347955e-07, + 1.9190700584204023e-07, + 1.9189823774468096e-07 + ], + "gamma_dfa": 0.09578572702594101, + "acc_eval": 0.28515625, + "loss_eval": 1.9317920207977295, + "epoch": 15 + }, + { + "hidden_norms": [ + 12231.0380859375, + 2494592.5, + 4969235.5, + 9387796.0, + 12017026.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7950755193396617e-07, + 4.997119606997558e-09, + 4.8298063326512874e-09, + 4.8657629037052175e-09, + 4.859395552614387e-09 + ], + "bp_grad_norms_F": [ + 8.774502930464223e-06, + 1.8752842834146577e-07, + 1.7071489821773866e-07, + 1.7126839679804107e-07, + 1.7126781415299774e-07 + ], + "gamma_dfa": 0.09745451644994318, + "acc_eval": 0.2978515625, + "loss_eval": 1.927154541015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 12895.0341796875, + 2937750.0, + 5861416.5, + 11095317.0, + 14303387.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7269709928768862e-07, + 4.551929055907067e-09, + 4.4097947515808755e-09, + 4.41813474694186e-09, + 4.416958798714177e-09 + ], + "bp_grad_norms_F": [ + 8.354931196663529e-06, + 1.7010511044190935e-07, + 1.556661288759642e-07, + 1.5612842219070444e-07, + 1.5612160098044114e-07 + ], + "gamma_dfa": 0.09986255329567939, + "acc_eval": 0.3115234375, + "loss_eval": 1.9158110618591309, + "epoch": 17 + }, + { + "hidden_norms": [ + 13624.58984375, + 3430302.75, + 6892795.0, + 13179784.0, + 16997646.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.642013387481711e-07, + 4.094950600830316e-09, + 4.012986831725129e-09, + 4.022568500516854e-09, + 4.023625876925507e-09 + ], + "bp_grad_norms_F": [ + 7.884121259849053e-06, + 1.54415545239317e-07, + 1.407240830531009e-07, + 1.411058434541701e-07, + 1.4110656820776057e-07 + ], + "gamma_dfa": 0.09882167540490627, + "acc_eval": 0.296875, + "loss_eval": 1.9182151556015015, + "epoch": 18 + }, + { + "hidden_norms": [ + 14323.6708984375, + 3985548.0, + 8076905.5, + 15465362.0, + 20015594.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.551940442823252e-07, + 3.79724474086629e-09, + 3.6876826037257615e-09, + 3.700401984829682e-09, + 3.6983835993709135e-09 + ], + "bp_grad_norms_F": [ + 7.607863608427579e-06, + 1.393282218487002e-07, + 1.283839452526081e-07, + 1.2869591614617093e-07, + 1.2869809040694236e-07 + ], + "gamma_dfa": 0.1002046266803518, + "acc_eval": 0.294921875, + "loss_eval": 1.9388974905014038, + "epoch": 19 + }, + { + "hidden_norms": [ + 14955.4462890625, + 4541631.5, + 9327444.0, + 17893654.0, + 23108114.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.4713883444983367e-07, + 3.464018405452407e-09, + 3.3744134153579353e-09, + 3.379040602879968e-09, + 3.381670721225305e-09 + ], + "bp_grad_norms_F": [ + 7.235442353703547e-06, + 1.2747574373861426e-07, + 1.1753004969250469e-07, + 1.1780696951291247e-07, + 1.1780796427274254e-07 + ], + "gamma_dfa": 0.10065551439765841, + "acc_eval": 0.30859375, + "loss_eval": 1.9343281984329224, + "epoch": 20 + }, + { + "hidden_norms": [ + 15583.8564453125, + 5145675.5, + 10628445.0, + 20547210.0, + 26561584.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.4314694851691456e-07, + 3.170894435911009e-09, + 3.083378885548882e-09, + 3.0910656256821767e-09, + 3.0932543193529227e-09 + ], + "bp_grad_norms_F": [ + 6.938716524018673e-06, + 1.1743370009753562e-07, + 1.0794892091325892e-07, + 1.0819184126376058e-07, + 1.0819199047773509e-07 + ], + "gamma_dfa": 0.10184943513013422, + "acc_eval": 0.3154296875, + "loss_eval": 1.9154099225997925, + "epoch": 21 + }, + { + "hidden_norms": [ + 16234.9208984375, + 5839592.5, + 12062968.0, + 23496628.0, + 30428386.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.379862197836701e-07, + 2.91886981251821e-09, + 2.8514124394973805e-09, + 2.8584146161136914e-09, + 2.860225389866855e-09 + ], + "bp_grad_norms_F": [ + 6.72459282213822e-06, + 1.0762735769276333e-07, + 9.920048427147776e-08, + 9.94118352082296e-08, + 9.941232548271728e-08 + ], + "gamma_dfa": 0.1024534439202398, + "acc_eval": 0.3095703125, + "loss_eval": 1.9225246906280518, + "epoch": 22 + }, + { + "hidden_norms": [ + 16833.765625, + 6566770.0, + 13630788.0, + 26729236.0, + 34665300.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.331996628550769e-07, + 2.688527622751735e-09, + 2.6381341555747895e-09, + 2.6441848710589966e-09, + 2.644968466469777e-09 + ], + "bp_grad_norms_F": [ + 6.5681074374879245e-06, + 9.902939268613409e-08, + 9.131563416531208e-08, + 9.149899682370233e-08, + 9.149922419737777e-08 + ], + "gamma_dfa": 0.10199526121141389, + "acc_eval": 0.30859375, + "loss_eval": 1.9233064651489258, + "epoch": 23 + }, + { + "hidden_norms": [ + 17456.634765625, + 7337101.0, + 15401232.0, + 30171576.0, + 39161244.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2747005939672817e-07, + 2.4809998500074926e-09, + 2.4282977850731413e-09, + 2.432346990488554e-09, + 2.431272960734532e-09 + ], + "bp_grad_norms_F": [ + 6.5036538217100315e-06, + 9.14754565428666e-08, + 8.484188640522916e-08, + 8.500099824004792e-08, + 8.500632731056612e-08 + ], + "gamma_dfa": 0.10456769005395472, + "acc_eval": 0.30078125, + "loss_eval": 1.9299731254577637, + "epoch": 24 + }, + { + "hidden_norms": [ + 18049.205078125, + 8139419.5, + 17132936.0, + 33801196.0, + 43890588.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2153788020441425e-07, + 2.2737314253618024e-09, + 2.2332342641817604e-09, + 2.232388940370811e-09, + 2.237900753598865e-09 + ], + "bp_grad_norms_F": [ + 6.099615802668268e-06, + 8.523231542767462e-08, + 7.842250226985925e-08, + 7.855853567662052e-08, + 7.856372263859157e-08 + ], + "gamma_dfa": 0.10287670505931601, + "acc_eval": 0.3232421875, + "loss_eval": 1.923604965209961, + "epoch": 25 + }, + { + "hidden_norms": [ + 18644.9375, + 9035569.0, + 19136636.0, + 37813052.0, + 49194300.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.212478508705317e-07, + 2.0938955014315752e-09, + 2.0560451119422396e-09, + 2.058360148993188e-09, + 2.061209425363586e-09 + ], + "bp_grad_norms_F": [ + 5.810702987218974e-06, + 7.886949049407121e-08, + 7.294480752761956e-08, + 7.307144755941408e-08, + 7.307325233796291e-08 + ], + "gamma_dfa": 0.10249267728067935, + "acc_eval": 0.3037109375, + "loss_eval": 1.9200568199157715, + "epoch": 26 + }, + { + "hidden_norms": [ + 19280.703125, + 9952065.0, + 21071430.0, + 41963900.0, + 54690120.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1414142875310063e-07, + 1.9668882078605066e-09, + 1.928355919389446e-09, + 1.9296169107008154e-09, + 1.929810311551705e-09 + ], + "bp_grad_norms_F": [ + 5.566818344959756e-06, + 7.357547104902551e-08, + 6.781976935599232e-08, + 6.792832607516175e-08, + 6.79302942785398e-08 + ], + "gamma_dfa": 0.10335587273584679, + "acc_eval": 0.310546875, + "loss_eval": 1.92685067653656, + "epoch": 27 + }, + { + "hidden_norms": [ + 19887.205078125, + 10899353.0, + 23080260.0, + 46142640.0, + 60105148.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1361055385350483e-07, + 1.8462845696731733e-09, + 1.815088412904231e-09, + 1.8113950339682106e-09, + 1.8156832704008252e-09 + ], + "bp_grad_norms_F": [ + 5.398809662437998e-06, + 6.89453401037099e-08, + 6.4051612014282e-08, + 6.414857267600382e-08, + 6.415204012455433e-08 + ], + "gamma_dfa": 0.10455695656128228, + "acc_eval": 0.302734375, + "loss_eval": 1.923227310180664, + "epoch": 28 + }, + { + "hidden_norms": [ + 20438.587890625, + 11953376.0, + 25259200.0, + 50259240.0, + 65732368.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1073134231764925e-07, + 1.7497674420496878e-09, + 1.7245866956727696e-09, + 1.7265968654811559e-09, + 1.727246901062074e-09 + ], + "bp_grad_norms_F": [ + 5.281461653794395e-06, + 6.489771209317041e-08, + 6.026093046784808e-08, + 6.034837696233808e-08, + 6.035197941400838e-08 + ], + "gamma_dfa": 0.10511547370697372, + "acc_eval": 0.326171875, + "loss_eval": 1.9300421476364136, + "epoch": 29 + }, + { + "hidden_norms": [ + 20991.0234375, + 13017462.0, + 27475572.0, + 54971628.0, + 71927184.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0625635837868685e-07, + 1.6529324575742521e-09, + 1.6255721213553898e-09, + 1.6247864165208625e-09, + 1.6244732226056158e-09 + ], + "bp_grad_norms_F": [ + 5.098012934467988e-06, + 6.077872427567854e-08, + 5.674080227890954e-08, + 5.681971870785674e-08, + 5.6821534144546604e-08 + ], + "gamma_dfa": 0.10590779440826736, + "acc_eval": 0.3017578125, + "loss_eval": 1.9211739301681519, + "epoch": 30 + }, + { + "hidden_norms": [ + 21617.34765625, + 14125094.0, + 29881326.0, + 59926964.0, + 78189832.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0433515029717455e-07, + 1.5471924852406005e-09, + 1.5234034034250499e-09, + 1.5246930384904545e-09, + 1.5239296491387222e-09 + ], + "bp_grad_norms_F": [ + 4.977115622750716e-06, + 5.780140810429657e-08, + 5.362210941939338e-08, + 5.3694908075385683e-08, + 5.369727773540944e-08 + ], + "gamma_dfa": 0.10481705865822732, + "acc_eval": 0.3212890625, + "loss_eval": 1.9209015369415283, + "epoch": 31 + }, + { + "hidden_norms": [ + 22126.13671875, + 15300531.0, + 32579362.0, + 65167536.0, + 85083400.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0149238249823611e-07, + 1.4551810867402537e-09, + 1.4291762218121562e-09, + 1.432274854273885e-09, + 1.4318950469771607e-09 + ], + "bp_grad_norms_F": [ + 4.9215527724300046e-06, + 5.434217342781267e-08, + 5.088266163966182e-08, + 5.094950239481477e-08, + 5.0953229191463834e-08 + ], + "gamma_dfa": 0.10599250381346792, + "acc_eval": 0.30859375, + "loss_eval": 1.9330241680145264, + "epoch": 32 + }, + { + "hidden_norms": [ + 22662.396484375, + 16481282.0, + 35263600.0, + 70793304.0, + 92166136.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.882934648430819e-08, + 1.3810197430075277e-09, + 1.3668104426045602e-09, + 1.3675354182396404e-09, + 1.366150526038723e-09 + ], + "bp_grad_norms_F": [ + 4.6740801735722926e-06, + 5.137474090588512e-08, + 4.796589792022132e-08, + 4.802501862855024e-08, + 4.8027377630432966e-08 + ], + "gamma_dfa": 0.10529429838061333, + "acc_eval": 0.3115234375, + "loss_eval": 1.9205418825149536, + "epoch": 33 + }, + { + "hidden_norms": [ + 23192.3125, + 17779744.0, + 38108720.0, + 76522688.0, + 99643120.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.530750588737646e-08, + 1.3089170858293642e-09, + 1.2901538726239892e-09, + 1.2906937740808644e-09, + 1.2914372904404559e-09 + ], + "bp_grad_norms_F": [ + 4.669429472414777e-06, + 4.88593805414439e-08, + 4.5740907950175824e-08, + 4.579441181817856e-08, + 4.5798362435789386e-08 + ], + "gamma_dfa": 0.1058788642694708, + "acc_eval": 0.30078125, + "loss_eval": 1.9393997192382812, + "epoch": 34 + }, + { + "hidden_norms": [ + 23683.251953125, + 18992256.0, + 40936536.0, + 82030200.0, + 106929248.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.458356942104729e-08, + 1.2407530558533608e-09, + 1.2231146095942336e-09, + 1.2233244417458877e-09, + 1.2247586278490985e-09 + ], + "bp_grad_norms_F": [ + 4.483116299525136e-06, + 4.651869289773458e-08, + 4.358627236911161e-08, + 4.363666050721804e-08, + 4.3638891611408326e-08 + ], + "gamma_dfa": 0.10620562738040462, + "acc_eval": 0.3251953125, + "loss_eval": 1.9221802949905396, + "epoch": 35 + }, + { + "hidden_norms": [ + 24223.7265625, + 20421224.0, + 43883308.0, + 87849264.0, + 114523200.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.247051480087976e-08, + 1.182353992490448e-09, + 1.1679496259020539e-09, + 1.169668362166476e-09, + 1.1697178781133744e-09 + ], + "bp_grad_norms_F": [ + 4.388592969917227e-06, + 4.4431864409943955e-08, + 4.157495325785021e-08, + 4.162143696362364e-08, + 4.16235543809762e-08 + ], + "gamma_dfa": 0.10484841075958684, + "acc_eval": 0.2998046875, + "loss_eval": 1.9306102991104126, + "epoch": 36 + }, + { + "hidden_norms": [ + 24732.05078125, + 21765008.0, + 46887340.0, + 93818392.0, + 122372552.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.012441637423763e-08, + 1.1452657711075176e-09, + 1.1280866241136778e-09, + 1.1283430856323662e-09, + 1.1287816237270931e-09 + ], + "bp_grad_norms_F": [ + 4.297942268749466e-06, + 4.29258228962226e-08, + 3.9989565436826524e-08, + 4.003141995667647e-08, + 4.003394948881578e-08 + ], + "gamma_dfa": 0.10523941312567331, + "acc_eval": 0.302734375, + "loss_eval": 1.9360214471817017, + "epoch": 37 + }, + { + "hidden_norms": [ + 25179.26953125, + 23094218.0, + 50076040.0, + 100053064.0, + 130605352.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.80345041309738e-08, + 1.0831726626747695e-09, + 1.0690409668612233e-09, + 1.0700328401114234e-09, + 1.0692404739387484e-09 + ], + "bp_grad_norms_F": [ + 4.235343567415839e-06, + 4.072955306355652e-08, + 3.817867622046833e-08, + 3.8218924913735464e-08, + 3.822109917450689e-08 + ], + "gamma_dfa": 0.10568258634884842, + "acc_eval": 0.3193359375, + "loss_eval": 1.927825689315796, + "epoch": 38 + }, + { + "hidden_norms": [ + 25586.23828125, + 24470240.0, + 53013036.0, + 105981368.0, + 138543408.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.783595717432036e-08, + 1.0381262516290235e-09, + 1.0265919225815878e-09, + 1.0273364381419015e-09, + 1.0274008310773297e-09 + ], + "bp_grad_norms_F": [ + 4.177269602223532e-06, + 3.924894187434802e-08, + 3.684685978555535e-08, + 3.688498040332888e-08, + 3.688741045948518e-08 + ], + "gamma_dfa": 0.10561428684741259, + "acc_eval": 0.302734375, + "loss_eval": 1.9321579933166504, + "epoch": 39 + }, + { + "hidden_norms": [ + 26049.974609375, + 25812240.0, + 56223324.0, + 112200904.0, + 146978224.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.555475972116255e-08, + 9.982903392824483e-10, + 9.87055215340149e-10, + 9.8631947054173e-10, + 9.876408579856388e-10 + ], + "bp_grad_norms_F": [ + 4.088252808287507e-06, + 3.767732792425704e-08, + 3.5331073178213046e-08, + 3.536514370239274e-08, + 3.5367978767908426e-08 + ], + "gamma_dfa": 0.10579964506905526, + "acc_eval": 0.318359375, + "loss_eval": 1.930686116218567, + "epoch": 40 + }, + { + "hidden_norms": [ + 26467.328125, + 27200558.0, + 59437036.0, + 118688848.0, + 155514592.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.46039256430231e-08, + 9.647596055373242e-10, + 9.512606258255119e-10, + 9.511659238015113e-10, + 9.522146404705722e-10 + ], + "bp_grad_norms_F": [ + 4.015588729089359e-06, + 3.636354861669133e-08, + 3.413835614196614e-08, + 3.417060767674229e-08, + 3.417307326003538e-08 + ], + "gamma_dfa": 0.10565257369307801, + "acc_eval": 0.314453125, + "loss_eval": 1.9317667484283447, + "epoch": 41 + }, + { + "hidden_norms": [ + 26919.3671875, + 28678974.0, + 62716300.0, + 125549296.0, + 163974208.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.232915860162393e-08, + 9.29719468079071e-10, + 9.197844152986079e-10, + 9.194760508535182e-10, + 9.196678418810222e-10 + ], + "bp_grad_norms_F": [ + 3.951602138840826e-06, + 3.508949220076829e-08, + 3.2971975372220186e-08, + 3.3001178678659926e-08, + 3.300409190387654e-08 + ], + "gamma_dfa": 0.10566475696396083, + "acc_eval": 0.3056640625, + "loss_eval": 1.9284584522247314, + "epoch": 42 + }, + { + "hidden_norms": [ + 27317.033203125, + 30078810.0, + 66046968.0, + 132107504.0, + 172659440.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.130339068657122e-08, + 9.03509489447174e-10, + 8.925334360476711e-10, + 8.917908633776506e-10, + 8.925368222278962e-10 + ], + "bp_grad_norms_F": [ + 3.9174719859147444e-06, + 3.398368519924588e-08, + 3.1965900149089066e-08, + 3.199273024279137e-08, + 3.199540898890518e-08 + ], + "gamma_dfa": 0.10646540904417634, + "acc_eval": 0.3115234375, + "loss_eval": 1.9241154193878174, + "epoch": 43 + }, + { + "hidden_norms": [ + 27715.529296875, + 31383778.0, + 69356640.0, + 138681856.0, + 181338928.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.031172171740764e-08, + 8.735605017129444e-10, + 8.597746958827202e-10, + 8.612066615398817e-10, + 8.621173774869817e-10 + ], + "bp_grad_norms_F": [ + 3.837071290035965e-06, + 3.286310601424702e-08, + 3.101721191001161e-08, + 3.104238288642591e-08, + 3.104513979224066e-08 + ], + "gamma_dfa": 0.10568622383289039, + "acc_eval": 0.2939453125, + "loss_eval": 1.938409447669983, + "epoch": 44 + }, + { + "hidden_norms": [ + 28149.3203125, + 32840858.0, + 72848112.0, + 145667440.0, + 190265088.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.894184506085367e-08, + 8.401777051858517e-10, + 8.299890774665641e-10, + 8.304122944835512e-10, + 8.303523979513727e-10 + ], + "bp_grad_norms_F": [ + 3.798121497311513e-06, + 3.184389640864538e-08, + 3.004597459721481e-08, + 3.0069060130699654e-08, + 3.007191295978373e-08 + ], + "gamma_dfa": 0.10558789351489395, + "acc_eval": 0.3037109375, + "loss_eval": 1.9300565719604492, + "epoch": 45 + }, + { + "hidden_norms": [ + 28522.55078125, + 34358040.0, + 76134080.0, + 152412848.0, + 198973936.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.830858095303483e-08, + 8.109956595170331e-10, + 8.036356025087343e-10, + 8.033995135825478e-10, + 8.031720843959533e-10 + ], + "bp_grad_norms_F": [ + 3.7768336369481403e-06, + 3.096561229654071e-08, + 2.9296373327269976e-08, + 2.9317961391939207e-08, + 2.9320871064442144e-08 + ], + "gamma_dfa": 0.10623026502435096, + "acc_eval": 0.3115234375, + "loss_eval": 1.930029273033142, + "epoch": 46 + }, + { + "hidden_norms": [ + 28924.912109375, + 35808620.0, + 79629336.0, + 159269824.0, + 208087264.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.754207587140627e-08, + 7.940589297206202e-10, + 7.852188899093449e-10, + 7.844204730211857e-10, + 7.861447048895798e-10 + ], + "bp_grad_norms_F": [ + 3.695072564369184e-06, + 3.0030403053160626e-08, + 2.8479737679276695e-08, + 2.849986913133762e-08, + 2.8502654458861798e-08 + ], + "gamma_dfa": 0.1059467513114214, + "acc_eval": 0.30078125, + "loss_eval": 1.9284684658050537, + "epoch": 47 + }, + { + "hidden_norms": [ + 29289.236328125, + 37312204.0, + 83049256.0, + 165977216.0, + 216710016.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.562951509498816e-08, + 7.782112176890621e-10, + 7.675478586044449e-10, + 7.666810519779688e-10, + 7.681388303204528e-10 + ], + "bp_grad_norms_F": [ + 3.6269300380809e-06, + 2.9297559933638695e-08, + 2.782604902051844e-08, + 2.7844757610751003e-08, + 2.7847393724300673e-08 + ], + "gamma_dfa": 0.10581977141555399, + "acc_eval": 0.3037109375, + "loss_eval": 1.9282777309417725, + "epoch": 48 + }, + { + "hidden_norms": [ + 29638.296875, + 38754036.0, + 86627536.0, + 172893504.0, + 225686464.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.50456763398688e-08, + 7.526539391733422e-10, + 7.443530236628249e-10, + 7.439299176681402e-10, + 7.444729277494844e-10 + ], + "bp_grad_norms_F": [ + 3.6355218071548734e-06, + 2.845291824371543e-08, + 2.7127033064289208e-08, + 2.714476821097378e-08, + 2.7147471826083347e-08 + ], + "gamma_dfa": 0.1066790189652238, + "acc_eval": 0.3056640625, + "loss_eval": 1.925389051437378, + "epoch": 49 + }, + { + "hidden_norms": [ + 29950.615234375, + 40150236.0, + 90007640.0, + 179977856.0, + 235206976.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.382724476201474e-08, + 7.370593024802474e-10, + 7.280710478951846e-10, + 7.283330605289962e-10, + 7.279294389483937e-10 + ], + "bp_grad_norms_F": [ + 3.5918935736845015e-06, + 2.7770946431360244e-08, + 2.6450262424759785e-08, + 2.6465910352158062e-08, + 2.6468752523101102e-08 + ], + "gamma_dfa": 0.10654840966162737, + "acc_eval": 0.3076171875, + "loss_eval": 1.929931402206421, + "epoch": 50 + }, + { + "hidden_norms": [ + 30266.310546875, + 41604512.0, + 93401064.0, + 187075808.0, + 244203616.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.343555097349963e-08, + 7.144400626657443e-10, + 7.057154305378788e-10, + 7.05836944447924e-10, + 7.073042707084198e-10 + ], + "bp_grad_norms_F": [ + 3.5134323752572527e-06, + 2.7063506990998576e-08, + 2.580901536930469e-08, + 2.582418012764265e-08, + 2.582707381293403e-08 + ], + "gamma_dfa": 0.10640880587743595, + "acc_eval": 0.314453125, + "loss_eval": 1.9268465042114258, + "epoch": 51 + }, + { + "hidden_norms": [ + 30588.291015625, + 43073320.0, + 96898208.0, + 193783280.0, + 253267328.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.257300893570573e-08, + 6.925075513031231e-10, + 6.871804236752155e-10, + 6.855109813130866e-10, + 6.860176871015256e-10 + ], + "bp_grad_norms_F": [ + 3.4990612221008632e-06, + 2.652852693074692e-08, + 2.5297810068991566e-08, + 2.5311907236869047e-08, + 2.531497678148753e-08 + ], + "gamma_dfa": 0.10629434209840838, + "acc_eval": 0.3125, + "loss_eval": 1.932523488998413, + "epoch": 52 + }, + { + "hidden_norms": [ + 30898.34765625, + 44412940.0, + 100019336.0, + 199966816.0, + 261667760.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.140450719589353e-08, + 6.861456958162648e-10, + 6.789319106914604e-10, + 6.784582895491553e-10, + 6.785109696316738e-10 + ], + "bp_grad_norms_F": [ + 3.470987167020212e-06, + 2.5969489669819268e-08, + 2.478421379237261e-08, + 2.479695204726795e-08, + 2.4800137055080995e-08 + ], + "gamma_dfa": 0.1070190458704019, + "acc_eval": 0.310546875, + "loss_eval": 1.932159662246704, + "epoch": 53 + }, + { + "hidden_norms": [ + 31188.375, + 45820600.0, + 103429992.0, + 206547120.0, + 270181600.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.079076169702603e-08, + 6.688025688816879e-10, + 6.633480986728557e-10, + 6.629659043966285e-10, + 6.630911930649575e-10 + ], + "bp_grad_norms_F": [ + 3.4183981370006222e-06, + 2.540217280966317e-08, + 2.4278467236626966e-08, + 2.4290830680229192e-08, + 2.429379897250783e-08 + ], + "gamma_dfa": 0.10550818023330066, + "acc_eval": 0.2998046875, + "loss_eval": 1.9357173442840576, + "epoch": 54 + }, + { + "hidden_norms": [ + 31478.2109375, + 47178892.0, + 107044784.0, + 213196560.0, + 278895232.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.016877390242371e-08, + 6.609012226377331e-10, + 6.520708972779232e-10, + 6.519841333485488e-10, + 6.530669338644657e-10 + ], + "bp_grad_norms_F": [ + 3.405668167033582e-06, + 2.4965938649756936e-08, + 2.3893584000234114e-08, + 2.390493669679472e-08, + 2.390810749375305e-08 + ], + "gamma_dfa": 0.10673638083972037, + "acc_eval": 0.294921875, + "loss_eval": 1.9359304904937744, + "epoch": 55 + }, + { + "hidden_norms": [ + 31753.5859375, + 48563264.0, + 110454832.0, + 219550528.0, + 287320896.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.007908919831607e-08, + 6.483197867446222e-10, + 6.408613084651904e-10, + 6.410805775125539e-10, + 6.409432429244077e-10 + ], + "bp_grad_norms_F": [ + 3.369002797626308e-06, + 2.447991498399915e-08, + 2.3494733270013057e-08, + 2.350535943662635e-08, + 2.350850003551841e-08 + ], + "gamma_dfa": 0.10726616549072787, + "acc_eval": 0.3076171875, + "loss_eval": 1.9281866550445557, + "epoch": 56 + }, + { + "hidden_norms": [ + 32002.76953125, + 49866268.0, + 113724368.0, + 225759120.0, + 295231328.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.914736161434121e-08, + 6.332004365283694e-10, + 6.232644400583354e-10, + 6.233273341926804e-10, + 6.240686856173738e-10 + ], + "bp_grad_norms_F": [ + 3.3845158213807736e-06, + 2.415495181651295e-08, + 2.3192731291032942e-08, + 2.3202973764568924e-08, + 2.3206132127029377e-08 + ], + "gamma_dfa": 0.10715722179156728, + "acc_eval": 0.3095703125, + "loss_eval": 1.9343407154083252, + "epoch": 57 + }, + { + "hidden_norms": [ + 32277.291015625, + 51206064.0, + 116617608.0, + 231756352.0, + 303064864.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.926612172719615e-08, + 6.240719607752965e-10, + 6.182420131395361e-10, + 6.17405682135086e-10, + 6.178215161689593e-10 + ], + "bp_grad_norms_F": [ + 3.317889877507696e-06, + 2.3704412654979024e-08, + 2.2745311412109004e-08, + 2.2754765183208292e-08, + 2.2757769002623718e-08 + ], + "gamma_dfa": 0.10657632350921631, + "acc_eval": 0.302734375, + "loss_eval": 1.9305057525634766, + "epoch": 58 + }, + { + "hidden_norms": [ + 32521.890625, + 52538716.0, + 119605040.0, + 237773904.0, + 310920672.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.805787933217289e-08, + 6.190028489783117e-10, + 6.10553496649402e-10, + 6.107545580391616e-10, + 6.10922701316241e-10 + ], + "bp_grad_norms_F": [ + 3.2823897981870687e-06, + 2.3313557306892108e-08, + 2.2385792775025948e-08, + 2.239448981811165e-08, + 2.239757002087117e-08 + ], + "gamma_dfa": 0.10671919275773689, + "acc_eval": 0.302734375, + "loss_eval": 1.9269468784332275, + "epoch": 59 + }, + { + "hidden_norms": [ + 32717.80859375, + 53698120.0, + 122676120.0, + 243745136.0, + 318772768.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.75130422678194e-08, + 6.033377686343044e-10, + 5.948920800413759e-10, + 5.949861159315617e-10, + 5.951407144877408e-10 + ], + "bp_grad_norms_F": [ + 3.2588357044005534e-06, + 2.2926835541170476e-08, + 2.205681148836902e-08, + 2.206508220581327e-08, + 2.2068283200837868e-08 + ], + "gamma_dfa": 0.10711025857017376, + "acc_eval": 0.314453125, + "loss_eval": 1.9273767471313477, + "epoch": 60 + }, + { + "hidden_norms": [ + 32950.74609375, + 54885932.0, + 125689616.0, + 249312240.0, + 326217856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.673791119737871e-08, + 5.923626589243725e-10, + 5.863842189590684e-10, + 5.866296337586618e-10, + 5.870876007563197e-10 + ], + "bp_grad_norms_F": [ + 3.2307948458765168e-06, + 2.2597017590442192e-08, + 2.1738133071380616e-08, + 2.1745805156569986e-08, + 2.1749071876797643e-08 + ], + "gamma_dfa": 0.10673619594308548, + "acc_eval": 0.31640625, + "loss_eval": 1.9271256923675537, + "epoch": 61 + }, + { + "hidden_norms": [ + 33148.1328125, + 55976648.0, + 128534072.0, + 254655232.0, + 333162784.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.663199769718631e-08, + 5.852057172184288e-10, + 5.787633705622852e-10, + 5.792484825128952e-10, + 5.793157620281875e-10 + ], + "bp_grad_norms_F": [ + 3.197097157681128e-06, + 2.2320827852695402e-08, + 2.1484760637235922e-08, + 2.149219824332249e-08, + 2.1495376145708178e-08 + ], + "gamma_dfa": 0.10659754439257085, + "acc_eval": 0.310546875, + "loss_eval": 1.9244905710220337, + "epoch": 62 + }, + { + "hidden_norms": [ + 33369.18359375, + 57164716.0, + 131352720.0, + 259876736.0, + 339964160.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.583201184184873e-08, + 5.737598174349046e-10, + 5.67273561458137e-10, + 5.66656666034504e-10, + 5.665773961105458e-10 + ], + "bp_grad_norms_F": [ + 3.2037539767770795e-06, + 2.2096731555620863e-08, + 2.127841902677119e-08, + 2.1285371687440602e-08, + 2.1288625973170383e-08 + ], + "gamma_dfa": 0.10679806087864563, + "acc_eval": 0.3154296875, + "loss_eval": 1.9308257102966309, + "epoch": 63 + }, + { + "hidden_norms": [ + 33540.88671875, + 58301528.0, + 133722112.0, + 264798368.0, + 346396256.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.606099844930213e-08, + 5.686319748399171e-10, + 5.629098853709991e-10, + 5.619399945366865e-10, + 5.626447086015673e-10 + ], + "bp_grad_norms_F": [ + 3.1530219075648347e-06, + 2.1766210167584177e-08, + 2.0992644067518995e-08, + 2.0999330274662498e-08, + 2.1002534822400776e-08 + ], + "gamma_dfa": 0.10647483140928671, + "acc_eval": 0.3115234375, + "loss_eval": 1.925765037536621, + "epoch": 64 + }, + { + "hidden_norms": [ + 33728.984375, + 59420104.0, + 136277376.0, + 270265568.0, + 353408672.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.57889458466343e-08, + 5.627094901150542e-10, + 5.575621631059846e-10, + 5.567652450189087e-10, + 5.571588745922895e-10 + ], + "bp_grad_norms_F": [ + 3.138873807984055e-06, + 2.1483266721133987e-08, + 2.0736742101234995e-08, + 2.0742897177683517e-08, + 2.0746110607205992e-08 + ], + "gamma_dfa": 0.10677585859230021, + "acc_eval": 0.3154296875, + "loss_eval": 1.9289934635162354, + "epoch": 65 + }, + { + "hidden_norms": [ + 33919.515625, + 60492864.0, + 138846208.0, + 275456896.0, + 359821632.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.451340084367985e-08, + 5.607461717183071e-10, + 5.556192728128906e-10, + 5.553609239150603e-10, + 5.557289628477236e-10 + ], + "bp_grad_norms_F": [ + 3.125772991552367e-06, + 2.1269308092541905e-08, + 2.0518179155715188e-08, + 2.052397540808215e-08, + 2.0527094690692138e-08 + ], + "gamma_dfa": 0.10671760967670707, + "acc_eval": 0.3125, + "loss_eval": 1.9296305179595947, + "epoch": 66 + }, + { + "hidden_norms": [ + 34098.5, + 61508056.0, + 141295472.0, + 280204000.0, + 365860768.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.474934366451635e-08, + 5.519530943409734e-10, + 5.459506735583375e-10, + 5.446967876743258e-10, + 5.452004958605983e-10 + ], + "bp_grad_norms_F": [ + 3.1189638320938684e-06, + 2.1083655710185667e-08, + 2.0349753881987453e-08, + 2.0355370722313637e-08, + 2.0358520202989894e-08 + ], + "gamma_dfa": 0.10652847628807649, + "acc_eval": 0.3046875, + "loss_eval": 1.9298161268234253, + "epoch": 67 + }, + { + "hidden_norms": [ + 34267.96875, + 62529272.0, + 143621744.0, + 284772064.0, + 371754336.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.392743046035321e-08, + 5.466314068058864e-10, + 5.412825743178473e-10, + 5.413390846698007e-10, + 5.416116999334974e-10 + ], + "bp_grad_norms_F": [ + 3.0790877190156607e-06, + 2.0871810946232472e-08, + 2.0159163227617682e-08, + 2.0164401703937074e-08, + 2.0167590264463797e-08 + ], + "gamma_dfa": 0.10652959482831648, + "acc_eval": 0.298828125, + "loss_eval": 1.926388144493103, + "epoch": 68 + }, + { + "hidden_norms": [ + 34420.42578125, + 63473892.0, + 145906128.0, + 289224256.0, + 377581856.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.427427479138714e-08, + 5.377295275721394e-10, + 5.307561612433176e-10, + 5.305922923248829e-10, + 5.308011252758149e-10 + ], + "bp_grad_norms_F": [ + 3.096157115578535e-06, + 2.067219107004803e-08, + 2.0005694878477698e-08, + 2.001087118230771e-08, + 2.001400645212925e-08 + ], + "gamma_dfa": 0.10710431921324925, + "acc_eval": 0.310546875, + "loss_eval": 1.9277684688568115, + "epoch": 69 + }, + { + "hidden_norms": [ + 34573.87890625, + 64328388.0, + 148036320.0, + 293257856.0, + 382751104.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.389419127117435e-08, + 5.373848033229933e-10, + 5.314943485323909e-10, + 5.314927387090052e-10, + 5.31539035009132e-10 + ], + "bp_grad_norms_F": [ + 3.072862682529376e-06, + 2.049388392322271e-08, + 1.98319511923728e-08, + 1.9836669196138246e-08, + 1.9840014076066836e-08 + ], + "gamma_dfa": 0.10700461147644091, + "acc_eval": 0.3076171875, + "loss_eval": 1.9307092428207397, + "epoch": 70 + }, + { + "hidden_norms": [ + 34690.74609375, + 65142160.0, + 150006800.0, + 297046144.0, + 387685792.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.348407310952098e-08, + 5.322000062868426e-10, + 5.271332259582096e-10, + 5.264539360005926e-10, + 5.263872671079639e-10 + ], + "bp_grad_norms_F": [ + 3.055365141335642e-06, + 2.0346906381973895e-08, + 1.9688986441224188e-08, + 1.969357477094036e-08, + 1.969680063496071e-08 + ], + "gamma_dfa": 0.10688555391971022, + "acc_eval": 0.314453125, + "loss_eval": 1.9277830123901367, + "epoch": 71 + }, + { + "hidden_norms": [ + 34818.79296875, + 65891160.0, + 151813680.0, + 300644832.0, + 392342848.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.302482802311715e-08, + 5.310150652526602e-10, + 5.265936020570905e-10, + 5.26124921407245e-10, + 5.26482579754628e-10 + ], + "bp_grad_norms_F": [ + 3.027237426067586e-06, + 2.0201985861945104e-08, + 1.9550000729395833e-08, + 1.955433681644081e-08, + 1.9557578667672715e-08 + ], + "gamma_dfa": 0.10652808679151349, + "acc_eval": 0.2998046875, + "loss_eval": 1.9273805618286133, + "epoch": 72 + }, + { + "hidden_norms": [ + 34951.515625, + 66590476.0, + 153730848.0, + 304118720.0, + 396925408.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.403244157127119e-08, + 5.26472032635894e-10, + 5.205495479110311e-10, + 5.201504782448296e-10, + 5.20502474454787e-10 + ], + "bp_grad_norms_F": [ + 3.0631524623458972e-06, + 2.0121730059941e-08, + 1.9494045488954725e-08, + 1.9498189729461046e-08, + 1.950143335704979e-08 + ], + "gamma_dfa": 0.1070192107144976, + "acc_eval": 0.3017578125, + "loss_eval": 1.934456467628479, + "epoch": 73 + }, + { + "hidden_norms": [ + 35056.31640625, + 67311408.0, + 155368816.0, + 307494752.0, + 401124448.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.303329769252741e-08, + 5.209726539057158e-10, + 5.160313842900166e-10, + 5.156270965755994e-10, + 5.161130411934778e-10 + ], + "bp_grad_norms_F": [ + 3.0127189347695094e-06, + 1.993531562050066e-08, + 1.93110221147208e-08, + 1.9314887467203334e-08, + 1.9318180832783582e-08 + ], + "gamma_dfa": 0.10658633662387729, + "acc_eval": 0.3076171875, + "loss_eval": 1.9260145425796509, + "epoch": 74 + }, + { + "hidden_norms": [ + 35158.68359375, + 67933192.0, + 157091536.0, + 310654048.0, + 405321344.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.339039515523837e-08, + 5.170803230036825e-10, + 5.107546607874269e-10, + 5.104218714357955e-10, + 5.108970468903351e-10 + ], + "bp_grad_norms_F": [ + 3.0164017061906634e-06, + 1.9819051289005074e-08, + 1.921591774589615e-08, + 1.921967651696832e-08, + 1.9223040936822144e-08 + ], + "gamma_dfa": 0.10703902837121859, + "acc_eval": 0.3095703125, + "loss_eval": 1.927987813949585, + "epoch": 75 + }, + { + "hidden_norms": [ + 35270.68359375, + 68510120.0, + 158496816.0, + 313641408.0, + 409130592.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.246813200050383e-08, + 5.133981018090594e-10, + 5.070178166199923e-10, + 5.070903141835004e-10, + 5.071925657240683e-10 + ], + "bp_grad_norms_F": [ + 3.004009158757981e-06, + 1.970923690919335e-08, + 1.910464320076244e-08, + 1.9108172821802327e-08, + 1.9111526583515115e-08 + ], + "gamma_dfa": 0.1070477613247931, + "acc_eval": 0.3193359375, + "loss_eval": 1.9260926246643066, + "epoch": 76 + }, + { + "hidden_norms": [ + 35364.3125, + 69078320.0, + 159830400.0, + 316294976.0, + 412518496.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.217867820623724e-08, + 5.12098419225282e-10, + 5.052269158589695e-10, + 5.058938268298618e-10, + 5.053178431246863e-10 + ], + "bp_grad_norms_F": [ + 2.9913805974501884e-06, + 1.9599063705300068e-08, + 1.900307999846973e-08, + 1.9006522578024487e-08, + 1.9009846141671005e-08 + ], + "gamma_dfa": 0.10688473540358245, + "acc_eval": 0.3076171875, + "loss_eval": 1.926918864250183, + "epoch": 77 + }, + { + "hidden_norms": [ + 35441.375, + 69602704.0, + 161117808.0, + 318818240.0, + 415766208.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.249013040360296e-08, + 5.102671063461628e-10, + 5.039960671027188e-10, + 5.038492956188634e-10, + 5.034740402365401e-10 + ], + "bp_grad_norms_F": [ + 2.9863124382245587e-06, + 1.9512324200832154e-08, + 1.8926254341522508e-08, + 1.8929529943534362e-08, + 1.8932860612608238e-08 + ], + "gamma_dfa": 0.10701000291737728, + "acc_eval": 0.306640625, + "loss_eval": 1.9271972179412842, + "epoch": 78 + }, + { + "hidden_norms": [ + 35514.78125, + 70081152.0, + 162190624.0, + 321009312.0, + 418699392.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.149930698029493e-08, + 5.099357047733122e-10, + 5.055039165036135e-10, + 5.048302331722709e-10, + 5.054044960317583e-10 + ], + "bp_grad_norms_F": [ + 2.969128445329261e-06, + 1.9427163877594467e-08, + 1.883810085701043e-08, + 1.884115441441736e-08, + 1.884450639977331e-08 + ], + "gamma_dfa": 0.10680000087450026, + "acc_eval": 0.3017578125, + "loss_eval": 1.9285144805908203, + "epoch": 79 + }, + { + "hidden_norms": [ + 35582.9765625, + 70499392.0, + 163284976.0, + 323095264.0, + 421363552.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.187113399391819e-08, + 5.05410657769545e-10, + 4.990756696798826e-10, + 4.979930912085706e-10, + 4.985904467069702e-10 + ], + "bp_grad_norms_F": [ + 2.9715449727518717e-06, + 1.9354965630213883e-08, + 1.877567434860339e-08, + 1.8778711918798763e-08, + 1.8782076338652587e-08 + ], + "gamma_dfa": 0.10694103027344681, + "acc_eval": 0.310546875, + "loss_eval": 1.92802095413208, + "epoch": 80 + }, + { + "hidden_norms": [ + 35639.56640625, + 70899536.0, + 164253712.0, + 324923200.0, + 423745824.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.238182237439105e-08, + 5.018311322046998e-10, + 4.970572842211141e-10, + 4.953790155859394e-10, + 4.961450694729308e-10 + ], + "bp_grad_norms_F": [ + 2.971921048811055e-06, + 1.9296171771543413e-08, + 1.872837351868384e-08, + 1.8731368456315067e-08, + 1.873476662694884e-08 + ], + "gamma_dfa": 0.10704115682892734, + "acc_eval": 0.3076171875, + "loss_eval": 1.926428198814392, + "epoch": 81 + }, + { + "hidden_norms": [ + 35689.78515625, + 71256024.0, + 165127008.0, + 326618208.0, + 425949792.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.238117578050151e-08, + 4.972192657604069e-10, + 4.926972718699574e-10, + 4.921834606541609e-10, + 4.923969565417963e-10 + ], + "bp_grad_norms_F": [ + 2.9655700473085744e-06, + 1.9235280035445612e-08, + 1.8671270751724478e-08, + 1.8674217727721043e-08, + 1.8677596358429582e-08 + ], + "gamma_dfa": 0.10696214074414456, + "acc_eval": 0.3056640625, + "loss_eval": 1.924986481666565, + "epoch": 82 + }, + { + "hidden_norms": [ + 35742.58984375, + 71595640.0, + 165912336.0, + 328130016.0, + 427838752.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.213700487478491e-08, + 4.983659041002397e-10, + 4.936055453264032e-10, + 4.941617670617404e-10, + 4.939196274200697e-10 + ], + "bp_grad_norms_F": [ + 2.951217993540922e-06, + 1.919361736213432e-08, + 1.863161003257119e-08, + 1.8634468190725784e-08, + 1.8637845045077484e-08 + ], + "gamma_dfa": 0.10690056857129093, + "acc_eval": 0.3046875, + "loss_eval": 1.9250625371932983, + "epoch": 83 + }, + { + "hidden_norms": [ + 35784.6640625, + 71885704.0, + 166691376.0, + 329546848.0, + 429668704.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.175997668833588e-08, + 4.971995593017198e-10, + 4.919967211414189e-10, + 4.91977791838849e-10, + 4.926699603835516e-10 + ], + "bp_grad_norms_F": [ + 2.9550594717875356e-06, + 1.9144454910247077e-08, + 1.8583381944381472e-08, + 1.858614595562358e-08, + 1.8589524586332118e-08 + ], + "gamma_dfa": 0.10689649073174223, + "acc_eval": 0.3076171875, + "loss_eval": 1.926330327987671, + "epoch": 84 + }, + { + "hidden_norms": [ + 35822.33984375, + 72122744.0, + 167344016.0, + 330816224.0, + 431313312.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.139300978702522e-08, + 4.980582613001161e-10, + 4.935602482269985e-10, + 4.934832542602408e-10, + 4.934415098745148e-10 + ], + "bp_grad_norms_F": [ + 2.9577784061984858e-06, + 1.9112555094125128e-08, + 1.8551357783280764e-08, + 1.8553992120473595e-08, + 1.8557404501962083e-08 + ], + "gamma_dfa": 0.10689723303948995, + "acc_eval": 0.3056640625, + "loss_eval": 1.9307332038879395, + "epoch": 85 + }, + { + "hidden_norms": [ + 35859.390625, + 72358304.0, + 167947920.0, + 331984992.0, + 432823232.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.135296359843778e-08, + 4.947317000514317e-10, + 4.903184525062443e-10, + 4.896648087004962e-10, + 4.905649775288623e-10 + ], + "bp_grad_norms_F": [ + 2.9511427328543505e-06, + 1.906450464161935e-08, + 1.8504644927475056e-08, + 1.8507259724742653e-08, + 1.8510663224446944e-08 + ], + "gamma_dfa": 0.10684622721601045, + "acc_eval": 0.314453125, + "loss_eval": 1.9271869659423828, + "epoch": 86 + }, + { + "hidden_norms": [ + 35888.20703125, + 72553136.0, + 168401376.0, + 332911328.0, + 434057600.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.163116239576993e-08, + 4.935953312745767e-10, + 4.904400219274407e-10, + 4.890517990574494e-10, + 4.891231308867816e-10 + ], + "bp_grad_norms_F": [ + 2.9438597266562283e-06, + 1.902795432329185e-08, + 1.8475304841558682e-08, + 1.8477877006262133e-08, + 1.848129471682114e-08 + ], + "gamma_dfa": 0.10682923735294025, + "acc_eval": 0.30859375, + "loss_eval": 1.9263050556182861, + "epoch": 87 + }, + { + "hidden_norms": [ + 35914.35546875, + 72735848.0, + 168823680.0, + 333752736.0, + 435137376.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.153870657499283e-08, + 4.920966967247864e-10, + 4.894144534084433e-10, + 4.876969939004994e-10, + 4.884483928435657e-10 + ], + "bp_grad_norms_F": [ + 2.9408777209027903e-06, + 1.8999060102942167e-08, + 1.8450597494279464e-08, + 1.8453114591920894e-08, + 1.84565323024799e-08 + ], + "gamma_dfa": 0.10694600266288035, + "acc_eval": 0.3115234375, + "loss_eval": 1.9252078533172607, + "epoch": 88 + }, + { + "hidden_norms": [ + 35936.5546875, + 72887360.0, + 169178624.0, + 334467840.0, + 436061952.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.168602340039797e-08, + 4.908231043820876e-10, + 4.854965318656923e-10, + 4.846267276370497e-10, + 4.847209300606892e-10 + ], + "bp_grad_norms_F": [ + 2.945510459539946e-06, + 1.8982424521141184e-08, + 1.8438125692910035e-08, + 1.844062857969675e-08, + 1.8444072935608347e-08 + ], + "gamma_dfa": 0.10697454003093299, + "acc_eval": 0.3134765625, + "loss_eval": 1.9264906644821167, + "epoch": 89 + }, + { + "hidden_norms": [ + 35955.3671875, + 73005808.0, + 169498240.0, + 335085920.0, + 436862656.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.152810527737529e-08, + 4.922047214250824e-10, + 4.872572900715966e-10, + 4.873856318532432e-10, + 4.87353157829773e-10 + ], + "bp_grad_norms_F": [ + 2.9327068205020623e-06, + 1.8955052638602865e-08, + 1.8409036073308016e-08, + 1.8411496327530585e-08, + 1.841491403808959e-08 + ], + "gamma_dfa": 0.10689280136284651, + "acc_eval": 0.3095703125, + "loss_eval": 1.9255037307739258, + "epoch": 90 + }, + { + "hidden_norms": [ + 35973.34375, + 73111368.0, + 169770208.0, + 335584768.0, + 437507744.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.107820382794671e-08, + 4.92519802719471e-10, + 4.876242187812352e-10, + 4.871342773604681e-10, + 4.873002001914983e-10 + ], + "bp_grad_norms_F": [ + 2.9368579816946294e-06, + 1.8944499302619988e-08, + 1.839602603581625e-08, + 1.8398441881117833e-08, + 1.8401848933535803e-08 + ], + "gamma_dfa": 0.10685028225998394, + "acc_eval": 0.306640625, + "loss_eval": 1.9265596866607666, + "epoch": 91 + }, + { + "hidden_norms": [ + 35985.046875, + 73193336.0, + 169984976.0, + 335981920.0, + 438037376.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.100844984757714e-08, + 4.92902163529152e-10, + 4.862484304091197e-10, + 4.871591463562197e-10, + 4.871424374996991e-10 + ], + "bp_grad_norms_F": [ + 2.930574055426405e-06, + 1.8926412437281215e-08, + 1.8379486377284593e-08, + 1.8381888011731462e-08, + 1.8385312827717826e-08 + ], + "gamma_dfa": 0.106783474504482, + "acc_eval": 0.30859375, + "loss_eval": 1.9269328117370605, + "epoch": 92 + }, + { + "hidden_norms": [ + 35994.07421875, + 73256784.0, + 170148048.0, + 336300032.0, + 438460544.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.113810968599864e-08, + 4.918689899824358e-10, + 4.860293834063611e-10, + 4.857191315821296e-10, + 4.859731506101639e-10 + ], + "bp_grad_norms_F": [ + 2.9313273444131482e-06, + 1.8918141719836967e-08, + 1.8372302790226058e-08, + 1.837469731924557e-08, + 1.8378123911588773e-08 + ], + "gamma_dfa": 0.10685011067107553, + "acc_eval": 0.3095703125, + "loss_eval": 1.9262909889221191, + "epoch": 93 + }, + { + "hidden_norms": [ + 36002.55078125, + 73308792.0, + 170289472.0, + 336572864.0, + 438812896.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.121508988599089e-08, + 4.917221074762779e-10, + 4.853899504553283e-10, + 4.847242052186118e-10, + 4.849394219519354e-10 + ], + "bp_grad_norms_F": [ + 2.933722271336592e-06, + 1.8911242349872737e-08, + 1.8366764109600808e-08, + 1.836915508590664e-08, + 1.8372583454606684e-08 + ], + "gamma_dfa": 0.10693995938345324, + "acc_eval": 0.3076171875, + "loss_eval": 1.9261877536773682, + "epoch": 94 + }, + { + "hidden_norms": [ + 36008.01953125, + 73348264.0, + 170386624.0, + 336761248.0, + 439049248.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.123732987362018e-08, + 4.916126949972011e-10, + 4.860848945575924e-10, + 4.87389184566922e-10, + 4.868180303319036e-10 + ], + "bp_grad_norms_F": [ + 2.9306668238859857e-06, + 1.8901717524499873e-08, + 1.835805107930355e-08, + 1.8360427844754668e-08, + 1.836385976616839e-08 + ], + "gamma_dfa": 0.10689331469620811, + "acc_eval": 0.30859375, + "loss_eval": 1.9260027408599854, + "epoch": 95 + }, + { + "hidden_norms": [ + 36011.9296875, + 73372720.0, + 170447072.0, + 336878464.0, + 439192800.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.115104156378948e-08, + 4.911633877391353e-10, + 4.862875657707377e-10, + 4.868677128122556e-10, + 4.867456437906981e-10 + ], + "bp_grad_norms_F": [ + 2.9297382297954755e-06, + 1.889710254943111e-08, + 1.8353631503487122e-08, + 1.835600293986772e-08, + 1.8359434861281443e-08 + ], + "gamma_dfa": 0.1068731502891751, + "acc_eval": 0.306640625, + "loss_eval": 1.9261021614074707, + "epoch": 96 + }, + { + "hidden_norms": [ + 36014.109375, + 73385416.0, + 170481184.0, + 336945120.0, + 439280128.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.12362214269524e-08, + 4.916780316222003e-10, + 4.858832225451692e-10, + 4.867402036978774e-10, + 4.862423241824843e-10 + ], + "bp_grad_norms_F": [ + 2.930293021563557e-06, + 1.8895260467388653e-08, + 1.8352444897118403e-08, + 1.835481810985584e-08, + 1.8358248254912723e-08 + ], + "gamma_dfa": 0.10688256371940952, + "acc_eval": 0.3095703125, + "loss_eval": 1.926184892654419, + "epoch": 97 + }, + { + "hidden_norms": [ + 36015.9375, + 73396752.0, + 170510784.0, + 337001056.0, + 439352832.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.120947659837839e-08, + 4.916590468084792e-10, + 4.857179658479538e-10, + 4.86417739420375e-10, + 4.85919415815772e-10 + ], + "bp_grad_norms_F": [ + 2.930209348050994e-06, + 1.889360845552801e-08, + 1.835070939648631e-08, + 1.8353080832866908e-08, + 1.835651275428063e-08 + ], + "gamma_dfa": 0.10688149025372695, + "acc_eval": 0.306640625, + "loss_eval": 1.9262256622314453, + "epoch": 98 + }, + { + "hidden_norms": [ + 36016.734375, + 73401888.0, + 170523312.0, + 337026592.0, + 439384864.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.119820028516187e-08, + 4.917350415745148e-10, + 4.857160784688119e-10, + 4.860361002556601e-10, + 4.855379431845108e-10 + ], + "bp_grad_norms_F": [ + 2.9303794235602254e-06, + 1.8893027586841526e-08, + 1.835026353091962e-08, + 1.835263319094338e-08, + 1.83560651123571e-08 + ], + "gamma_dfa": 0.10688879482768243, + "acc_eval": 0.3076171875, + "loss_eval": 1.926223874092102, + "epoch": 99 + }, + { + "hidden_norms": [ + 36016.7734375, + 73401992.0, + 170523904.0, + 337027392.0, + 439386048.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.120198747794348e-08, + 4.91758134213427e-10, + 4.857037549932386e-10, + 4.860785107752008e-10, + 4.855802981929003e-10 + ], + "bp_grad_norms_F": [ + 2.9303721476026112e-06, + 1.8893056008550957e-08, + 1.8350315045267962e-08, + 1.8352682928934883e-08, + 1.8356114850348604e-08 + ], + "gamma_dfa": 0.1068887785077095, + "acc_eval": 0.3076171875, + "loss_eval": 1.926220417022705, + "epoch": 100 + } + ] +}
\ No newline at end of file |
