summaryrefslogtreecommitdiff
path: root/results/snapshot_evolution_v2/snapshot_evolution_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_evolution_s42.json')
-rw-r--r--results/snapshot_evolution_v2/snapshot_evolution_s42.json5473
1 files changed, 5473 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_evolution_s42.json b/results/snapshot_evolution_v2/snapshot_evolution_s42.json
new file mode 100644
index 0000000..fb4a73e
--- /dev/null
+++ b/results/snapshot_evolution_v2/snapshot_evolution_s42.json
@@ -0,0 +1,5473 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_evolution_v2",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 42,
+ "depth": 4,
+ "d_hidden": 256,
+ "log_every": 1
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "bp_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010068593546748161,
+ 0.000997236929833889,
+ 0.0009934091940522194,
+ 0.0009870644425973296,
+ 0.0009829498594626784
+ ],
+ "bp_grad_norms_F": [
+ 0.03544403985142708,
+ 0.03507080301642418,
+ 0.03477022796869278,
+ 0.03443896397948265,
+ 0.03407429903745651
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.115234375,
+ "loss_eval": 2.383650302886963,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 77.06888580322266,
+ 79.12034606933594,
+ 82.7389144897461,
+ 87.31297302246094,
+ 93.80765533447266
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.941955532762222e-05,
+ 5.619435978587717e-05,
+ 5.499917097040452e-05,
+ 5.5899512517498806e-05,
+ 5.7389137509744614e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026216788683086634,
+ 0.0023027872666716576,
+ 0.002111479640007019,
+ 0.002080164849758148,
+ 0.0021061261650174856
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3798828125,
+ "loss_eval": 1.6751981973648071,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 98.86981201171875,
+ 98.9476089477539,
+ 102.55016326904297,
+ 106.3559341430664,
+ 112.6939697265625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.658113539335318e-05,
+ 4.402571721584536e-05,
+ 4.2862800910370424e-05,
+ 4.381770850159228e-05,
+ 4.3870313675142825e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00196655560284853,
+ 0.0018041934818029404,
+ 0.0016866555670276284,
+ 0.0016513779992237687,
+ 0.0016559252981096506
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4541015625,
+ "loss_eval": 1.5228025913238525,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 110.40647888183594,
+ 112.07202911376953,
+ 114.70049285888672,
+ 117.17343139648438,
+ 124.54205322265625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4490061554824933e-05,
+ 4.3751915654866025e-05,
+ 4.270448334864341e-05,
+ 4.182140401098877e-05,
+ 4.151134271523915e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0019047901732847095,
+ 0.0017693191766738892,
+ 0.0016821600729599595,
+ 0.0016251102788373828,
+ 0.0015800207620486617
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.4697265625,
+ "loss_eval": 1.4416429996490479,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 125.09136199951172,
+ 126.65565490722656,
+ 128.4573974609375,
+ 130.39990234375,
+ 138.1091766357422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.1048842831514776e-05,
+ 4.0168823034036905e-05,
+ 3.916600326192565e-05,
+ 3.953508348786272e-05,
+ 3.938759255106561e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017511667683720589,
+ 0.001639657886698842,
+ 0.0015659942291676998,
+ 0.0015107291983440518,
+ 0.0014574137749150395
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.50390625,
+ "loss_eval": 1.3718887567520142,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 139.76705932617188,
+ 139.05606079101562,
+ 139.5422821044922,
+ 141.0078582763672,
+ 148.9493865966797
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.957379158237018e-05,
+ 4.0101109334500507e-05,
+ 3.9158370782388374e-05,
+ 3.927717261831276e-05,
+ 3.796629243879579e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017042789841070771,
+ 0.001630594371818006,
+ 0.0015700262738391757,
+ 0.0015037605771794915,
+ 0.0014294973807409406
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.498046875,
+ "loss_eval": 1.367867112159729,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 147.73207092285156,
+ 148.01638793945312,
+ 148.1798553466797,
+ 149.07754516601562,
+ 156.61810302734375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.987981835962273e-05,
+ 3.9670325350016356e-05,
+ 3.970034231315367e-05,
+ 3.8273319660220295e-05,
+ 3.6929654015693814e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017687880899757147,
+ 0.001693942816928029,
+ 0.0016310750506818295,
+ 0.0015193652361631393,
+ 0.0014129421906545758
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5234375,
+ "loss_eval": 1.3461639881134033,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 159.30731201171875,
+ 158.4180450439453,
+ 158.36903381347656,
+ 158.61819458007812,
+ 165.9392547607422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.744649075088091e-05,
+ 3.805281448876485e-05,
+ 3.727989678736776e-05,
+ 3.5814937291434035e-05,
+ 3.422912777750753e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017357978504151106,
+ 0.0016663926653563976,
+ 0.0016097063198685646,
+ 0.0014966910239309072,
+ 0.001379394088871777
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5283203125,
+ "loss_eval": 1.3227663040161133,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 171.02230834960938,
+ 169.76348876953125,
+ 168.44949340820312,
+ 168.26429748535156,
+ 176.89520263671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.716369246831164e-05,
+ 3.8349648093571886e-05,
+ 3.801397542702034e-05,
+ 3.6082456063013524e-05,
+ 3.359258334967308e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016445739893242717,
+ 0.001604317338205874,
+ 0.0015634173760190606,
+ 0.0014586447505280375,
+ 0.0013399318559095263
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.541015625,
+ "loss_eval": 1.2933616638183594,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 177.41796875,
+ 177.29603576660156,
+ 175.89486694335938,
+ 175.0777587890625,
+ 181.38400268554688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.602267679525539e-05,
+ 3.6796918720938265e-05,
+ 3.648500933195464e-05,
+ 3.566688246792182e-05,
+ 3.4070406400132924e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015903833555057645,
+ 0.0015696624759584665,
+ 0.0015270623844116926,
+ 0.0014402325032278895,
+ 0.0013178731314837933
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5478515625,
+ "loss_eval": 1.2806801795959473,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 187.4056854248047,
+ 186.72698974609375,
+ 186.21583557128906,
+ 185.0518035888672,
+ 193.2371063232422
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3276784961344674e-05,
+ 3.436602492001839e-05,
+ 3.432494486332871e-05,
+ 3.371347702341154e-05,
+ 3.1834206311032176e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014970082556828856,
+ 0.0014613966923207045,
+ 0.001435543643310666,
+ 0.001374539453536272,
+ 0.0012561712646856904
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.56640625,
+ "loss_eval": 1.2740942239761353,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 194.4965057373047,
+ 191.25531005859375,
+ 189.80703735351562,
+ 188.18850708007812,
+ 195.7776336669922
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.298965748399496e-05,
+ 3.40789083566051e-05,
+ 3.381206624908373e-05,
+ 3.3352327591273934e-05,
+ 3.1442876206710935e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015152172418311238,
+ 0.001501554623246193,
+ 0.0014814225723966956,
+ 0.001403055852279067,
+ 0.001272345893085003
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.560546875,
+ "loss_eval": 1.265188455581665,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 200.5504913330078,
+ 197.28366088867188,
+ 195.27011108398438,
+ 192.64669799804688,
+ 200.8507843017578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.453825775068253e-05,
+ 3.5414250305620953e-05,
+ 3.575523442123085e-05,
+ 3.455601472523995e-05,
+ 3.2858857593964785e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001518857548944652,
+ 0.001502488274127245,
+ 0.0014838415663689375,
+ 0.001404650043696165,
+ 0.0012748484732583165
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5458984375,
+ "loss_eval": 1.2733395099639893,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 207.21469116210938,
+ 202.24969482421875,
+ 198.8241424560547,
+ 197.5497283935547,
+ 207.32147216796875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2123080018209293e-05,
+ 3.345572258695029e-05,
+ 3.3888838515849784e-05,
+ 3.344774086144753e-05,
+ 3.095310239586979e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014620382571592927,
+ 0.0014708929229527712,
+ 0.0014657732099294662,
+ 0.0013834136771038175,
+ 0.0012381445849314332
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.56640625,
+ "loss_eval": 1.2357412576675415,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 214.6268310546875,
+ 208.3655242919922,
+ 205.5032501220703,
+ 202.8442840576172,
+ 211.64646911621094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.207657573511824e-05,
+ 3.362155257491395e-05,
+ 3.38435493176803e-05,
+ 3.330525942146778e-05,
+ 3.142434434266761e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014900992391631007,
+ 0.0015044353203848004,
+ 0.001489310641773045,
+ 0.0014063691487535834,
+ 0.0012448005145415664
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.56640625,
+ "loss_eval": 1.2451550960540771,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 220.40109252929688,
+ 213.53439331054688,
+ 209.3384552001953,
+ 206.62062072753906,
+ 213.82391357421875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.227095294278115e-05,
+ 3.415472019696608e-05,
+ 3.4918764868052676e-05,
+ 3.409514465602115e-05,
+ 3.082074908888899e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015189005061984062,
+ 0.001544533297419548,
+ 0.0015320393722504377,
+ 0.0014468894805759192,
+ 0.0012609416153281927
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.564453125,
+ "loss_eval": 1.248854398727417,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 226.32350158691406,
+ 219.70506286621094,
+ 213.84132385253906,
+ 210.67050170898438,
+ 219.11776733398438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.360298796906136e-05,
+ 3.4720324038062245e-05,
+ 3.473780452623032e-05,
+ 3.412307341932319e-05,
+ 3.0327399144880474e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014919604873284698,
+ 0.0015073713148012757,
+ 0.001499581034295261,
+ 0.001411686884239316,
+ 0.0012323390692472458
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.57421875,
+ "loss_eval": 1.2207037210464478,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 230.78538513183594,
+ 223.432373046875,
+ 216.73037719726562,
+ 212.86383056640625,
+ 220.8701171875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.253064278396778e-05,
+ 3.3939610148081556e-05,
+ 3.490943709039129e-05,
+ 3.4084565413650125e-05,
+ 3.0307599445222877e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015068502398207784,
+ 0.0015421892749145627,
+ 0.0015326113207265735,
+ 0.0014369196724146605,
+ 0.0012492147507146
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.560546875,
+ "loss_eval": 1.216906189918518,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 234.5084991455078,
+ 225.73875427246094,
+ 219.08822631835938,
+ 214.42320251464844,
+ 222.92369079589844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.451363227213733e-05,
+ 3.6047003959538415e-05,
+ 3.654924512375146e-05,
+ 3.617065158323385e-05,
+ 3.275999551988207e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001566705177538097,
+ 0.0015968933003023267,
+ 0.0015981856267899275,
+ 0.0014931216137483716,
+ 0.0012800253462046385
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5556640625,
+ "loss_eval": 1.2483153343200684,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 238.0281219482422,
+ 229.677734375,
+ 223.0265350341797,
+ 217.872314453125,
+ 225.45947265625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4922632039524615e-05,
+ 3.6500507121672854e-05,
+ 3.762893902603537e-05,
+ 3.615105015342124e-05,
+ 3.2680742151569575e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015319561352953315,
+ 0.001577642629854381,
+ 0.001574998372234404,
+ 0.0014754259027540684,
+ 0.0012637749314308167
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5576171875,
+ "loss_eval": 1.2469550371170044,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 241.45298767089844,
+ 233.28753662109375,
+ 226.9265899658203,
+ 222.43453979492188,
+ 229.83859252929688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.368386751390062e-05,
+ 3.570445187506266e-05,
+ 3.622082658694126e-05,
+ 3.5024619137402624e-05,
+ 3.180970816174522e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015120706520974636,
+ 0.0015433274675160646,
+ 0.0015402185963466763,
+ 0.0014465245185419917,
+ 0.001252179266884923
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5634765625,
+ "loss_eval": 1.2113828659057617,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 246.53602600097656,
+ 236.25527954101562,
+ 231.07940673828125,
+ 227.7357940673828,
+ 235.99017333984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2015348551794887e-05,
+ 3.388321783859283e-05,
+ 3.521092003211379e-05,
+ 3.46749002346769e-05,
+ 3.079533780692145e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014757646713405848,
+ 0.001517578144557774,
+ 0.0015156606677919626,
+ 0.00144051609095186,
+ 0.0012491638772189617
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.576171875,
+ "loss_eval": 1.2042850255966187,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 250.74209594726562,
+ 241.11993408203125,
+ 232.76829528808594,
+ 228.410400390625,
+ 237.100341796875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.173810910084285e-05,
+ 3.328004459035583e-05,
+ 3.405071402085014e-05,
+ 3.34872274834197e-05,
+ 3.07901827909518e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0014801323413848877,
+ 0.0015176001470535994,
+ 0.0015198889886960387,
+ 0.0014302636263892055,
+ 0.001232756651006639
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.587890625,
+ "loss_eval": 1.1819555759429932,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 251.96310424804688,
+ 242.98260498046875,
+ 235.83056640625,
+ 229.86978149414062,
+ 238.271240234375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.078249574173242e-05,
+ 3.301461765659042e-05,
+ 3.3559550502104685e-05,
+ 3.2682331948308274e-05,
+ 2.9418402846204117e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00149905972648412,
+ 0.0015357647789642215,
+ 0.0015457755653187633,
+ 0.0014610268408432603,
+ 0.0012446421897038817
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5732421875,
+ "loss_eval": 1.1770297288894653,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 255.878662109375,
+ 244.79376220703125,
+ 236.5006561279297,
+ 233.29434204101562,
+ 239.50732421875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.191530049662106e-05,
+ 3.370656486367807e-05,
+ 3.539594035828486e-05,
+ 3.486185596557334e-05,
+ 3.131559424218722e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001507170731201768,
+ 0.0015490618534386158,
+ 0.0015714912442490458,
+ 0.0014840371441096067,
+ 0.0012607484823092818
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.572265625,
+ "loss_eval": 1.2011631727218628,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 256.66448974609375,
+ 244.18772888183594,
+ 236.46058654785156,
+ 231.88583374023438,
+ 238.06246948242188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2962809200398624e-05,
+ 3.441200897214003e-05,
+ 3.570063927327283e-05,
+ 3.488562651909888e-05,
+ 3.0770879675401375e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015825299778953195,
+ 0.0016350955702364445,
+ 0.0016404123743996024,
+ 0.0015316286589950323,
+ 0.0012829666957259178
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5703125,
+ "loss_eval": 1.192138433456421,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 259.5942687988281,
+ 247.43173217773438,
+ 239.85533142089844,
+ 233.21835327148438,
+ 241.53346252441406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.1691903132013977e-05,
+ 3.34988217218779e-05,
+ 3.45351618307177e-05,
+ 3.441058288444765e-05,
+ 3.0752617021789774e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015797498635947704,
+ 0.0016322932206094265,
+ 0.001641901326365769,
+ 0.0015325341373682022,
+ 0.0012732355389744043
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5791015625,
+ "loss_eval": 1.1775751113891602,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 260.6902770996094,
+ 249.26528930664062,
+ 240.86239624023438,
+ 235.91477966308594,
+ 242.1553497314453
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.32598174281884e-05,
+ 3.471180752967484e-05,
+ 3.609888517530635e-05,
+ 3.496996214380488e-05,
+ 3.091244798270054e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015408779727295041,
+ 0.001589508610777557,
+ 0.0016157848294824362,
+ 0.0015165223740041256,
+ 0.0012689991854131222
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5859375,
+ "loss_eval": 1.1941479444503784,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 265.0726623535156,
+ 253.6020050048828,
+ 244.876953125,
+ 239.7056427001953,
+ 248.2157440185547
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.255613773944788e-05,
+ 3.457435013842769e-05,
+ 3.5964570997748524e-05,
+ 3.529110108502209e-05,
+ 3.089939127676189e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001513357157818973,
+ 0.0015594394644722342,
+ 0.0015772230690345168,
+ 0.001489063142798841,
+ 0.0012491336092352867
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5810546875,
+ "loss_eval": 1.1790356636047363,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 266.9394836425781,
+ 253.8067169189453,
+ 243.13002014160156,
+ 236.81365966796875,
+ 245.42434692382812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.378500332473777e-05,
+ 3.5516346542863175e-05,
+ 3.742165063158609e-05,
+ 3.6865043512079865e-05,
+ 3.170729542034678e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015557212755084038,
+ 0.0016067115357145667,
+ 0.001632526982575655,
+ 0.0015416526002809405,
+ 0.0012708577560260892
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.1785690784454346,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 271.3736572265625,
+ 257.6708984375,
+ 246.3377685546875,
+ 240.7875213623047,
+ 248.55162048339844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2452040613861755e-05,
+ 3.456772174104117e-05,
+ 3.550515975803137e-05,
+ 3.530189496814273e-05,
+ 3.098960587522015e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015420741401612759,
+ 0.0016120158834382892,
+ 0.0016289768973365426,
+ 0.0015373170608654618,
+ 0.0012695658951997757
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.57421875,
+ "loss_eval": 1.1686367988586426,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 270.6155090332031,
+ 256.5137634277344,
+ 246.4404296875,
+ 238.71493530273438,
+ 245.14651489257812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4225693525513634e-05,
+ 3.6208981327945367e-05,
+ 3.771808042074554e-05,
+ 3.671547892736271e-05,
+ 3.175914389430545e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016278985422104597,
+ 0.00169221474789083,
+ 0.0017131771892309189,
+ 0.0016123101813718677,
+ 0.001308745937421918
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.572265625,
+ "loss_eval": 1.1706045866012573,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 271.2703552246094,
+ 258.5479431152344,
+ 247.48568725585938,
+ 241.0449676513672,
+ 248.61419677734375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.370125705259852e-05,
+ 3.563391510397196e-05,
+ 3.776583253056742e-05,
+ 3.622193253249861e-05,
+ 3.1177536584436893e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001631051884032786,
+ 0.0016799280419945717,
+ 0.0016939701745286584,
+ 0.001596588990651071,
+ 0.0012989162933081388
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.576171875,
+ "loss_eval": 1.1757416725158691,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 271.5987854003906,
+ 257.3157043457031,
+ 247.04425048828125,
+ 239.22933959960938,
+ 247.08534240722656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.276485949754715e-05,
+ 3.4356282412773e-05,
+ 3.570897752069868e-05,
+ 3.5391843994148076e-05,
+ 3.004215977853164e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0015858211554586887,
+ 0.0016445693327113986,
+ 0.0016775003168731928,
+ 0.0015801271656528115,
+ 0.0012829708866775036
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5947265625,
+ "loss_eval": 1.1316245794296265,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 276.85565185546875,
+ 262.14959716796875,
+ 248.80125427246094,
+ 239.6945037841797,
+ 246.55982971191406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.424682654440403e-05,
+ 3.617212496465072e-05,
+ 3.731884135049768e-05,
+ 3.583814759622328e-05,
+ 3.1317249522544444e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001694253645837307,
+ 0.0017545269802212715,
+ 0.0017868074355646968,
+ 0.0016729168128222227,
+ 0.0013285611057654023
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.1637687683105469,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 274.4824523925781,
+ 260.23223876953125,
+ 249.41390991210938,
+ 242.22657775878906,
+ 248.33303833007812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.4118878829758614e-05,
+ 3.6190944229019806e-05,
+ 3.7162455555517226e-05,
+ 3.6398294469108805e-05,
+ 3.1276995287043974e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016947221010923386,
+ 0.0017584856832399964,
+ 0.0017846780829131603,
+ 0.0016663862625136971,
+ 0.0013457784662023187
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5830078125,
+ "loss_eval": 1.1625440120697021,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 279.3048095703125,
+ 263.830810546875,
+ 250.07839965820312,
+ 242.9677276611328,
+ 248.742431640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.378376641194336e-05,
+ 3.623673183028586e-05,
+ 3.8036723708501086e-05,
+ 3.8026879337849095e-05,
+ 3.20856343023479e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016582749085500836,
+ 0.001725532696582377,
+ 0.0017548021860420704,
+ 0.0016622358234599233,
+ 0.0013314742827787995
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58203125,
+ "loss_eval": 1.1663323640823364,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 277.88153076171875,
+ 263.3263244628906,
+ 254.0471954345703,
+ 246.00294494628906,
+ 251.6592559814453
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.402382935746573e-05,
+ 3.644815296866e-05,
+ 3.812061549979262e-05,
+ 3.8299189327517524e-05,
+ 3.244871550123207e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016575837507843971,
+ 0.001726161572150886,
+ 0.0017651193775236607,
+ 0.001658888068050146,
+ 0.001325216144323349
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5849609375,
+ "loss_eval": 1.1578618288040161,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 278.96038818359375,
+ 264.09832763671875,
+ 252.11532592773438,
+ 243.7300567626953,
+ 250.29537963867188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.398891203687526e-05,
+ 3.60828016710002e-05,
+ 3.8209349440876395e-05,
+ 3.6874149373034015e-05,
+ 3.130899858660996e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0016938851913437247,
+ 0.0017578925471752882,
+ 0.0017999019473791122,
+ 0.0016839306335896254,
+ 0.0013463495997712016
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1660709381103516,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 279.11102294921875,
+ 262.8247375488281,
+ 250.32635498046875,
+ 241.73477172851562,
+ 246.8911590576172
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.476023630355485e-05,
+ 3.673156606964767e-05,
+ 3.8200654671527445e-05,
+ 3.745179856196046e-05,
+ 3.111823389190249e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017367384862154722,
+ 0.001807119813747704,
+ 0.0018404393922537565,
+ 0.0017188042402267456,
+ 0.0013523433590307832
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58984375,
+ "loss_eval": 1.1548914909362793,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 278.79083251953125,
+ 263.49237060546875,
+ 252.0679931640625,
+ 243.65948486328125,
+ 249.34564208984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3709933632053435e-05,
+ 3.595885937102139e-05,
+ 3.795271186390892e-05,
+ 3.70899579138495e-05,
+ 3.1362116715172306e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017184949247166514,
+ 0.0017862631939351559,
+ 0.0018348938319832087,
+ 0.0017180118011310697,
+ 0.0013606568099930882
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.591796875,
+ "loss_eval": 1.159794569015503,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 281.3595886230469,
+ 263.4467468261719,
+ 250.73536682128906,
+ 243.140380859375,
+ 247.22425842285156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.411353100091219e-05,
+ 3.656598346424289e-05,
+ 3.8585232687182724e-05,
+ 3.752345946850255e-05,
+ 3.1474613933824e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017623946769163013,
+ 0.0018276257906109095,
+ 0.0018694576574489474,
+ 0.0017436364432796836,
+ 0.0013814391568303108
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5888671875,
+ "loss_eval": 1.153226375579834,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 279.79888916015625,
+ 263.5989685058594,
+ 252.2397918701172,
+ 243.49703979492188,
+ 248.86973571777344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.528413435560651e-05,
+ 3.805026790359989e-05,
+ 4.0152310248231515e-05,
+ 3.962377377320081e-05,
+ 3.250985173508525e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017320383340120316,
+ 0.0018105976050719619,
+ 0.001847731531597674,
+ 0.0017405269900336862,
+ 0.0013762396993115544
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58984375,
+ "loss_eval": 1.1387929916381836,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 280.80633544921875,
+ 263.2684326171875,
+ 251.36338806152344,
+ 242.25201416015625,
+ 245.46954345703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.463789835222997e-05,
+ 3.694587940117344e-05,
+ 3.909278166247532e-05,
+ 3.8173999200807884e-05,
+ 3.152083809254691e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001763346022926271,
+ 0.0018382675480097532,
+ 0.0018745084526017308,
+ 0.0017674838891252875,
+ 0.0013920797500759363
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5986328125,
+ "loss_eval": 1.1115086078643799,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 278.4877624511719,
+ 261.4671630859375,
+ 247.66079711914062,
+ 240.21690368652344,
+ 244.1111602783203
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.559369361028075e-05,
+ 3.895946065313183e-05,
+ 4.048463233630173e-05,
+ 3.892362292390317e-05,
+ 3.229418143746443e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018469772767275572,
+ 0.0019197544315829873,
+ 0.001963041489943862,
+ 0.0018302135867998004,
+ 0.001429378753527999
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.16768217086792,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 280.8171691894531,
+ 263.16705322265625,
+ 251.45835876464844,
+ 243.88563537597656,
+ 246.92945861816406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.3486583561170846e-05,
+ 3.533214839990251e-05,
+ 3.789112452068366e-05,
+ 3.651758743217215e-05,
+ 3.081141403526999e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0017694556154310703,
+ 0.0018461478175595403,
+ 0.0018877091351896524,
+ 0.001781664090231061,
+ 0.0014001834206283092
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1236202716827393,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 280.0203552246094,
+ 261.3996887207031,
+ 248.5751953125,
+ 240.40728759765625,
+ 243.84178161621094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.66695094271563e-05,
+ 3.912827742169611e-05,
+ 4.0782215364743024e-05,
+ 3.97856165363919e-05,
+ 3.258495053160004e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018954386468976736,
+ 0.0019765326287597418,
+ 0.0020179273560643196,
+ 0.0018787897424772382,
+ 0.0014408754650503397
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5947265625,
+ "loss_eval": 1.142503261566162,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 278.37445068359375,
+ 260.7147521972656,
+ 247.63418579101562,
+ 239.64564514160156,
+ 241.75396728515625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.824803570751101e-05,
+ 4.062152947881259e-05,
+ 4.1070070437854156e-05,
+ 4.01996003347449e-05,
+ 3.288290827185847e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001872657099738717,
+ 0.0019627343863248825,
+ 0.002008425537496805,
+ 0.0018816223600879312,
+ 0.001456336583942175
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6064453125,
+ "loss_eval": 1.137413740158081,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 281.14813232421875,
+ 263.6340637207031,
+ 250.13082885742188,
+ 242.0965118408203,
+ 244.81060791015625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.531872062012553e-05,
+ 3.7883237382629886e-05,
+ 4.0227863792097196e-05,
+ 3.96844552597031e-05,
+ 3.296942304586992e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018434273079037666,
+ 0.0019304269226267934,
+ 0.0019746439065784216,
+ 0.0018603875068947673,
+ 0.0014465745771303773
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6025390625,
+ "loss_eval": 1.1396205425262451,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 281.31280517578125,
+ 262.5829772949219,
+ 247.9232940673828,
+ 239.8461456298828,
+ 242.20977783203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.71285859728232e-05,
+ 3.963968629250303e-05,
+ 4.135111521463841e-05,
+ 4.0518349123885855e-05,
+ 3.323471173644066e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00189371092710644,
+ 0.0019808171782642603,
+ 0.002019244944676757,
+ 0.001904282602481544,
+ 0.0014800610952079296
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1411675214767456,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 278.64208984375,
+ 260.1700744628906,
+ 246.7251434326172,
+ 239.43145751953125,
+ 240.350830078125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.6054647353012115e-05,
+ 3.858766285702586e-05,
+ 4.05439204769209e-05,
+ 4.046479079988785e-05,
+ 3.3791853638831526e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0018870895728468895,
+ 0.00198533502407372,
+ 0.0020502021070569754,
+ 0.001929490827023983,
+ 0.0014933926286175847
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.59375,
+ "loss_eval": 1.1310430765151978,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 281.7696533203125,
+ 261.5150451660156,
+ 247.67295837402344,
+ 239.7654266357422,
+ 240.27789306640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.671262675197795e-05,
+ 3.92102992918808e-05,
+ 4.1406125092180446e-05,
+ 4.029196497867815e-05,
+ 3.32514064211864e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.001880357856862247,
+ 0.001981948269531131,
+ 0.0020440546795725822,
+ 0.0019350070506334305,
+ 0.0014877711655572057
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.60546875,
+ "loss_eval": 1.1188440322875977,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 279.01318359375,
+ 259.6091003417969,
+ 244.6603240966797,
+ 235.1455535888672,
+ 237.438232421875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.0185608668252826e-05,
+ 4.309232099330984e-05,
+ 4.5118234993424267e-05,
+ 4.371534669189714e-05,
+ 3.5620210837805644e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0020104716531932354,
+ 0.002107330597937107,
+ 0.002167000202462077,
+ 0.0020260754972696304,
+ 0.0015411453787237406
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.1525764465332031,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 278.2245178222656,
+ 257.14617919921875,
+ 243.9732666015625,
+ 234.4013214111328,
+ 236.68521118164062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.85418206860777e-05,
+ 4.142443503951654e-05,
+ 4.363177140476182e-05,
+ 4.2996281990781426e-05,
+ 3.424972965149209e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0020445864647626877,
+ 0.002142493613064289,
+ 0.0022005243226885796,
+ 0.002054274780675769,
+ 0.0015541499014943838
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.59765625,
+ "loss_eval": 1.162191390991211,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 278.7825622558594,
+ 258.4292297363281,
+ 243.01690673828125,
+ 234.15765380859375,
+ 235.1446533203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.855194881907664e-05,
+ 4.1293307731393725e-05,
+ 4.296215047361329e-05,
+ 4.1900369978975505e-05,
+ 3.372962964931503e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002041360829025507,
+ 0.0021457262337207794,
+ 0.0021996963769197464,
+ 0.0020641626324504614,
+ 0.001561368815600872
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6171875,
+ "loss_eval": 1.130479335784912,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 275.3794860839844,
+ 256.83026123046875,
+ 242.16006469726562,
+ 231.49655151367188,
+ 232.30279541015625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.011294731753878e-05,
+ 4.240096313878894e-05,
+ 4.396942676976323e-05,
+ 4.347893627709709e-05,
+ 3.485888009890914e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021268154960125685,
+ 0.002230642130598426,
+ 0.0022892621345818043,
+ 0.002145433332771063,
+ 0.0016037407331168652
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6005859375,
+ "loss_eval": 1.1599653959274292,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 277.5028076171875,
+ 257.1715087890625,
+ 241.6505584716797,
+ 234.09323120117188,
+ 233.63377380371094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.876453047269024e-05,
+ 4.156330396654084e-05,
+ 4.3727923184633255e-05,
+ 4.2131912778131664e-05,
+ 3.510245369398035e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002074806485325098,
+ 0.002173666376620531,
+ 0.002245684852823615,
+ 0.0021073734387755394,
+ 0.0015908328350633383
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.144984245300293,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 276.0826416015625,
+ 255.17193603515625,
+ 239.51519775390625,
+ 231.28643798828125,
+ 230.85292053222656
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.960869798902422e-05,
+ 4.2907246097456664e-05,
+ 4.45116929768119e-05,
+ 4.3612952140392736e-05,
+ 3.500159073155373e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0021277335472404957,
+ 0.0022348251659423113,
+ 0.0022981096990406513,
+ 0.002155488822609186,
+ 0.001618923619389534
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.1534931659698486,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 275.6867370605469,
+ 254.65744018554688,
+ 238.1124267578125,
+ 229.36215209960938,
+ 227.90867614746094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.966662916354835e-05,
+ 4.33680324931629e-05,
+ 4.5270633563632146e-05,
+ 4.528860517893918e-05,
+ 3.5298704460728914e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002194908680394292,
+ 0.002305977512151003,
+ 0.0023776311427354813,
+ 0.002223761286586523,
+ 0.001651395345106721
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1494864225387573,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 274.8414306640625,
+ 253.18215942382812,
+ 238.03150939941406,
+ 228.1765594482422,
+ 229.46058654785156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.132632238906808e-05,
+ 4.4773249101126567e-05,
+ 4.6669130824739113e-05,
+ 4.591346441884525e-05,
+ 3.6523833841783926e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0022293017245829105,
+ 0.002341218525543809,
+ 0.002405093051493168,
+ 0.0022504546213895082,
+ 0.0016715668607503176
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5927734375,
+ "loss_eval": 1.1698435544967651,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 273.4884338378906,
+ 251.2228240966797,
+ 236.2550048828125,
+ 226.7325439453125,
+ 225.68386840820312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.192883352516219e-05,
+ 4.3471976823639125e-05,
+ 4.7195244405884296e-05,
+ 4.490713035920635e-05,
+ 3.646116965683177e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0022312228102236986,
+ 0.002349371323361993,
+ 0.0024164437782019377,
+ 0.002271530916914344,
+ 0.0016918154433369637
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1560128927230835,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 273.4084777832031,
+ 250.5165557861328,
+ 236.19557189941406,
+ 227.0643768310547,
+ 226.594970703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.2211744585074484e-05,
+ 4.488111881073564e-05,
+ 4.760283627547324e-05,
+ 4.589638047036715e-05,
+ 3.658623973024078e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0022313676308840513,
+ 0.002337696962058544,
+ 0.0024093035608530045,
+ 0.002264693146571517,
+ 0.0016880000475794077
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6044921875,
+ "loss_eval": 1.1498074531555176,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 273.1318664550781,
+ 249.35223388671875,
+ 234.15737915039062,
+ 223.48074340820312,
+ 223.0059356689453
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4729218643624336e-05,
+ 4.768320650327951e-05,
+ 4.822494520340115e-05,
+ 4.791786341229454e-05,
+ 3.7625926779583097e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023362624924629927,
+ 0.0024679312482476234,
+ 0.0025367215275764465,
+ 0.0023599599953740835,
+ 0.0017239096341654658
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.1377537250518799,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 270.9543762207031,
+ 249.6943817138672,
+ 234.0796356201172,
+ 223.80093383789062,
+ 222.75062561035156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4321575842332095e-05,
+ 4.7786033974261954e-05,
+ 4.9388974730391055e-05,
+ 4.749266372527927e-05,
+ 3.7502803024835885e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023458057548850775,
+ 0.0024719720240682364,
+ 0.0025427823420614004,
+ 0.0023789280094206333,
+ 0.0017488099401816726
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1472076177597046,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 270.6864318847656,
+ 249.71315002441406,
+ 233.9838409423828,
+ 223.17515563964844,
+ 222.17759704589844
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.36245281889569e-05,
+ 4.725098915514536e-05,
+ 4.936556069878861e-05,
+ 4.7286572225857526e-05,
+ 3.7781614082632586e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023510511964559555,
+ 0.0024691869039088488,
+ 0.0025394195690751076,
+ 0.0023858139757066965,
+ 0.0017493697814643383
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.5986328125,
+ "loss_eval": 1.1437795162200928,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 269.1813659667969,
+ 247.57632446289062,
+ 231.57135009765625,
+ 220.31541442871094,
+ 220.33135986328125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.363871266832575e-05,
+ 4.776224886882119e-05,
+ 4.8712514399085194e-05,
+ 4.777491994900629e-05,
+ 3.733497578650713e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0023870510049164295,
+ 0.0025214161723852158,
+ 0.0025991688016802073,
+ 0.0024342697579413652,
+ 0.0017686353530734777
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.138253927230835,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 268.92877197265625,
+ 245.84384155273438,
+ 230.63307189941406,
+ 220.8726806640625,
+ 219.60350036621094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.505042306846008e-05,
+ 4.780786548508331e-05,
+ 5.067480378784239e-05,
+ 4.878537220065482e-05,
+ 3.842872683890164e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00237255753017962,
+ 0.002493572887033224,
+ 0.0025717453099787235,
+ 0.0024270617868751287,
+ 0.0017787005053833127
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1350346803665161,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 268.9022521972656,
+ 244.85621643066406,
+ 229.2279510498047,
+ 218.72445678710938,
+ 217.325439453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.515323234954849e-05,
+ 4.8419675295008346e-05,
+ 5.0062186346622184e-05,
+ 4.777919821208343e-05,
+ 3.962183836847544e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0024519655853509903,
+ 0.002586368238553405,
+ 0.00266969739459455,
+ 0.0024983694311231375,
+ 0.001813769806176424
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.58984375,
+ "loss_eval": 1.143377661705017,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 267.7603454589844,
+ 245.58932495117188,
+ 229.04205322265625,
+ 219.0813446044922,
+ 217.887939453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.398225064505823e-05,
+ 4.6881206799298525e-05,
+ 4.986919157090597e-05,
+ 4.9659283831715584e-05,
+ 3.928233854821883e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0024525129701942205,
+ 0.0025901535991579294,
+ 0.002675000112503767,
+ 0.0025050004478543997,
+ 0.0018165758810937405
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1445319652557373,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 267.32110595703125,
+ 244.51095581054688,
+ 228.1964569091797,
+ 217.7543182373047,
+ 215.99093627929688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.567872019833885e-05,
+ 4.9028451030608267e-05,
+ 5.0534836191218346e-05,
+ 4.8578112910036e-05,
+ 3.865628605126403e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002467149868607521,
+ 0.0026051453314721584,
+ 0.0026927595026791096,
+ 0.002530105412006378,
+ 0.0018421142594888806
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.143081545829773,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 266.6060791015625,
+ 242.973388671875,
+ 227.23739624023438,
+ 216.60504150390625,
+ 213.26922607421875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.524671021499671e-05,
+ 4.8752917791716754e-05,
+ 5.0053116865456104e-05,
+ 4.897990220342763e-05,
+ 3.949753590859473e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002536450745537877,
+ 0.002682002494111657,
+ 0.002782325493171811,
+ 0.002600395353510976,
+ 0.0018774428172037005
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1569209098815918,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 265.7056579589844,
+ 243.6046142578125,
+ 226.88746643066406,
+ 217.55291748046875,
+ 213.99151611328125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.667519897338934e-05,
+ 4.9728132580639794e-05,
+ 5.27437987329904e-05,
+ 5.151727600605227e-05,
+ 4.0550570702180266e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002509700832888484,
+ 0.0026521242689341307,
+ 0.0027410376351326704,
+ 0.002574845217168331,
+ 0.001871992484666407
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.1381304264068604,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 264.63116455078125,
+ 241.50344848632812,
+ 225.20465087890625,
+ 214.67364501953125,
+ 212.77584838867188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.526918928604573e-05,
+ 5.0124705012422055e-05,
+ 5.2680206863442436e-05,
+ 5.1697836170205846e-05,
+ 3.9593822293682024e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0025687876623123884,
+ 0.0027084490284323692,
+ 0.0027945584151893854,
+ 0.0026290949899703264,
+ 0.0018978636944666505
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.149982213973999,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 264.168701171875,
+ 241.78074645996094,
+ 224.8336944580078,
+ 214.45762634277344,
+ 212.4181671142578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.745498517877422e-05,
+ 5.042303018854e-05,
+ 5.3622185077983886e-05,
+ 5.276402589515783e-05,
+ 4.0586572140455246e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026231552474200726,
+ 0.002779489615932107,
+ 0.002866284688934684,
+ 0.00268669705837965,
+ 0.0019228557357564569
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.158836007118225,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 263.89593505859375,
+ 240.3160858154297,
+ 223.6101531982422,
+ 212.4967803955078,
+ 210.63546752929688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.678544428315945e-05,
+ 5.029747626394965e-05,
+ 5.3069161367602646e-05,
+ 5.2157745813019574e-05,
+ 4.0450311644235626e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026451845187693834,
+ 0.002798875328153372,
+ 0.0028935885056853294,
+ 0.0027081011794507504,
+ 0.001933218096382916
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1447510719299316,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 262.4220275878906,
+ 239.43899536132812,
+ 223.32151794433594,
+ 212.5982666015625,
+ 209.80105590820312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.713214002549648e-05,
+ 5.087011959403753e-05,
+ 5.283053906168789e-05,
+ 5.280825644149445e-05,
+ 4.054068267578259e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002688886132091284,
+ 0.002841175301000476,
+ 0.002931408118456602,
+ 0.0027343749534338713,
+ 0.001953375292941928
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.1561517715454102,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 262.65814208984375,
+ 240.0749969482422,
+ 223.0806121826172,
+ 212.08688354492188,
+ 209.22561645507812
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8153047828236595e-05,
+ 5.145415343577042e-05,
+ 5.4130876378621906e-05,
+ 5.3563955589197576e-05,
+ 4.1630475607234985e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0026582488790154457,
+ 0.0028067713137716055,
+ 0.00290639977902174,
+ 0.0027312941383570433,
+ 0.0019485733937472105
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1465811729431152,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 262.0201721191406,
+ 239.08547973632812,
+ 222.36146545410156,
+ 211.62014770507812,
+ 208.1699676513672
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.763290053233504e-05,
+ 5.171096199774183e-05,
+ 5.4121221182867885e-05,
+ 5.251873881206848e-05,
+ 4.096185875823721e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0027110630180686712,
+ 0.002856222679838538,
+ 0.002954155672341585,
+ 0.0027671835850924253,
+ 0.001963438233360648
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6142578125,
+ "loss_eval": 1.140420913696289,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 261.04132080078125,
+ 238.44912719726562,
+ 221.8912353515625,
+ 210.62893676757812,
+ 207.68223571777344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.7598918172298e-05,
+ 5.09894234710373e-05,
+ 5.384815813158639e-05,
+ 5.2337087254272774e-05,
+ 4.065291432198137e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00274560390971601,
+ 0.0029035566840320826,
+ 0.0030046424362808466,
+ 0.0028060651384294033,
+ 0.001984622096642852
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.1556674242019653,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 260.81304931640625,
+ 237.52015686035156,
+ 221.12814331054688,
+ 210.04925537109375,
+ 206.80441284179688
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8430883907712996e-05,
+ 5.440305176307447e-05,
+ 5.596410119323991e-05,
+ 5.4586391343036667e-05,
+ 4.195213477942161e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002767855068668723,
+ 0.002925564767792821,
+ 0.003015928901731968,
+ 0.002823467366397381,
+ 0.0020000736694782972
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.599609375,
+ "loss_eval": 1.155595302581787,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 260.0649108886719,
+ 236.74310302734375,
+ 220.48731994628906,
+ 209.0772247314453,
+ 205.55821228027344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.8615416744723916e-05,
+ 5.309982589096762e-05,
+ 5.548154513235204e-05,
+ 5.3888015827396885e-05,
+ 4.1955223423428833e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028222037944942713,
+ 0.0029849831480532885,
+ 0.003080391325056553,
+ 0.0028690374456346035,
+ 0.002019484294578433
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.151352882385254,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 259.8204650878906,
+ 236.13253784179688,
+ 219.08865356445312,
+ 207.6793975830078,
+ 205.0387725830078
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.734982212539762e-05,
+ 5.1937022362835705e-05,
+ 5.472155680763535e-05,
+ 5.394391337176785e-05,
+ 4.0832986996974796e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.00282403570599854,
+ 0.0029848285485059023,
+ 0.0030928945634514093,
+ 0.002879998181015253,
+ 0.0020237534772604704
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.153958797454834,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 259.70703125,
+ 235.5811767578125,
+ 218.87939453125,
+ 207.87005615234375,
+ 204.21360778808594
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.972740134689957e-05,
+ 5.442327164928429e-05,
+ 5.538179539144039e-05,
+ 5.4411018936662003e-05,
+ 4.185390207567252e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002822998445481062,
+ 0.00298913661390543,
+ 0.0030840388499200344,
+ 0.0028817548882216215,
+ 0.0020279802847653627
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6201171875,
+ "loss_eval": 1.153503656387329,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 258.22747802734375,
+ 235.3745880126953,
+ 218.20066833496094,
+ 206.82144165039062,
+ 203.41139221191406
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.077639434603043e-05,
+ 5.5536078434670344e-05,
+ 5.664999844157137e-05,
+ 5.608425635728054e-05,
+ 4.293184611015022e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002843277994543314,
+ 0.0030130224768072367,
+ 0.0031098793260753155,
+ 0.00290561281144619,
+ 0.0020425335969775915
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.1597235202789307,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 258.78253173828125,
+ 234.73965454101562,
+ 217.91439819335938,
+ 207.1282958984375,
+ 203.4480743408203
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.941036968375556e-05,
+ 5.3143365221330896e-05,
+ 5.529402187676169e-05,
+ 5.3718889830634e-05,
+ 4.207601887173951e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028217420913279057,
+ 0.0029905554838478565,
+ 0.0030917164403945208,
+ 0.002896753139793873,
+ 0.00204362440854311
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1545956134796143,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 258.10736083984375,
+ 234.35299682617188,
+ 217.81224060058594,
+ 206.38864135742188,
+ 202.70126342773438
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.899106716038659e-05,
+ 5.2254512411309406e-05,
+ 5.481128755491227e-05,
+ 5.298088217386976e-05,
+ 4.121303936699405e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002849399344995618,
+ 0.0030259499326348305,
+ 0.0031236386857926846,
+ 0.002921136561781168,
+ 0.0020506957080215216
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.615234375,
+ "loss_eval": 1.150564193725586,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 258.50750732421875,
+ 234.4120330810547,
+ 217.49217224121094,
+ 205.7490692138672,
+ 202.62380981445312
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.976892887498252e-05,
+ 5.383255484048277e-05,
+ 5.497025267686695e-05,
+ 5.391201557358727e-05,
+ 4.2558931454550475e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028686418663710356,
+ 0.003045660676434636,
+ 0.0031442255713045597,
+ 0.002935740165412426,
+ 0.0020568587351590395
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.152902603149414,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 258.063720703125,
+ 233.87294006347656,
+ 217.34030151367188,
+ 205.4007110595703,
+ 202.4425506591797
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.047345257480629e-05,
+ 5.492625859915279e-05,
+ 5.640966628561728e-05,
+ 5.587706982623786e-05,
+ 4.286773400963284e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002875820267945528,
+ 0.003056521760299802,
+ 0.0031533341389149427,
+ 0.002944495528936386,
+ 0.0020668748766183853
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.152883529663086,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 258.1524353027344,
+ 234.54095458984375,
+ 216.9737548828125,
+ 205.64048767089844,
+ 202.26617431640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9309845053358003e-05,
+ 5.373455860535614e-05,
+ 5.6388864322798327e-05,
+ 5.448140291264281e-05,
+ 4.2345352994743735e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028876049909740686,
+ 0.0030658405739814043,
+ 0.0031632501631975174,
+ 0.002954283496364951,
+ 0.0020715948194265366
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.155066967010498,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 257.7385559082031,
+ 233.87037658691406,
+ 216.7277069091797,
+ 205.37454223632812,
+ 202.0509033203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0028131227009e-05,
+ 5.394254549173638e-05,
+ 5.677127046510577e-05,
+ 5.581674486165866e-05,
+ 4.2508807382546365e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0028917219024151564,
+ 0.0030712694860994816,
+ 0.0031723883002996445,
+ 0.0029576809611171484,
+ 0.0020730902906507254
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1531357765197754,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 257.52423095703125,
+ 233.51254272460938,
+ 216.73731994628906,
+ 205.52561950683594,
+ 202.19493103027344
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9573794967727736e-05,
+ 5.4153944802237675e-05,
+ 5.742486973758787e-05,
+ 5.468217204906978e-05,
+ 4.2126855987589806e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029005431570112705,
+ 0.0030793119221925735,
+ 0.003179334569722414,
+ 0.0029661250300705433,
+ 0.002075627911835909
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.155139684677124,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 257.5526428222656,
+ 233.24456787109375,
+ 216.63601684570312,
+ 205.40318298339844,
+ 201.8704376220703
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.996290954295546e-05,
+ 5.331254214979708e-05,
+ 5.576194598688744e-05,
+ 5.50017248315271e-05,
+ 4.1135557694360614e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002902554115280509,
+ 0.003083745948970318,
+ 0.0031855429988354445,
+ 0.0029742431361228228,
+ 0.002079661935567856
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.15346360206604,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 257.3648681640625,
+ 233.42010498046875,
+ 216.6300506591797,
+ 204.97442626953125,
+ 201.4558868408203
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.06279211549554e-05,
+ 5.411348683992401e-05,
+ 5.6813423725543544e-05,
+ 5.523188519873656e-05,
+ 4.197460293653421e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029165328014642,
+ 0.003098647342994809,
+ 0.00319958315230906,
+ 0.002985388273373246,
+ 0.002088340697810054
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6015625,
+ "loss_eval": 1.155455470085144,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 257.30535888671875,
+ 233.4147491455078,
+ 216.60826110839844,
+ 205.0714874267578,
+ 201.24066162109375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.053050699643791e-05,
+ 5.4108801123220474e-05,
+ 5.702309499611147e-05,
+ 5.574637179961428e-05,
+ 4.271106809028424e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002917014993727207,
+ 0.0030978922732174397,
+ 0.0031987964175641537,
+ 0.0029851715080440044,
+ 0.0020893686451017857
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.1536216735839844,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 257.18878173828125,
+ 232.8798370361328,
+ 216.17039489746094,
+ 204.66229248046875,
+ 201.07859802246094
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.010717359255068e-05,
+ 5.397907079895958e-05,
+ 5.614722249447368e-05,
+ 5.553716255235486e-05,
+ 4.292877929401584e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029321948532015085,
+ 0.003115386702120304,
+ 0.0032163059804588556,
+ 0.002997474977746606,
+ 0.002096242969855666
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6123046875,
+ "loss_eval": 1.1570696830749512,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 257.0701904296875,
+ 232.91481018066406,
+ 216.06378173828125,
+ 204.648681640625,
+ 201.00148010253906
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9896454584086314e-05,
+ 5.386451448430307e-05,
+ 5.5900127335917205e-05,
+ 5.5407243053196e-05,
+ 4.247200922691263e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029298008885234594,
+ 0.0031122476793825626,
+ 0.0032105366699397564,
+ 0.0029950770549476147,
+ 0.0020956522785127163
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1554739475250244,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 257.0519104003906,
+ 232.83355712890625,
+ 216.1780242919922,
+ 204.67999267578125,
+ 201.0236358642578
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.054255234426819e-05,
+ 5.421326932264492e-05,
+ 5.641246752929874e-05,
+ 5.574019087362103e-05,
+ 4.288824857212603e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029319566674530506,
+ 0.0031146046239882708,
+ 0.003213704563677311,
+ 0.002997281262651086,
+ 0.0020963428542017937
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.607421875,
+ "loss_eval": 1.1545898914337158,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 257.1473388671875,
+ 232.85020446777344,
+ 216.2519989013672,
+ 204.68023681640625,
+ 200.93080139160156
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.0549009756650776e-05,
+ 5.3789182857144624e-05,
+ 5.673874693457037e-05,
+ 5.580837023444474e-05,
+ 4.2498151742620394e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029327664524316788,
+ 0.0031159960199147463,
+ 0.003215631702914834,
+ 0.002998515497893095,
+ 0.0020966045558452606
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1546047925949097,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 257.09906005859375,
+ 232.74813842773438,
+ 216.1462860107422,
+ 204.6047821044922,
+ 200.89031982421875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.086465898784809e-05,
+ 5.3742358431918547e-05,
+ 5.673644773196429e-05,
+ 5.5752621847204864e-05,
+ 4.2624127672752365e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029341024346649647,
+ 0.003117120126262307,
+ 0.0032170764170587063,
+ 0.0029998423997312784,
+ 0.002097061835229397
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.6083984375,
+ "loss_eval": 1.1545934677124023,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 257.09326171875,
+ 232.7879638671875,
+ 216.1444091796875,
+ 204.5867919921875,
+ 200.89596557617188
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.078025787952356e-05,
+ 5.40847031516023e-05,
+ 5.667618097504601e-05,
+ 5.571893780143e-05,
+ 4.271125726518221e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.0029357182793319225,
+ 0.0031186225824058056,
+ 0.003218533471226692,
+ 0.0030010156333446503,
+ 0.002097515854984522
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.154747486114502,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 257.0869140625,
+ 232.78091430664062,
+ 216.12852478027344,
+ 204.58143615722656,
+ 200.87417602539062
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.08715384057723e-05,
+ 5.4204192565521225e-05,
+ 5.669457823387347e-05,
+ 5.573080852627754e-05,
+ 4.275495302863419e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.002935809548944235,
+ 0.003118706401437521,
+ 0.0032186671160161495,
+ 0.003001126926392317,
+ 0.0020975489169359207
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.609375,
+ "loss_eval": 1.1547397375106812,
+ "epoch": 100
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010068593546748161,
+ 0.000997236929833889,
+ 0.0009934091940522194,
+ 0.0009870644425973296,
+ 0.0009829498594626784
+ ],
+ "bp_grad_norms_F": [
+ 0.03544403985142708,
+ 0.03507080301642418,
+ 0.03477022796869278,
+ 0.03443896397948265,
+ 0.03407429903745651
+ ],
+ "gamma_dfa": 0.007406219025142491,
+ "acc_eval": 0.115234375,
+ "loss_eval": 2.383650302886963,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 802.1658935546875,
+ 3058.3173828125,
+ 4910.8408203125,
+ 6491.31494140625,
+ 7304.1533203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.526000798752648e-06,
+ 1.3625027577290894e-06,
+ 1.3747999219049234e-06,
+ 1.378283172925876e-06,
+ 1.3869492931917193e-06
+ ],
+ "bp_grad_norms_F": [
+ 0.00013306058826856315,
+ 7.476000610040501e-05,
+ 7.328101492021233e-05,
+ 7.293069211300462e-05,
+ 7.309897773666307e-05
+ ],
+ "gamma_dfa": 0.08989996102172881,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9283097982406616,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 1580.1480712890625,
+ 13320.0517578125,
+ 22793.435546875,
+ 32440.041015625,
+ 37758.640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1427439403632889e-06,
+ 3.0901847480890865e-07,
+ 3.1107475706448895e-07,
+ 3.1377521736430936e-07,
+ 3.1722706239634135e-07
+ ],
+ "bp_grad_norms_F": [
+ 6.523138290503994e-05,
+ 2.3476462956750765e-05,
+ 2.0436000340851024e-05,
+ 1.96047385543352e-05,
+ 1.9654715288197622e-05
+ ],
+ "gamma_dfa": 0.0858152944711037,
+ "acc_eval": 0.2880859375,
+ "loss_eval": 1.9359606504440308,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 2343.090576171875,
+ 32438.32421875,
+ 58119.84375,
+ 87185.09375,
+ 104586.15625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.229510513046989e-07,
+ 1.3056541092737461e-07,
+ 1.2754330214193033e-07,
+ 1.2950138739142858e-07,
+ 1.2936459370394005e-07
+ ],
+ "bp_grad_norms_F": [
+ 0.0001579313538968563,
+ 2.960947858809959e-05,
+ 1.2371615412121173e-05,
+ 8.468440682918299e-06,
+ 7.067524620651966e-06
+ ],
+ "gamma_dfa": 0.08629915304481983,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9288904666900635,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 3129.4423828125,
+ 62780.5,
+ 117608.9375,
+ 182640.09375,
+ 223504.390625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.484323762379063e-07,
+ 7.041825256237644e-08,
+ 6.729855783760286e-08,
+ 6.816127040565334e-08,
+ 6.818439857170233e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.9993034331710078e-05,
+ 2.8730657959386008e-06,
+ 2.3409718323819106e-06,
+ 2.367017486903933e-06,
+ 2.3597553990839515e-06
+ ],
+ "gamma_dfa": 0.08862219587899745,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.926429033279419,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 3942.00390625,
+ 109015.7890625,
+ 203168.390625,
+ 329067.625,
+ 404167.84375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.148021386958135e-07,
+ 4.3746137379230277e-08,
+ 4.211498705330996e-08,
+ 4.271550579915129e-08,
+ 4.2616289164243426e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.426102219033055e-05,
+ 1.769960135789006e-06,
+ 1.4341048881760798e-06,
+ 1.45279318530811e-06,
+ 1.44924592859752e-06
+ ],
+ "gamma_dfa": 0.0876110177487135,
+ "acc_eval": 0.328125,
+ "loss_eval": 1.9219281673431396,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 4737.880859375,
+ 173361.203125,
+ 331121.75,
+ 547707.8125,
+ 677363.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.4596529846785415e-07,
+ 2.929639286719521e-08,
+ 2.8080462399771022e-08,
+ 2.8515311001342525e-08,
+ 2.847208158129888e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.1308444047463126e-05,
+ 1.213497625940363e-06,
+ 9.622256129659945e-07,
+ 9.734020522955689e-07,
+ 9.715020041767275e-07
+ ],
+ "gamma_dfa": 0.08417161786928773,
+ "acc_eval": 0.2919921875,
+ "loss_eval": 1.942756175994873,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 5535.86865234375,
+ 258337.40625,
+ 501117.59375,
+ 823776.9375,
+ 1026549.875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.856409307445574e-07,
+ 2.2078769035260848e-08,
+ 2.0866384176088104e-08,
+ 2.09813144635973e-08,
+ 2.1003458527957264e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.847265775722917e-05,
+ 8.849666528476519e-07,
+ 7.187628057181428e-07,
+ 7.262269718921743e-07,
+ 7.249743703141576e-07
+ ],
+ "gamma_dfa": 0.08587896963581443,
+ "acc_eval": 0.2919921875,
+ "loss_eval": 1.9307396411895752,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 6304.064453125,
+ 367445.5625,
+ 717525.125,
+ 1200281.0,
+ 1512872.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.410295903449878e-07,
+ 1.670872862291617e-08,
+ 1.5770844186135946e-08,
+ 1.5891666649281433e-08,
+ 1.588542275499094e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.6556636182940565e-05,
+ 6.716044254062581e-07,
+ 5.55544488634041e-07,
+ 5.606318040918268e-07,
+ 5.59783927656099e-07
+ ],
+ "gamma_dfa": 0.08515941491350532,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9279191493988037,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 7086.48388671875,
+ 505478.71875,
+ 997925.8125,
+ 1708849.375,
+ 2150479.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.013988703060022e-07,
+ 1.3297809964285534e-08,
+ 1.2481795153007624e-08,
+ 1.262175253202713e-08,
+ 1.2595491760691857e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.4646101590187754e-05,
+ 5.195778953748231e-07,
+ 4.4164838186588895e-07,
+ 4.451969459751126e-07,
+ 4.4467057591646153e-07
+ ],
+ "gamma_dfa": 0.08757842611521482,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9144790172576904,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 7891.7685546875,
+ 675713.625,
+ 1320934.25,
+ 2319375.25,
+ 2933561.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.7613364750322944e-07,
+ 1.1096022767276281e-08,
+ 1.0442049891423721e-08,
+ 1.0500828651061056e-08,
+ 1.0485931234427426e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.3369051885092631e-05,
+ 4.295688142974541e-07,
+ 3.6954631355001766e-07,
+ 3.72132660686475e-07,
+ 3.718281220699282e-07
+ ],
+ "gamma_dfa": 0.08759273961186409,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.928476095199585,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 8605.7783203125,
+ 881309.9375,
+ 1719981.25,
+ 3048018.25,
+ 3848896.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.546977952988527e-07,
+ 9.457612470953336e-09,
+ 8.959561981214392e-09,
+ 8.996098976865596e-09,
+ 8.995014511015142e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2278720532776788e-05,
+ 3.6486676435742993e-07,
+ 3.18511354180373e-07,
+ 3.204301890491479e-07,
+ 3.2022188634073245e-07
+ ],
+ "gamma_dfa": 0.08920952118933201,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9193304777145386,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 9378.4287109375,
+ 1120098.75,
+ 2197340.0,
+ 3930402.25,
+ 4945595.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.424853278171213e-07,
+ 8.285154784459792e-09,
+ 7.84627474104127e-09,
+ 7.900293752527432e-09,
+ 7.906582943917329e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1596725016715936e-05,
+ 3.161075028401683e-07,
+ 2.796709850372281e-07,
+ 2.81156104620095e-07,
+ 2.810372734529665e-07
+ ],
+ "gamma_dfa": 0.09209982817992568,
+ "acc_eval": 0.287109375,
+ "loss_eval": 1.927558422088623,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 10124.396484375,
+ 1412441.875,
+ 2752346.75,
+ 5010036.0,
+ 6325289.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.236940588318248e-07,
+ 7.092171738776187e-09,
+ 6.815563668993718e-09,
+ 6.8297678623707725e-09,
+ 6.830232379684276e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0770681910798885e-05,
+ 2.7517026524037647e-07,
+ 2.434409793750092e-07,
+ 2.4456548430862313e-07,
+ 2.445065661049739e-07
+ ],
+ "gamma_dfa": 0.0919318727683276,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.9280297756195068,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 10873.9169921875,
+ 1726814.125,
+ 3365165.0,
+ 6225292.5,
+ 7941070.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.0750607632180618e-07,
+ 6.175024491739123e-09,
+ 5.938003866390318e-09,
+ 5.979505779407646e-09,
+ 5.979241990416995e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.84854341368191e-06,
+ 2.3993459308258025e-07,
+ 2.1497004354387172e-07,
+ 2.1585482556929492e-07,
+ 2.1582005160780682e-07
+ ],
+ "gamma_dfa": 0.09486197168007493,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.9190003871917725,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11534.0087890625,
+ 2084976.25,
+ 4091674.75,
+ 7667605.5,
+ 9821730.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.9337822720899567e-07,
+ 5.5730837722478554e-09,
+ 5.387873702744628e-09,
+ 5.409793057964407e-09,
+ 5.415522696949893e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.290296475228388e-06,
+ 2.1226249202754843e-07,
+ 1.9121620198347955e-07,
+ 1.9190700584204023e-07,
+ 1.9189823774468096e-07
+ ],
+ "gamma_dfa": 0.09578572702594101,
+ "acc_eval": 0.28515625,
+ "loss_eval": 1.9317920207977295,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 12231.0380859375,
+ 2494592.5,
+ 4969235.5,
+ 9387796.0,
+ 12017026.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7950755193396617e-07,
+ 4.997119606997558e-09,
+ 4.8298063326512874e-09,
+ 4.8657629037052175e-09,
+ 4.859395552614387e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.774502930464223e-06,
+ 1.8752842834146577e-07,
+ 1.7071489821773866e-07,
+ 1.7126839679804107e-07,
+ 1.7126781415299774e-07
+ ],
+ "gamma_dfa": 0.09745451644994318,
+ "acc_eval": 0.2978515625,
+ "loss_eval": 1.927154541015625,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 12895.0341796875,
+ 2937750.0,
+ 5861416.5,
+ 11095317.0,
+ 14303387.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7269709928768862e-07,
+ 4.551929055907067e-09,
+ 4.4097947515808755e-09,
+ 4.41813474694186e-09,
+ 4.416958798714177e-09
+ ],
+ "bp_grad_norms_F": [
+ 8.354931196663529e-06,
+ 1.7010511044190935e-07,
+ 1.556661288759642e-07,
+ 1.5612842219070444e-07,
+ 1.5612160098044114e-07
+ ],
+ "gamma_dfa": 0.09986255329567939,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9158110618591309,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 13624.58984375,
+ 3430302.75,
+ 6892795.0,
+ 13179784.0,
+ 16997646.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.642013387481711e-07,
+ 4.094950600830316e-09,
+ 4.012986831725129e-09,
+ 4.022568500516854e-09,
+ 4.023625876925507e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.884121259849053e-06,
+ 1.54415545239317e-07,
+ 1.407240830531009e-07,
+ 1.411058434541701e-07,
+ 1.4110656820776057e-07
+ ],
+ "gamma_dfa": 0.09882167540490627,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.9182151556015015,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 14323.6708984375,
+ 3985548.0,
+ 8076905.5,
+ 15465362.0,
+ 20015594.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.551940442823252e-07,
+ 3.79724474086629e-09,
+ 3.6876826037257615e-09,
+ 3.700401984829682e-09,
+ 3.6983835993709135e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.607863608427579e-06,
+ 1.393282218487002e-07,
+ 1.283839452526081e-07,
+ 1.2869591614617093e-07,
+ 1.2869809040694236e-07
+ ],
+ "gamma_dfa": 0.1002046266803518,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.9388974905014038,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 14955.4462890625,
+ 4541631.5,
+ 9327444.0,
+ 17893654.0,
+ 23108114.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.4713883444983367e-07,
+ 3.464018405452407e-09,
+ 3.3744134153579353e-09,
+ 3.379040602879968e-09,
+ 3.381670721225305e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.235442353703547e-06,
+ 1.2747574373861426e-07,
+ 1.1753004969250469e-07,
+ 1.1780696951291247e-07,
+ 1.1780796427274254e-07
+ ],
+ "gamma_dfa": 0.10065551439765841,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9343281984329224,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 15583.8564453125,
+ 5145675.5,
+ 10628445.0,
+ 20547210.0,
+ 26561584.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.4314694851691456e-07,
+ 3.170894435911009e-09,
+ 3.083378885548882e-09,
+ 3.0910656256821767e-09,
+ 3.0932543193529227e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.938716524018673e-06,
+ 1.1743370009753562e-07,
+ 1.0794892091325892e-07,
+ 1.0819184126376058e-07,
+ 1.0819199047773509e-07
+ ],
+ "gamma_dfa": 0.10184943513013422,
+ "acc_eval": 0.3154296875,
+ "loss_eval": 1.9154099225997925,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 16234.9208984375,
+ 5839592.5,
+ 12062968.0,
+ 23496628.0,
+ 30428386.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.379862197836701e-07,
+ 2.91886981251821e-09,
+ 2.8514124394973805e-09,
+ 2.8584146161136914e-09,
+ 2.860225389866855e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.72459282213822e-06,
+ 1.0762735769276333e-07,
+ 9.920048427147776e-08,
+ 9.94118352082296e-08,
+ 9.941232548271728e-08
+ ],
+ "gamma_dfa": 0.1024534439202398,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9225246906280518,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 16833.765625,
+ 6566770.0,
+ 13630788.0,
+ 26729236.0,
+ 34665300.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.331996628550769e-07,
+ 2.688527622751735e-09,
+ 2.6381341555747895e-09,
+ 2.6441848710589966e-09,
+ 2.644968466469777e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.5681074374879245e-06,
+ 9.902939268613409e-08,
+ 9.131563416531208e-08,
+ 9.149899682370233e-08,
+ 9.149922419737777e-08
+ ],
+ "gamma_dfa": 0.10199526121141389,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9233064651489258,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 17456.634765625,
+ 7337101.0,
+ 15401232.0,
+ 30171576.0,
+ 39161244.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2747005939672817e-07,
+ 2.4809998500074926e-09,
+ 2.4282977850731413e-09,
+ 2.432346990488554e-09,
+ 2.431272960734532e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.5036538217100315e-06,
+ 9.14754565428666e-08,
+ 8.484188640522916e-08,
+ 8.500099824004792e-08,
+ 8.500632731056612e-08
+ ],
+ "gamma_dfa": 0.10456769005395472,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9299731254577637,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 18049.205078125,
+ 8139419.5,
+ 17132936.0,
+ 33801196.0,
+ 43890588.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2153788020441425e-07,
+ 2.2737314253618024e-09,
+ 2.2332342641817604e-09,
+ 2.232388940370811e-09,
+ 2.237900753598865e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.099615802668268e-06,
+ 8.523231542767462e-08,
+ 7.842250226985925e-08,
+ 7.855853567662052e-08,
+ 7.856372263859157e-08
+ ],
+ "gamma_dfa": 0.10287670505931601,
+ "acc_eval": 0.3232421875,
+ "loss_eval": 1.923604965209961,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 18644.9375,
+ 9035569.0,
+ 19136636.0,
+ 37813052.0,
+ 49194300.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.212478508705317e-07,
+ 2.0938955014315752e-09,
+ 2.0560451119422396e-09,
+ 2.058360148993188e-09,
+ 2.061209425363586e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.810702987218974e-06,
+ 7.886949049407121e-08,
+ 7.294480752761956e-08,
+ 7.307144755941408e-08,
+ 7.307325233796291e-08
+ ],
+ "gamma_dfa": 0.10249267728067935,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.9200568199157715,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 19280.703125,
+ 9952065.0,
+ 21071430.0,
+ 41963900.0,
+ 54690120.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1414142875310063e-07,
+ 1.9668882078605066e-09,
+ 1.928355919389446e-09,
+ 1.9296169107008154e-09,
+ 1.929810311551705e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.566818344959756e-06,
+ 7.357547104902551e-08,
+ 6.781976935599232e-08,
+ 6.792832607516175e-08,
+ 6.79302942785398e-08
+ ],
+ "gamma_dfa": 0.10335587273584679,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.92685067653656,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 19887.205078125,
+ 10899353.0,
+ 23080260.0,
+ 46142640.0,
+ 60105148.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1361055385350483e-07,
+ 1.8462845696731733e-09,
+ 1.815088412904231e-09,
+ 1.8113950339682106e-09,
+ 1.8156832704008252e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.398809662437998e-06,
+ 6.89453401037099e-08,
+ 6.4051612014282e-08,
+ 6.414857267600382e-08,
+ 6.415204012455433e-08
+ ],
+ "gamma_dfa": 0.10455695656128228,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.923227310180664,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 20438.587890625,
+ 11953376.0,
+ 25259200.0,
+ 50259240.0,
+ 65732368.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.1073134231764925e-07,
+ 1.7497674420496878e-09,
+ 1.7245866956727696e-09,
+ 1.7265968654811559e-09,
+ 1.727246901062074e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.281461653794395e-06,
+ 6.489771209317041e-08,
+ 6.026093046784808e-08,
+ 6.034837696233808e-08,
+ 6.035197941400838e-08
+ ],
+ "gamma_dfa": 0.10511547370697372,
+ "acc_eval": 0.326171875,
+ "loss_eval": 1.9300421476364136,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 20991.0234375,
+ 13017462.0,
+ 27475572.0,
+ 54971628.0,
+ 71927184.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0625635837868685e-07,
+ 1.6529324575742521e-09,
+ 1.6255721213553898e-09,
+ 1.6247864165208625e-09,
+ 1.6244732226056158e-09
+ ],
+ "bp_grad_norms_F": [
+ 5.098012934467988e-06,
+ 6.077872427567854e-08,
+ 5.674080227890954e-08,
+ 5.681971870785674e-08,
+ 5.6821534144546604e-08
+ ],
+ "gamma_dfa": 0.10590779440826736,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9211739301681519,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 21617.34765625,
+ 14125094.0,
+ 29881326.0,
+ 59926964.0,
+ 78189832.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0433515029717455e-07,
+ 1.5471924852406005e-09,
+ 1.5234034034250499e-09,
+ 1.5246930384904545e-09,
+ 1.5239296491387222e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.977115622750716e-06,
+ 5.780140810429657e-08,
+ 5.362210941939338e-08,
+ 5.3694908075385683e-08,
+ 5.369727773540944e-08
+ ],
+ "gamma_dfa": 0.10481705865822732,
+ "acc_eval": 0.3212890625,
+ "loss_eval": 1.9209015369415283,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 22126.13671875,
+ 15300531.0,
+ 32579362.0,
+ 65167536.0,
+ 85083400.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0149238249823611e-07,
+ 1.4551810867402537e-09,
+ 1.4291762218121562e-09,
+ 1.432274854273885e-09,
+ 1.4318950469771607e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.9215527724300046e-06,
+ 5.434217342781267e-08,
+ 5.088266163966182e-08,
+ 5.094950239481477e-08,
+ 5.0953229191463834e-08
+ ],
+ "gamma_dfa": 0.10599250381346792,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9330241680145264,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 22662.396484375,
+ 16481282.0,
+ 35263600.0,
+ 70793304.0,
+ 92166136.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.882934648430819e-08,
+ 1.3810197430075277e-09,
+ 1.3668104426045602e-09,
+ 1.3675354182396404e-09,
+ 1.366150526038723e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.6740801735722926e-06,
+ 5.137474090588512e-08,
+ 4.796589792022132e-08,
+ 4.802501862855024e-08,
+ 4.8027377630432966e-08
+ ],
+ "gamma_dfa": 0.10529429838061333,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9205418825149536,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 23192.3125,
+ 17779744.0,
+ 38108720.0,
+ 76522688.0,
+ 99643120.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.530750588737646e-08,
+ 1.3089170858293642e-09,
+ 1.2901538726239892e-09,
+ 1.2906937740808644e-09,
+ 1.2914372904404559e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.669429472414777e-06,
+ 4.88593805414439e-08,
+ 4.5740907950175824e-08,
+ 4.579441181817856e-08,
+ 4.5798362435789386e-08
+ ],
+ "gamma_dfa": 0.1058788642694708,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9393997192382812,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 23683.251953125,
+ 18992256.0,
+ 40936536.0,
+ 82030200.0,
+ 106929248.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.458356942104729e-08,
+ 1.2407530558533608e-09,
+ 1.2231146095942336e-09,
+ 1.2233244417458877e-09,
+ 1.2247586278490985e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.483116299525136e-06,
+ 4.651869289773458e-08,
+ 4.358627236911161e-08,
+ 4.363666050721804e-08,
+ 4.3638891611408326e-08
+ ],
+ "gamma_dfa": 0.10620562738040462,
+ "acc_eval": 0.3251953125,
+ "loss_eval": 1.9221802949905396,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 24223.7265625,
+ 20421224.0,
+ 43883308.0,
+ 87849264.0,
+ 114523200.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.247051480087976e-08,
+ 1.182353992490448e-09,
+ 1.1679496259020539e-09,
+ 1.169668362166476e-09,
+ 1.1697178781133744e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.388592969917227e-06,
+ 4.4431864409943955e-08,
+ 4.157495325785021e-08,
+ 4.162143696362364e-08,
+ 4.16235543809762e-08
+ ],
+ "gamma_dfa": 0.10484841075958684,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9306102991104126,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 24732.05078125,
+ 21765008.0,
+ 46887340.0,
+ 93818392.0,
+ 122372552.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.012441637423763e-08,
+ 1.1452657711075176e-09,
+ 1.1280866241136778e-09,
+ 1.1283430856323662e-09,
+ 1.1287816237270931e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.297942268749466e-06,
+ 4.29258228962226e-08,
+ 3.9989565436826524e-08,
+ 4.003141995667647e-08,
+ 4.003394948881578e-08
+ ],
+ "gamma_dfa": 0.10523941312567331,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9360214471817017,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 25179.26953125,
+ 23094218.0,
+ 50076040.0,
+ 100053064.0,
+ 130605352.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.80345041309738e-08,
+ 1.0831726626747695e-09,
+ 1.0690409668612233e-09,
+ 1.0700328401114234e-09,
+ 1.0692404739387484e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.235343567415839e-06,
+ 4.072955306355652e-08,
+ 3.817867622046833e-08,
+ 3.8218924913735464e-08,
+ 3.822109917450689e-08
+ ],
+ "gamma_dfa": 0.10568258634884842,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.927825689315796,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 25586.23828125,
+ 24470240.0,
+ 53013036.0,
+ 105981368.0,
+ 138543408.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.783595717432036e-08,
+ 1.0381262516290235e-09,
+ 1.0265919225815878e-09,
+ 1.0273364381419015e-09,
+ 1.0274008310773297e-09
+ ],
+ "bp_grad_norms_F": [
+ 4.177269602223532e-06,
+ 3.924894187434802e-08,
+ 3.684685978555535e-08,
+ 3.688498040332888e-08,
+ 3.688741045948518e-08
+ ],
+ "gamma_dfa": 0.10561428684741259,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9321579933166504,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 26049.974609375,
+ 25812240.0,
+ 56223324.0,
+ 112200904.0,
+ 146978224.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.555475972116255e-08,
+ 9.982903392824483e-10,
+ 9.87055215340149e-10,
+ 9.8631947054173e-10,
+ 9.876408579856388e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.088252808287507e-06,
+ 3.767732792425704e-08,
+ 3.5331073178213046e-08,
+ 3.536514370239274e-08,
+ 3.5367978767908426e-08
+ ],
+ "gamma_dfa": 0.10579964506905526,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.930686116218567,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 26467.328125,
+ 27200558.0,
+ 59437036.0,
+ 118688848.0,
+ 155514592.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.46039256430231e-08,
+ 9.647596055373242e-10,
+ 9.512606258255119e-10,
+ 9.511659238015113e-10,
+ 9.522146404705722e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.015588729089359e-06,
+ 3.636354861669133e-08,
+ 3.413835614196614e-08,
+ 3.417060767674229e-08,
+ 3.417307326003538e-08
+ ],
+ "gamma_dfa": 0.10565257369307801,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9317667484283447,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 26919.3671875,
+ 28678974.0,
+ 62716300.0,
+ 125549296.0,
+ 163974208.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.232915860162393e-08,
+ 9.29719468079071e-10,
+ 9.197844152986079e-10,
+ 9.194760508535182e-10,
+ 9.196678418810222e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.951602138840826e-06,
+ 3.508949220076829e-08,
+ 3.2971975372220186e-08,
+ 3.3001178678659926e-08,
+ 3.300409190387654e-08
+ ],
+ "gamma_dfa": 0.10566475696396083,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.9284584522247314,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 27317.033203125,
+ 30078810.0,
+ 66046968.0,
+ 132107504.0,
+ 172659440.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.130339068657122e-08,
+ 9.03509489447174e-10,
+ 8.925334360476711e-10,
+ 8.917908633776506e-10,
+ 8.925368222278962e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.9174719859147444e-06,
+ 3.398368519924588e-08,
+ 3.1965900149089066e-08,
+ 3.199273024279137e-08,
+ 3.199540898890518e-08
+ ],
+ "gamma_dfa": 0.10646540904417634,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9241154193878174,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 27715.529296875,
+ 31383778.0,
+ 69356640.0,
+ 138681856.0,
+ 181338928.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.031172171740764e-08,
+ 8.735605017129444e-10,
+ 8.597746958827202e-10,
+ 8.612066615398817e-10,
+ 8.621173774869817e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.837071290035965e-06,
+ 3.286310601424702e-08,
+ 3.101721191001161e-08,
+ 3.104238288642591e-08,
+ 3.104513979224066e-08
+ ],
+ "gamma_dfa": 0.10568622383289039,
+ "acc_eval": 0.2939453125,
+ "loss_eval": 1.938409447669983,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 28149.3203125,
+ 32840858.0,
+ 72848112.0,
+ 145667440.0,
+ 190265088.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.894184506085367e-08,
+ 8.401777051858517e-10,
+ 8.299890774665641e-10,
+ 8.304122944835512e-10,
+ 8.303523979513727e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.798121497311513e-06,
+ 3.184389640864538e-08,
+ 3.004597459721481e-08,
+ 3.0069060130699654e-08,
+ 3.007191295978373e-08
+ ],
+ "gamma_dfa": 0.10558789351489395,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.9300565719604492,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 28522.55078125,
+ 34358040.0,
+ 76134080.0,
+ 152412848.0,
+ 198973936.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.830858095303483e-08,
+ 8.109956595170331e-10,
+ 8.036356025087343e-10,
+ 8.033995135825478e-10,
+ 8.031720843959533e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.7768336369481403e-06,
+ 3.096561229654071e-08,
+ 2.9296373327269976e-08,
+ 2.9317961391939207e-08,
+ 2.9320871064442144e-08
+ ],
+ "gamma_dfa": 0.10623026502435096,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.930029273033142,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 28924.912109375,
+ 35808620.0,
+ 79629336.0,
+ 159269824.0,
+ 208087264.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.754207587140627e-08,
+ 7.940589297206202e-10,
+ 7.852188899093449e-10,
+ 7.844204730211857e-10,
+ 7.861447048895798e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.695072564369184e-06,
+ 3.0030403053160626e-08,
+ 2.8479737679276695e-08,
+ 2.849986913133762e-08,
+ 2.8502654458861798e-08
+ ],
+ "gamma_dfa": 0.1059467513114214,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9284684658050537,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 29289.236328125,
+ 37312204.0,
+ 83049256.0,
+ 165977216.0,
+ 216710016.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.562951509498816e-08,
+ 7.782112176890621e-10,
+ 7.675478586044449e-10,
+ 7.666810519779688e-10,
+ 7.681388303204528e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.6269300380809e-06,
+ 2.9297559933638695e-08,
+ 2.782604902051844e-08,
+ 2.7844757610751003e-08,
+ 2.7847393724300673e-08
+ ],
+ "gamma_dfa": 0.10581977141555399,
+ "acc_eval": 0.3037109375,
+ "loss_eval": 1.9282777309417725,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 29638.296875,
+ 38754036.0,
+ 86627536.0,
+ 172893504.0,
+ 225686464.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.50456763398688e-08,
+ 7.526539391733422e-10,
+ 7.443530236628249e-10,
+ 7.439299176681402e-10,
+ 7.444729277494844e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.6355218071548734e-06,
+ 2.845291824371543e-08,
+ 2.7127033064289208e-08,
+ 2.714476821097378e-08,
+ 2.7147471826083347e-08
+ ],
+ "gamma_dfa": 0.1066790189652238,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.925389051437378,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 29950.615234375,
+ 40150236.0,
+ 90007640.0,
+ 179977856.0,
+ 235206976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.382724476201474e-08,
+ 7.370593024802474e-10,
+ 7.280710478951846e-10,
+ 7.283330605289962e-10,
+ 7.279294389483937e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5918935736845015e-06,
+ 2.7770946431360244e-08,
+ 2.6450262424759785e-08,
+ 2.6465910352158062e-08,
+ 2.6468752523101102e-08
+ ],
+ "gamma_dfa": 0.10654840966162737,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.929931402206421,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 30266.310546875,
+ 41604512.0,
+ 93401064.0,
+ 187075808.0,
+ 244203616.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.343555097349963e-08,
+ 7.144400626657443e-10,
+ 7.057154305378788e-10,
+ 7.05836944447924e-10,
+ 7.073042707084198e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.5134323752572527e-06,
+ 2.7063506990998576e-08,
+ 2.580901536930469e-08,
+ 2.582418012764265e-08,
+ 2.582707381293403e-08
+ ],
+ "gamma_dfa": 0.10640880587743595,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9268465042114258,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 30588.291015625,
+ 43073320.0,
+ 96898208.0,
+ 193783280.0,
+ 253267328.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.257300893570573e-08,
+ 6.925075513031231e-10,
+ 6.871804236752155e-10,
+ 6.855109813130866e-10,
+ 6.860176871015256e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4990612221008632e-06,
+ 2.652852693074692e-08,
+ 2.5297810068991566e-08,
+ 2.5311907236869047e-08,
+ 2.531497678148753e-08
+ ],
+ "gamma_dfa": 0.10629434209840838,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.932523488998413,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 30898.34765625,
+ 44412940.0,
+ 100019336.0,
+ 199966816.0,
+ 261667760.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.140450719589353e-08,
+ 6.861456958162648e-10,
+ 6.789319106914604e-10,
+ 6.784582895491553e-10,
+ 6.785109696316738e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.470987167020212e-06,
+ 2.5969489669819268e-08,
+ 2.478421379237261e-08,
+ 2.479695204726795e-08,
+ 2.4800137055080995e-08
+ ],
+ "gamma_dfa": 0.1070190458704019,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.932159662246704,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 31188.375,
+ 45820600.0,
+ 103429992.0,
+ 206547120.0,
+ 270181600.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.079076169702603e-08,
+ 6.688025688816879e-10,
+ 6.633480986728557e-10,
+ 6.629659043966285e-10,
+ 6.630911930649575e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.4183981370006222e-06,
+ 2.540217280966317e-08,
+ 2.4278467236626966e-08,
+ 2.4290830680229192e-08,
+ 2.429379897250783e-08
+ ],
+ "gamma_dfa": 0.10550818023330066,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9357173442840576,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 31478.2109375,
+ 47178892.0,
+ 107044784.0,
+ 213196560.0,
+ 278895232.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.016877390242371e-08,
+ 6.609012226377331e-10,
+ 6.520708972779232e-10,
+ 6.519841333485488e-10,
+ 6.530669338644657e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.405668167033582e-06,
+ 2.4965938649756936e-08,
+ 2.3893584000234114e-08,
+ 2.390493669679472e-08,
+ 2.390810749375305e-08
+ ],
+ "gamma_dfa": 0.10673638083972037,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.9359304904937744,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 31753.5859375,
+ 48563264.0,
+ 110454832.0,
+ 219550528.0,
+ 287320896.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.007908919831607e-08,
+ 6.483197867446222e-10,
+ 6.408613084651904e-10,
+ 6.410805775125539e-10,
+ 6.409432429244077e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.369002797626308e-06,
+ 2.447991498399915e-08,
+ 2.3494733270013057e-08,
+ 2.350535943662635e-08,
+ 2.350850003551841e-08
+ ],
+ "gamma_dfa": 0.10726616549072787,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9281866550445557,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 32002.76953125,
+ 49866268.0,
+ 113724368.0,
+ 225759120.0,
+ 295231328.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.914736161434121e-08,
+ 6.332004365283694e-10,
+ 6.232644400583354e-10,
+ 6.233273341926804e-10,
+ 6.240686856173738e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.3845158213807736e-06,
+ 2.415495181651295e-08,
+ 2.3192731291032942e-08,
+ 2.3202973764568924e-08,
+ 2.3206132127029377e-08
+ ],
+ "gamma_dfa": 0.10715722179156728,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9343407154083252,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 32277.291015625,
+ 51206064.0,
+ 116617608.0,
+ 231756352.0,
+ 303064864.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.926612172719615e-08,
+ 6.240719607752965e-10,
+ 6.182420131395361e-10,
+ 6.17405682135086e-10,
+ 6.178215161689593e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.317889877507696e-06,
+ 2.3704412654979024e-08,
+ 2.2745311412109004e-08,
+ 2.2754765183208292e-08,
+ 2.2757769002623718e-08
+ ],
+ "gamma_dfa": 0.10657632350921631,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9305057525634766,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 32521.890625,
+ 52538716.0,
+ 119605040.0,
+ 237773904.0,
+ 310920672.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.805787933217289e-08,
+ 6.190028489783117e-10,
+ 6.10553496649402e-10,
+ 6.107545580391616e-10,
+ 6.10922701316241e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2823897981870687e-06,
+ 2.3313557306892108e-08,
+ 2.2385792775025948e-08,
+ 2.239448981811165e-08,
+ 2.239757002087117e-08
+ ],
+ "gamma_dfa": 0.10671919275773689,
+ "acc_eval": 0.302734375,
+ "loss_eval": 1.9269468784332275,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 32717.80859375,
+ 53698120.0,
+ 122676120.0,
+ 243745136.0,
+ 318772768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.75130422678194e-08,
+ 6.033377686343044e-10,
+ 5.948920800413759e-10,
+ 5.949861159315617e-10,
+ 5.951407144877408e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2588357044005534e-06,
+ 2.2926835541170476e-08,
+ 2.205681148836902e-08,
+ 2.206508220581327e-08,
+ 2.2068283200837868e-08
+ ],
+ "gamma_dfa": 0.10711025857017376,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9273767471313477,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 32950.74609375,
+ 54885932.0,
+ 125689616.0,
+ 249312240.0,
+ 326217856.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.673791119737871e-08,
+ 5.923626589243725e-10,
+ 5.863842189590684e-10,
+ 5.866296337586618e-10,
+ 5.870876007563197e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2307948458765168e-06,
+ 2.2597017590442192e-08,
+ 2.1738133071380616e-08,
+ 2.1745805156569986e-08,
+ 2.1749071876797643e-08
+ ],
+ "gamma_dfa": 0.10673619594308548,
+ "acc_eval": 0.31640625,
+ "loss_eval": 1.9271256923675537,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 33148.1328125,
+ 55976648.0,
+ 128534072.0,
+ 254655232.0,
+ 333162784.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.663199769718631e-08,
+ 5.852057172184288e-10,
+ 5.787633705622852e-10,
+ 5.792484825128952e-10,
+ 5.793157620281875e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.197097157681128e-06,
+ 2.2320827852695402e-08,
+ 2.1484760637235922e-08,
+ 2.149219824332249e-08,
+ 2.1495376145708178e-08
+ ],
+ "gamma_dfa": 0.10659754439257085,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9244905710220337,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 33369.18359375,
+ 57164716.0,
+ 131352720.0,
+ 259876736.0,
+ 339964160.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.583201184184873e-08,
+ 5.737598174349046e-10,
+ 5.67273561458137e-10,
+ 5.66656666034504e-10,
+ 5.665773961105458e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.2037539767770795e-06,
+ 2.2096731555620863e-08,
+ 2.127841902677119e-08,
+ 2.1285371687440602e-08,
+ 2.1288625973170383e-08
+ ],
+ "gamma_dfa": 0.10679806087864563,
+ "acc_eval": 0.3154296875,
+ "loss_eval": 1.9308257102966309,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 33540.88671875,
+ 58301528.0,
+ 133722112.0,
+ 264798368.0,
+ 346396256.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.606099844930213e-08,
+ 5.686319748399171e-10,
+ 5.629098853709991e-10,
+ 5.619399945366865e-10,
+ 5.626447086015673e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.1530219075648347e-06,
+ 2.1766210167584177e-08,
+ 2.0992644067518995e-08,
+ 2.0999330274662498e-08,
+ 2.1002534822400776e-08
+ ],
+ "gamma_dfa": 0.10647483140928671,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.925765037536621,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 33728.984375,
+ 59420104.0,
+ 136277376.0,
+ 270265568.0,
+ 353408672.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.57889458466343e-08,
+ 5.627094901150542e-10,
+ 5.575621631059846e-10,
+ 5.567652450189087e-10,
+ 5.571588745922895e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.138873807984055e-06,
+ 2.1483266721133987e-08,
+ 2.0736742101234995e-08,
+ 2.0742897177683517e-08,
+ 2.0746110607205992e-08
+ ],
+ "gamma_dfa": 0.10677585859230021,
+ "acc_eval": 0.3154296875,
+ "loss_eval": 1.9289934635162354,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 33919.515625,
+ 60492864.0,
+ 138846208.0,
+ 275456896.0,
+ 359821632.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.451340084367985e-08,
+ 5.607461717183071e-10,
+ 5.556192728128906e-10,
+ 5.553609239150603e-10,
+ 5.557289628477236e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.125772991552367e-06,
+ 2.1269308092541905e-08,
+ 2.0518179155715188e-08,
+ 2.052397540808215e-08,
+ 2.0527094690692138e-08
+ ],
+ "gamma_dfa": 0.10671760967670707,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9296305179595947,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 34098.5,
+ 61508056.0,
+ 141295472.0,
+ 280204000.0,
+ 365860768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.474934366451635e-08,
+ 5.519530943409734e-10,
+ 5.459506735583375e-10,
+ 5.446967876743258e-10,
+ 5.452004958605983e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.1189638320938684e-06,
+ 2.1083655710185667e-08,
+ 2.0349753881987453e-08,
+ 2.0355370722313637e-08,
+ 2.0358520202989894e-08
+ ],
+ "gamma_dfa": 0.10652847628807649,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9298161268234253,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 34267.96875,
+ 62529272.0,
+ 143621744.0,
+ 284772064.0,
+ 371754336.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.392743046035321e-08,
+ 5.466314068058864e-10,
+ 5.412825743178473e-10,
+ 5.413390846698007e-10,
+ 5.416116999334974e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0790877190156607e-06,
+ 2.0871810946232472e-08,
+ 2.0159163227617682e-08,
+ 2.0164401703937074e-08,
+ 2.0167590264463797e-08
+ ],
+ "gamma_dfa": 0.10652959482831648,
+ "acc_eval": 0.298828125,
+ "loss_eval": 1.926388144493103,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 34420.42578125,
+ 63473892.0,
+ 145906128.0,
+ 289224256.0,
+ 377581856.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.427427479138714e-08,
+ 5.377295275721394e-10,
+ 5.307561612433176e-10,
+ 5.305922923248829e-10,
+ 5.308011252758149e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.096157115578535e-06,
+ 2.067219107004803e-08,
+ 2.0005694878477698e-08,
+ 2.001087118230771e-08,
+ 2.001400645212925e-08
+ ],
+ "gamma_dfa": 0.10710431921324925,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.9277684688568115,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 34573.87890625,
+ 64328388.0,
+ 148036320.0,
+ 293257856.0,
+ 382751104.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.389419127117435e-08,
+ 5.373848033229933e-10,
+ 5.314943485323909e-10,
+ 5.314927387090052e-10,
+ 5.31539035009132e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.072862682529376e-06,
+ 2.049388392322271e-08,
+ 1.98319511923728e-08,
+ 1.9836669196138246e-08,
+ 1.9840014076066836e-08
+ ],
+ "gamma_dfa": 0.10700461147644091,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9307092428207397,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 34690.74609375,
+ 65142160.0,
+ 150006800.0,
+ 297046144.0,
+ 387685792.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.348407310952098e-08,
+ 5.322000062868426e-10,
+ 5.271332259582096e-10,
+ 5.264539360005926e-10,
+ 5.263872671079639e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.055365141335642e-06,
+ 2.0346906381973895e-08,
+ 1.9688986441224188e-08,
+ 1.969357477094036e-08,
+ 1.969680063496071e-08
+ ],
+ "gamma_dfa": 0.10688555391971022,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9277830123901367,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 34818.79296875,
+ 65891160.0,
+ 151813680.0,
+ 300644832.0,
+ 392342848.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.302482802311715e-08,
+ 5.310150652526602e-10,
+ 5.265936020570905e-10,
+ 5.26124921407245e-10,
+ 5.26482579754628e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.027237426067586e-06,
+ 2.0201985861945104e-08,
+ 1.9550000729395833e-08,
+ 1.955433681644081e-08,
+ 1.9557578667672715e-08
+ ],
+ "gamma_dfa": 0.10652808679151349,
+ "acc_eval": 0.2998046875,
+ "loss_eval": 1.9273805618286133,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 34951.515625,
+ 66590476.0,
+ 153730848.0,
+ 304118720.0,
+ 396925408.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.403244157127119e-08,
+ 5.26472032635894e-10,
+ 5.205495479110311e-10,
+ 5.201504782448296e-10,
+ 5.20502474454787e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0631524623458972e-06,
+ 2.0121730059941e-08,
+ 1.9494045488954725e-08,
+ 1.9498189729461046e-08,
+ 1.950143335704979e-08
+ ],
+ "gamma_dfa": 0.1070192107144976,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.934456467628479,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 35056.31640625,
+ 67311408.0,
+ 155368816.0,
+ 307494752.0,
+ 401124448.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.303329769252741e-08,
+ 5.209726539057158e-10,
+ 5.160313842900166e-10,
+ 5.156270965755994e-10,
+ 5.161130411934778e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0127189347695094e-06,
+ 1.993531562050066e-08,
+ 1.93110221147208e-08,
+ 1.9314887467203334e-08,
+ 1.9318180832783582e-08
+ ],
+ "gamma_dfa": 0.10658633662387729,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9260145425796509,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 35158.68359375,
+ 67933192.0,
+ 157091536.0,
+ 310654048.0,
+ 405321344.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.339039515523837e-08,
+ 5.170803230036825e-10,
+ 5.107546607874269e-10,
+ 5.104218714357955e-10,
+ 5.108970468903351e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.0164017061906634e-06,
+ 1.9819051289005074e-08,
+ 1.921591774589615e-08,
+ 1.921967651696832e-08,
+ 1.9223040936822144e-08
+ ],
+ "gamma_dfa": 0.10703902837121859,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.927987813949585,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 35270.68359375,
+ 68510120.0,
+ 158496816.0,
+ 313641408.0,
+ 409130592.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.246813200050383e-08,
+ 5.133981018090594e-10,
+ 5.070178166199923e-10,
+ 5.070903141835004e-10,
+ 5.071925657240683e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.004009158757981e-06,
+ 1.970923690919335e-08,
+ 1.910464320076244e-08,
+ 1.9108172821802327e-08,
+ 1.9111526583515115e-08
+ ],
+ "gamma_dfa": 0.1070477613247931,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.9260926246643066,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 35364.3125,
+ 69078320.0,
+ 159830400.0,
+ 316294976.0,
+ 412518496.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.217867820623724e-08,
+ 5.12098419225282e-10,
+ 5.052269158589695e-10,
+ 5.058938268298618e-10,
+ 5.053178431246863e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9913805974501884e-06,
+ 1.9599063705300068e-08,
+ 1.900307999846973e-08,
+ 1.9006522578024487e-08,
+ 1.9009846141671005e-08
+ ],
+ "gamma_dfa": 0.10688473540358245,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.926918864250183,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 35441.375,
+ 69602704.0,
+ 161117808.0,
+ 318818240.0,
+ 415766208.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.249013040360296e-08,
+ 5.102671063461628e-10,
+ 5.039960671027188e-10,
+ 5.038492956188634e-10,
+ 5.034740402365401e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9863124382245587e-06,
+ 1.9512324200832154e-08,
+ 1.8926254341522508e-08,
+ 1.8929529943534362e-08,
+ 1.8932860612608238e-08
+ ],
+ "gamma_dfa": 0.10701000291737728,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9271972179412842,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 35514.78125,
+ 70081152.0,
+ 162190624.0,
+ 321009312.0,
+ 418699392.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.149930698029493e-08,
+ 5.099357047733122e-10,
+ 5.055039165036135e-10,
+ 5.048302331722709e-10,
+ 5.054044960317583e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.969128445329261e-06,
+ 1.9427163877594467e-08,
+ 1.883810085701043e-08,
+ 1.884115441441736e-08,
+ 1.884450639977331e-08
+ ],
+ "gamma_dfa": 0.10680000087450026,
+ "acc_eval": 0.3017578125,
+ "loss_eval": 1.9285144805908203,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 35582.9765625,
+ 70499392.0,
+ 163284976.0,
+ 323095264.0,
+ 421363552.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.187113399391819e-08,
+ 5.05410657769545e-10,
+ 4.990756696798826e-10,
+ 4.979930912085706e-10,
+ 4.985904467069702e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9715449727518717e-06,
+ 1.9354965630213883e-08,
+ 1.877567434860339e-08,
+ 1.8778711918798763e-08,
+ 1.8782076338652587e-08
+ ],
+ "gamma_dfa": 0.10694103027344681,
+ "acc_eval": 0.310546875,
+ "loss_eval": 1.92802095413208,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 35639.56640625,
+ 70899536.0,
+ 164253712.0,
+ 324923200.0,
+ 423745824.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.238182237439105e-08,
+ 5.018311322046998e-10,
+ 4.970572842211141e-10,
+ 4.953790155859394e-10,
+ 4.961450694729308e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.971921048811055e-06,
+ 1.9296171771543413e-08,
+ 1.872837351868384e-08,
+ 1.8731368456315067e-08,
+ 1.873476662694884e-08
+ ],
+ "gamma_dfa": 0.10704115682892734,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.926428198814392,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 35689.78515625,
+ 71256024.0,
+ 165127008.0,
+ 326618208.0,
+ 425949792.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.238117578050151e-08,
+ 4.972192657604069e-10,
+ 4.926972718699574e-10,
+ 4.921834606541609e-10,
+ 4.923969565417963e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9655700473085744e-06,
+ 1.9235280035445612e-08,
+ 1.8671270751724478e-08,
+ 1.8674217727721043e-08,
+ 1.8677596358429582e-08
+ ],
+ "gamma_dfa": 0.10696214074414456,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.924986481666565,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 35742.58984375,
+ 71595640.0,
+ 165912336.0,
+ 328130016.0,
+ 427838752.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.213700487478491e-08,
+ 4.983659041002397e-10,
+ 4.936055453264032e-10,
+ 4.941617670617404e-10,
+ 4.939196274200697e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.951217993540922e-06,
+ 1.919361736213432e-08,
+ 1.863161003257119e-08,
+ 1.8634468190725784e-08,
+ 1.8637845045077484e-08
+ ],
+ "gamma_dfa": 0.10690056857129093,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9250625371932983,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 35784.6640625,
+ 71885704.0,
+ 166691376.0,
+ 329546848.0,
+ 429668704.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.175997668833588e-08,
+ 4.971995593017198e-10,
+ 4.919967211414189e-10,
+ 4.91977791838849e-10,
+ 4.926699603835516e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9550594717875356e-06,
+ 1.9144454910247077e-08,
+ 1.8583381944381472e-08,
+ 1.858614595562358e-08,
+ 1.8589524586332118e-08
+ ],
+ "gamma_dfa": 0.10689649073174223,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.926330327987671,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 35822.33984375,
+ 72122744.0,
+ 167344016.0,
+ 330816224.0,
+ 431313312.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.139300978702522e-08,
+ 4.980582613001161e-10,
+ 4.935602482269985e-10,
+ 4.934832542602408e-10,
+ 4.934415098745148e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9577784061984858e-06,
+ 1.9112555094125128e-08,
+ 1.8551357783280764e-08,
+ 1.8553992120473595e-08,
+ 1.8557404501962083e-08
+ ],
+ "gamma_dfa": 0.10689723303948995,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.9307332038879395,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 35859.390625,
+ 72358304.0,
+ 167947920.0,
+ 331984992.0,
+ 432823232.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.135296359843778e-08,
+ 4.947317000514317e-10,
+ 4.903184525062443e-10,
+ 4.896648087004962e-10,
+ 4.905649775288623e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9511427328543505e-06,
+ 1.906450464161935e-08,
+ 1.8504644927475056e-08,
+ 1.8507259724742653e-08,
+ 1.8510663224446944e-08
+ ],
+ "gamma_dfa": 0.10684622721601045,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9271869659423828,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 35888.20703125,
+ 72553136.0,
+ 168401376.0,
+ 332911328.0,
+ 434057600.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.163116239576993e-08,
+ 4.935953312745767e-10,
+ 4.904400219274407e-10,
+ 4.890517990574494e-10,
+ 4.891231308867816e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9438597266562283e-06,
+ 1.902795432329185e-08,
+ 1.8475304841558682e-08,
+ 1.8477877006262133e-08,
+ 1.848129471682114e-08
+ ],
+ "gamma_dfa": 0.10682923735294025,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9263050556182861,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 35914.35546875,
+ 72735848.0,
+ 168823680.0,
+ 333752736.0,
+ 435137376.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.153870657499283e-08,
+ 4.920966967247864e-10,
+ 4.894144534084433e-10,
+ 4.876969939004994e-10,
+ 4.884483928435657e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9408777209027903e-06,
+ 1.8999060102942167e-08,
+ 1.8450597494279464e-08,
+ 1.8453114591920894e-08,
+ 1.84565323024799e-08
+ ],
+ "gamma_dfa": 0.10694600266288035,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9252078533172607,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 35936.5546875,
+ 72887360.0,
+ 169178624.0,
+ 334467840.0,
+ 436061952.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.168602340039797e-08,
+ 4.908231043820876e-10,
+ 4.854965318656923e-10,
+ 4.846267276370497e-10,
+ 4.847209300606892e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.945510459539946e-06,
+ 1.8982424521141184e-08,
+ 1.8438125692910035e-08,
+ 1.844062857969675e-08,
+ 1.8444072935608347e-08
+ ],
+ "gamma_dfa": 0.10697454003093299,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.9264906644821167,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 35955.3671875,
+ 73005808.0,
+ 169498240.0,
+ 335085920.0,
+ 436862656.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.152810527737529e-08,
+ 4.922047214250824e-10,
+ 4.872572900715966e-10,
+ 4.873856318532432e-10,
+ 4.87353157829773e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9327068205020623e-06,
+ 1.8955052638602865e-08,
+ 1.8409036073308016e-08,
+ 1.8411496327530585e-08,
+ 1.841491403808959e-08
+ ],
+ "gamma_dfa": 0.10689280136284651,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9255037307739258,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 35973.34375,
+ 73111368.0,
+ 169770208.0,
+ 335584768.0,
+ 437507744.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.107820382794671e-08,
+ 4.92519802719471e-10,
+ 4.876242187812352e-10,
+ 4.871342773604681e-10,
+ 4.873002001914983e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9368579816946294e-06,
+ 1.8944499302619988e-08,
+ 1.839602603581625e-08,
+ 1.8398441881117833e-08,
+ 1.8401848933535803e-08
+ ],
+ "gamma_dfa": 0.10685028225998394,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9265596866607666,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 35985.046875,
+ 73193336.0,
+ 169984976.0,
+ 335981920.0,
+ 438037376.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.100844984757714e-08,
+ 4.92902163529152e-10,
+ 4.862484304091197e-10,
+ 4.871591463562197e-10,
+ 4.871424374996991e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.930574055426405e-06,
+ 1.8926412437281215e-08,
+ 1.8379486377284593e-08,
+ 1.8381888011731462e-08,
+ 1.8385312827717826e-08
+ ],
+ "gamma_dfa": 0.106783474504482,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9269328117370605,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 35994.07421875,
+ 73256784.0,
+ 170148048.0,
+ 336300032.0,
+ 438460544.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.113810968599864e-08,
+ 4.918689899824358e-10,
+ 4.860293834063611e-10,
+ 4.857191315821296e-10,
+ 4.859731506101639e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9313273444131482e-06,
+ 1.8918141719836967e-08,
+ 1.8372302790226058e-08,
+ 1.837469731924557e-08,
+ 1.8378123911588773e-08
+ ],
+ "gamma_dfa": 0.10685011067107553,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.9262909889221191,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 36002.55078125,
+ 73308792.0,
+ 170289472.0,
+ 336572864.0,
+ 438812896.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.121508988599089e-08,
+ 4.917221074762779e-10,
+ 4.853899504553283e-10,
+ 4.847242052186118e-10,
+ 4.849394219519354e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.933722271336592e-06,
+ 1.8911242349872737e-08,
+ 1.8366764109600808e-08,
+ 1.836915508590664e-08,
+ 1.8372583454606684e-08
+ ],
+ "gamma_dfa": 0.10693995938345324,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9261877536773682,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 36008.01953125,
+ 73348264.0,
+ 170386624.0,
+ 336761248.0,
+ 439049248.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.123732987362018e-08,
+ 4.916126949972011e-10,
+ 4.860848945575924e-10,
+ 4.87389184566922e-10,
+ 4.868180303319036e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9306668238859857e-06,
+ 1.8901717524499873e-08,
+ 1.835805107930355e-08,
+ 1.8360427844754668e-08,
+ 1.836385976616839e-08
+ ],
+ "gamma_dfa": 0.10689331469620811,
+ "acc_eval": 0.30859375,
+ "loss_eval": 1.9260027408599854,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 36011.9296875,
+ 73372720.0,
+ 170447072.0,
+ 336878464.0,
+ 439192800.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.115104156378948e-08,
+ 4.911633877391353e-10,
+ 4.862875657707377e-10,
+ 4.868677128122556e-10,
+ 4.867456437906981e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9297382297954755e-06,
+ 1.889710254943111e-08,
+ 1.8353631503487122e-08,
+ 1.835600293986772e-08,
+ 1.8359434861281443e-08
+ ],
+ "gamma_dfa": 0.1068731502891751,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9261021614074707,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 36014.109375,
+ 73385416.0,
+ 170481184.0,
+ 336945120.0,
+ 439280128.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.12362214269524e-08,
+ 4.916780316222003e-10,
+ 4.858832225451692e-10,
+ 4.867402036978774e-10,
+ 4.862423241824843e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.930293021563557e-06,
+ 1.8895260467388653e-08,
+ 1.8352444897118403e-08,
+ 1.835481810985584e-08,
+ 1.8358248254912723e-08
+ ],
+ "gamma_dfa": 0.10688256371940952,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.926184892654419,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 36015.9375,
+ 73396752.0,
+ 170510784.0,
+ 337001056.0,
+ 439352832.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.120947659837839e-08,
+ 4.916590468084792e-10,
+ 4.857179658479538e-10,
+ 4.86417739420375e-10,
+ 4.85919415815772e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.930209348050994e-06,
+ 1.889360845552801e-08,
+ 1.835070939648631e-08,
+ 1.8353080832866908e-08,
+ 1.835651275428063e-08
+ ],
+ "gamma_dfa": 0.10688149025372695,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9262256622314453,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 36016.734375,
+ 73401888.0,
+ 170523312.0,
+ 337026592.0,
+ 439384864.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.119820028516187e-08,
+ 4.917350415745148e-10,
+ 4.857160784688119e-10,
+ 4.860361002556601e-10,
+ 4.855379431845108e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9303794235602254e-06,
+ 1.8893027586841526e-08,
+ 1.835026353091962e-08,
+ 1.835263319094338e-08,
+ 1.83560651123571e-08
+ ],
+ "gamma_dfa": 0.10688879482768243,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.926223874092102,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 36016.7734375,
+ 73401992.0,
+ 170523904.0,
+ 337027392.0,
+ 439386048.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.120198747794348e-08,
+ 4.91758134213427e-10,
+ 4.857037549932386e-10,
+ 4.860785107752008e-10,
+ 4.855802981929003e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9303721476026112e-06,
+ 1.8893056008550957e-08,
+ 1.8350315045267962e-08,
+ 1.8352682928934883e-08,
+ 1.8356114850348604e-08
+ ],
+ "gamma_dfa": 0.1068887785077095,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.926220417022705,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file