summaryrefslogtreecommitdiff
path: root/results/h2_no_residual_full_s123/snapshot_evolution_s123.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/h2_no_residual_full_s123/snapshot_evolution_s123.json')
-rw-r--r--results/h2_no_residual_full_s123/snapshot_evolution_s123.json2749
1 files changed, 2749 insertions, 0 deletions
diff --git a/results/h2_no_residual_full_s123/snapshot_evolution_s123.json b/results/h2_no_residual_full_s123/snapshot_evolution_s123.json
new file mode 100644
index 0000000..cbad0e4
--- /dev/null
+++ b/results/h2_no_residual_full_s123/snapshot_evolution_s123.json
@@ -0,0 +1,2749 @@
+{
+ "config": {
+ "output_dir": "results/h2_no_residual_full_s123",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 123,
+ "depth": 4,
+ "d_hidden": 256,
+ "log_every": 1,
+ "no_residual_add": true,
+ "w2_std": 0.5,
+ "random_targets": false,
+ "skip_bp": true
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "bp_log": null,
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.690464973449707,
+ 42.59831619262695,
+ 44.3453369140625,
+ 42.22452926635742,
+ 42.9206428527832
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001107031712308526,
+ 0.00020295626018196344,
+ 0.00014012052270118147,
+ 0.00011155186803080142,
+ 9.737444634083658e-05
+ ],
+ "bp_grad_norms_F": [
+ 0.03999145328998566,
+ 0.006603884976357222,
+ 0.004542526323348284,
+ 0.0036035836674273014,
+ 0.003130683209747076
+ ],
+ "gamma_dfa": 0.014937716419808567,
+ "acc_eval": 0.1025390625,
+ "loss_eval": 2.4329679012298584,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 1439.9598388671875,
+ 6195.9453125,
+ 9461.9462890625,
+ 7636.810546875,
+ 4633.29296875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.333700745628448e-07,
+ 6.382089736689522e-07,
+ 6.313390485956916e-07,
+ 6.29996520729037e-07,
+ 6.307979560915555e-07
+ ],
+ "bp_grad_norms_F": [
+ 5.84688204980921e-05,
+ 4.571088356897235e-05,
+ 4.522907693171874e-05,
+ 4.505911419983022e-05,
+ 4.481491123442538e-05
+ ],
+ "gamma_dfa": 0.029066061251796782,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 2.4298276901245117,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 3191.640380859375,
+ 44469.08984375,
+ 64403.30859375,
+ 40298.74609375,
+ 20860.859375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.3425519657394034e-07,
+ 1.0419660867455605e-07,
+ 1.0399938332739112e-07,
+ 1.0393744531711491e-07,
+ 1.040296524479345e-07
+ ],
+ "bp_grad_norms_F": [
+ 2.9355647711781785e-05,
+ 1.3215229955676477e-05,
+ 1.2938599866174627e-05,
+ 1.2853749467467424e-05,
+ 1.2806296581402421e-05
+ ],
+ "gamma_dfa": 0.026177803985774517,
+ "acc_eval": 0.0849609375,
+ "loss_eval": 2.450077533721924,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 5072.8369140625,
+ 136290.921875,
+ 174667.984375,
+ 99872.765625,
+ 48604.14453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2239583213613514e-07,
+ 3.922263758227018e-08,
+ 3.8977361782599473e-08,
+ 3.902984602177639e-08,
+ 3.902538381339582e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.021085128944833e-05,
+ 5.516366400115658e-06,
+ 5.3598869271809235e-06,
+ 5.317293016560143e-06,
+ 5.302062618284253e-06
+ ],
+ "gamma_dfa": 0.025070607429370284,
+ "acc_eval": 0.1298828125,
+ "loss_eval": 2.470280170440674,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 6908.81494140625,
+ 300140.625,
+ 335781.1875,
+ 194737.578125,
+ 91168.953125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.2960639247176e-08,
+ 2.020572686944888e-08,
+ 2.0147625789945778e-08,
+ 2.017927869246705e-08,
+ 2.0169572678696568e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.5067237654875498e-05,
+ 3.154973455821164e-06,
+ 2.890229097829433e-06,
+ 2.8368178845994407e-06,
+ 2.826985564752249e-06
+ ],
+ "gamma_dfa": 0.0266711818985641,
+ "acc_eval": 0.125,
+ "loss_eval": 2.5050950050354004,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 8695.44140625,
+ 543316.5625,
+ 567899.375,
+ 335584.25,
+ 145692.765625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.380926009796895e-08,
+ 1.238302882455855e-08,
+ 1.2337157073716298e-08,
+ 1.2354545830817187e-08,
+ 1.2352338707444233e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.2898051863885485e-05,
+ 1.8491266473574797e-06,
+ 1.7919940091815079e-06,
+ 1.7602286561668734e-06,
+ 1.7506840777059551e-06
+ ],
+ "gamma_dfa": 0.022991596721112728,
+ "acc_eval": 0.115234375,
+ "loss_eval": 2.5430097579956055,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 10453.0947265625,
+ 880568.0625,
+ 851994.125,
+ 518617.03125,
+ 211486.65625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.6784926982800243e-08,
+ 8.739263535062491e-09,
+ 8.721374733511311e-09,
+ 8.72691785502866e-09,
+ 8.722811806194386e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2415013770805672e-05,
+ 1.2789794254786102e-06,
+ 1.2444495496310992e-06,
+ 1.2192489293738618e-06,
+ 1.2128068647143664e-06
+ ],
+ "gamma_dfa": 0.01671441923826933,
+ "acc_eval": 0.109375,
+ "loss_eval": 2.6205759048461914,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 12133.5908203125,
+ 1301136.875,
+ 1213412.0,
+ 761869.4375,
+ 299099.96875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.181741613569102e-08,
+ 6.701867505398695e-09,
+ 6.663806839668496e-09,
+ 6.668138485821373e-09,
+ 6.665318963428035e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.4586516044801101e-05,
+ 9.615758926884155e-07,
+ 9.358571446682618e-07,
+ 9.15065527351544e-07,
+ 9.087396506402001e-07
+ ],
+ "gamma_dfa": 0.009791500167921185,
+ "acc_eval": 0.1103515625,
+ "loss_eval": 2.687662363052368,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 13778.3701171875,
+ 1831990.625,
+ 1660265.5,
+ 1070697.0,
+ 405510.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.950679510784539e-08,
+ 5.247439816002952e-09,
+ 5.240861966626653e-09,
+ 5.241989065041253e-09,
+ 5.2364685920736065e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.731455424509477e-05,
+ 7.950770282150188e-07,
+ 7.47014951230085e-07,
+ 7.077854888848378e-07,
+ 7.019767735982896e-07
+ ],
+ "gamma_dfa": 0.002645118860527873,
+ "acc_eval": 0.1083984375,
+ "loss_eval": 2.749309539794922,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 15423.7236328125,
+ 2441876.0,
+ 2156981.0,
+ 1456388.625,
+ 514814.78125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.9704105720138614e-08,
+ 4.314747670264296e-09,
+ 4.316281554395118e-09,
+ 4.3085655043739735e-09,
+ 4.306641265827693e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.53065484482795e-05,
+ 5.914198482059874e-07,
+ 5.698148015653715e-07,
+ 5.564911020883301e-07,
+ 5.521175125977607e-07
+ ],
+ "gamma_dfa": -0.004648297093808651,
+ "acc_eval": 0.087890625,
+ "loss_eval": 2.819417953491211,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 17014.275390625,
+ 3299996.25,
+ 2739406.75,
+ 1924564.5,
+ 645257.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.217410503632891e-08,
+ 3.7931444651917445e-09,
+ 3.791894354066017e-09,
+ 3.787997471249582e-09,
+ 3.786980062869816e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.8386483134236187e-05,
+ 5.170510917196225e-07,
+ 4.828122541766788e-07,
+ 4.6214248072828923e-07,
+ 4.5809062498847197e-07
+ ],
+ "gamma_dfa": -0.008237186702899635,
+ "acc_eval": 0.0771484375,
+ "loss_eval": 2.8880226612091064,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 18615.341796875,
+ 4327781.5,
+ 3460663.0,
+ 2493429.0,
+ 811358.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.4753250822159316e-08,
+ 3.4849005903225816e-09,
+ 3.4845948349016e-09,
+ 3.4844236385112026e-09,
+ 3.4833074202822445e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.760143095452804e-05,
+ 4.3398881643952336e-07,
+ 4.0691622871236177e-07,
+ 3.9397295381604636e-07,
+ 3.9136793361649325e-07
+ ],
+ "gamma_dfa": -0.013480214809533209,
+ "acc_eval": 0.107421875,
+ "loss_eval": 3.0378975868225098,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 20197.244140625,
+ 5361947.0,
+ 4309913.5,
+ 3117389.0,
+ 986810.625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.110099803890989e-08,
+ 3.3039087021791147e-09,
+ 3.3079554651038734e-09,
+ 3.309411411578367e-09,
+ 3.3057334647423886e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.7853921235655434e-05,
+ 3.920526410183811e-07,
+ 3.4606765098033065e-07,
+ 3.4065161003127287e-07,
+ 3.3874636073960573e-07
+ ],
+ "gamma_dfa": -0.017087776213884354,
+ "acc_eval": 0.1005859375,
+ "loss_eval": 3.226945161819458,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 21745.060546875,
+ 6626533.5,
+ 5288037.5,
+ 3845802.25,
+ 1183958.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.904146232500352e-08,
+ 3.0698867892198223e-09,
+ 3.072165188910958e-09,
+ 3.0722313582032257e-09,
+ 3.0718891874670362e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.694533218862489e-05,
+ 1.2521383041530498e-06,
+ 3.6304524542174477e-07,
+ 3.428452259868209e-07,
+ 3.3693893897179805e-07
+ ],
+ "gamma_dfa": -0.02254341426305473,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 3.4535317420959473,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 23268.326171875,
+ 8059270.5,
+ 6347708.5,
+ 4634334.0,
+ 1389795.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.468641882724114e-08,
+ 3.0219813318410615e-09,
+ 3.0241904536154607e-09,
+ 3.0243862969570046e-09,
+ 3.0241051884871695e-09
+ ],
+ "bp_grad_norms_F": [
+ 3.818523691734299e-05,
+ 3.265660666329495e-07,
+ 2.885882395275985e-07,
+ 2.7603223884398176e-07,
+ 2.7437968697086035e-07
+ ],
+ "gamma_dfa": -0.024787384318187833,
+ "acc_eval": 0.0830078125,
+ "loss_eval": 3.7082602977752686,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 24769.162109375,
+ 9503637.0,
+ 7524496.0,
+ 5577708.5,
+ 1619056.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.079865665422403e-08,
+ 2.885043093314721e-09,
+ 2.8850699607119168e-09,
+ 2.885329752899679e-09,
+ 2.885090166770965e-09
+ ],
+ "bp_grad_norms_F": [
+ 3.172496144543402e-05,
+ 2.7863097784575075e-07,
+ 2.5604617803764995e-07,
+ 2.4778245233392227e-07,
+ 2.465397699324967e-07
+ ],
+ "gamma_dfa": -0.028090000618249178,
+ "acc_eval": 0.09765625,
+ "loss_eval": 3.9940719604492188,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 26297.634765625,
+ 11348280.0,
+ 8835018.0,
+ 6709572.0,
+ 1860997.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.416654395659862e-08,
+ 2.716076252795574e-09,
+ 2.708202995194142e-09,
+ 2.713108182561541e-09,
+ 2.710037305675428e-09
+ ],
+ "bp_grad_norms_F": [
+ 6.21284925728105e-05,
+ 2.910503269504261e-07,
+ 2.3999916720640613e-07,
+ 2.286197116063704e-07,
+ 2.275272947827034e-07
+ ],
+ "gamma_dfa": -0.0305853869067505,
+ "acc_eval": 0.10546875,
+ "loss_eval": 4.280234336853027,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 27796.267578125,
+ 13131638.0,
+ 10275209.0,
+ 7908104.0,
+ 2124187.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.618104629931622e-08,
+ 2.527688947040474e-09,
+ 2.5195041608583324e-09,
+ 2.5170519002415404e-09,
+ 2.5167292694305843e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.9607001124531962e-05,
+ 2.280380755337319e-07,
+ 2.1368994396198104e-07,
+ 2.0886261609120993e-07,
+ 2.0800932531983563e-07
+ ],
+ "gamma_dfa": -0.032157177105546,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 4.584749221801758,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 29261.162109375,
+ 15093201.0,
+ 11924527.0,
+ 9201859.0,
+ 2398880.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.982802057744266e-08,
+ 2.362436024583303e-09,
+ 2.3667561244167246e-09,
+ 2.3683257577289396e-09,
+ 2.3661459458423906e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.4750239643035457e-05,
+ 2.0303163239532296e-07,
+ 1.9652848948226165e-07,
+ 1.9512303595092817e-07,
+ 1.9424047081884055e-07
+ ],
+ "gamma_dfa": -0.033276769798249006,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 4.833416938781738,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 30654.640625,
+ 17198064.0,
+ 13711921.0,
+ 10622219.0,
+ 2733435.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.140238432792103e-08,
+ 2.218417227695113e-09,
+ 2.217410255411778e-09,
+ 2.2205985938938966e-09,
+ 2.2187365278369953e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.2792535673943348e-05,
+ 2.101570970580724e-07,
+ 1.8281718894286314e-07,
+ 1.770977462456358e-07,
+ 1.7618602043967257e-07
+ ],
+ "gamma_dfa": -0.0334639239590615,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 5.091382026672363,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 32095.28125,
+ 19561478.0,
+ 15722807.0,
+ 12287095.0,
+ 3104931.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.42815958637766e-08,
+ 2.0783239573773926e-09,
+ 2.0685115842411506e-09,
+ 2.072532145902528e-09,
+ 2.069893811906809e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.035827492363751e-05,
+ 1.7020983023030567e-07,
+ 1.504546105479676e-07,
+ 1.4846344242869236e-07,
+ 1.4791994829010946e-07
+ ],
+ "gamma_dfa": -0.03437755152117461,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 5.338113784790039,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 33549.3515625,
+ 22241236.0,
+ 17865768.0,
+ 13953577.0,
+ 3455886.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.694593927633832e-08,
+ 1.9436505738212873e-09,
+ 1.932475734989225e-09,
+ 1.9355790303876574e-09,
+ 1.9334791545588814e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.946108568517957e-05,
+ 1.476916224874003e-07,
+ 1.3395830933404795e-07,
+ 1.3276194010813924e-07,
+ 1.323410430131844e-07
+ ],
+ "gamma_dfa": -0.035225782776251435,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 5.639235496520996,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 35003.625,
+ 25199516.0,
+ 20151382.0,
+ 15868719.0,
+ 3834722.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.815706647486877e-08,
+ 1.8191292916469592e-09,
+ 1.812876404549968e-09,
+ 1.8141808055816e-09,
+ 1.813302730191424e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.900309871416539e-05,
+ 1.3126974351962417e-07,
+ 1.2148075256845914e-07,
+ 1.204552404487913e-07,
+ 1.2008344185687747e-07
+ ],
+ "gamma_dfa": -0.036192891420796514,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 5.912903785705566,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 36385.25390625,
+ 28323954.0,
+ 22925044.0,
+ 17971546.0,
+ 4269257.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.902030484454372e-08,
+ 1.6868005880965597e-09,
+ 1.6695808069400186e-09,
+ 1.6706477312666834e-09,
+ 1.6698925575653334e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.7624819520278834e-05,
+ 1.1903176755367895e-07,
+ 1.1061406013368469e-07,
+ 1.0976869191381411e-07,
+ 1.094643096166692e-07
+ ],
+ "gamma_dfa": -0.037227407563477755,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 6.16106653213501,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 37805.91796875,
+ 31593894.0,
+ 25615532.0,
+ 20113868.0,
+ 4713793.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.859636662667981e-08,
+ 1.5704177958042465e-09,
+ 1.5608032644109926e-09,
+ 1.5628717209281717e-09,
+ 1.5616322679434802e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.6187867004191503e-05,
+ 1.0865824151551351e-07,
+ 1.0160825070215651e-07,
+ 1.008768109045377e-07,
+ 1.0061884125889264e-07
+ ],
+ "gamma_dfa": -0.03782000340288505,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 6.406368732452393,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 39138.39453125,
+ 34956036.0,
+ 28542170.0,
+ 22404560.0,
+ 5139918.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.837745551521948e-08,
+ 1.4733757547347182e-09,
+ 1.4583911855936549e-09,
+ 1.4602866693635974e-09,
+ 1.4591743369152255e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.768167749105487e-05,
+ 1.015666910575419e-07,
+ 9.354967289709748e-08,
+ 9.288694968745403e-08,
+ 9.264899603067533e-08
+ ],
+ "gamma_dfa": -0.03860464284662157,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 6.634061813354492,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 40505.18359375,
+ 38650996.0,
+ 31492410.0,
+ 24792780.0,
+ 5620949.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.942911560756329e-08,
+ 1.3685884647784974e-09,
+ 1.3593203229689266e-09,
+ 1.3602377002541743e-09,
+ 1.3594056991195202e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.0700817913166247e-05,
+ 9.837697945158652e-08,
+ 8.757055525165924e-08,
+ 8.689728048238976e-08,
+ 8.669941564676265e-08
+ ],
+ "gamma_dfa": -0.03959248901810497,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 6.7737202644348145,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 41849.203125,
+ 42830568.0,
+ 34648896.0,
+ 27355716.0,
+ 6044684.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.865106420647862e-08,
+ 1.28658228515377e-09,
+ 1.2788612391290144e-09,
+ 1.2804906024399543e-09,
+ 1.2795147164013088e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.3165159291238524e-05,
+ 9.389359689748744e-08,
+ 8.146788132989968e-08,
+ 8.082054137048544e-08,
+ 8.063241097033824e-08
+ ],
+ "gamma_dfa": -0.040185014018788934,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 6.946921348571777,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 43129.56640625,
+ 47054352.0,
+ 37982196.0,
+ 29955390.0,
+ 6540964.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0036384878731042e-07,
+ 1.2043249730808725e-09,
+ 1.2007507210753943e-09,
+ 1.2010574756970982e-09,
+ 1.2009065963880516e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.413927359157242e-05,
+ 8.847878518736252e-08,
+ 7.592807094169984e-08,
+ 7.532069901117211e-08,
+ 7.515143352065934e-08
+ ],
+ "gamma_dfa": -0.04085268918424845,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 7.133134841918945,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 44368.93359375,
+ 51374800.0,
+ 41470788.0,
+ 32761826.0,
+ 6998702.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.0049345178231306e-07,
+ 1.1348291195645288e-09,
+ 1.132080207355557e-09,
+ 1.1335333782724888e-09,
+ 1.1326910520637057e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.53067773883231e-05,
+ 8.518416905189952e-08,
+ 7.111059119324636e-08,
+ 7.048716810231781e-08,
+ 7.034290661067644e-08
+ ],
+ "gamma_dfa": -0.04143569804728031,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 7.306489944458008,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 45540.84375,
+ 55799284.0,
+ 44925840.0,
+ 35576004.0,
+ 7506460.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.999683214800825e-08,
+ 1.0682152939978096e-09,
+ 1.0609697564945009e-09,
+ 1.0612235534779302e-09,
+ 1.0610903267149752e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.843971222115215e-05,
+ 8.002744067425738e-08,
+ 6.616264869307997e-08,
+ 6.571565336344065e-08,
+ 6.558265397416108e-08
+ ],
+ "gamma_dfa": -0.04231115654692985,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 7.393707752227783,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 46740.3125,
+ 60156548.0,
+ 48609568.0,
+ 38622656.0,
+ 7923887.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.801681954968444e-08,
+ 1.007545269438026e-09,
+ 1.0030560826379542e-09,
+ 1.0032202846232963e-09,
+ 1.003132132915141e-09
+ ],
+ "bp_grad_norms_F": [
+ 2.0189601855236106e-05,
+ 7.754985631436284e-08,
+ 6.295730514693787e-08,
+ 6.247479689136526e-08,
+ 6.235500649154346e-08
+ ],
+ "gamma_dfa": -0.042783402430359274,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 7.513785362243652,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 47946.2578125,
+ 65027368.0,
+ 52475872.0,
+ 41636652.0,
+ 8527125.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.764004715862029e-08,
+ 9.540165324395389e-10,
+ 9.49443301756503e-10,
+ 9.49665124316823e-10,
+ 9.49536671512874e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.2026428268873133e-05,
+ 7.400986135053245e-08,
+ 5.9516974459938865e-08,
+ 5.903561017817083e-08,
+ 5.892941956631148e-08
+ ],
+ "gamma_dfa": -0.04377710592234507,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 7.666411876678467,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 49101.84765625,
+ 70129512.0,
+ 56707888.0,
+ 44883068.0,
+ 9051192.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.715147086808429e-08,
+ 9.088669261636539e-10,
+ 8.977363297191232e-10,
+ 8.978853771601791e-10,
+ 8.978119914182514e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.6852110750041902e-05,
+ 7.312536354220356e-08,
+ 5.6589971819676066e-08,
+ 5.605170372291468e-08,
+ 5.593761187583368e-08
+ ],
+ "gamma_dfa": -0.04420170868979767,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 7.917013645172119,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 50205.94921875,
+ 75218112.0,
+ 61038472.0,
+ 48316120.0,
+ 9560446.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.637748377144817e-08,
+ 8.535361861738977e-10,
+ 8.499229653402551e-10,
+ 8.501254145087955e-10,
+ 8.500238846131936e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.704818507481832e-05,
+ 6.82247573990935e-08,
+ 5.427460791906924e-08,
+ 5.371628120087735e-08,
+ 5.360957899824825e-08
+ ],
+ "gamma_dfa": -0.0447281262895558,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 7.9629034996032715,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 51283.7109375,
+ 79971480.0,
+ 65131160.0,
+ 51675436.0,
+ 10150061.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.52169543211312e-08,
+ 8.244336879847936e-10,
+ 8.130549011831079e-10,
+ 8.13186962211887e-10,
+ 8.13120237808107e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.043289871129673e-05,
+ 6.438099831029831e-08,
+ 5.208626419062057e-08,
+ 5.1470838258182994e-08,
+ 5.136259773053098e-08
+ ],
+ "gamma_dfa": -0.04496103324345313,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 8.225072860717773,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 52391.31640625,
+ 85212368.0,
+ 69690088.0,
+ 54922688.0,
+ 10724330.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.460915606496201e-08,
+ 7.854291661502089e-10,
+ 7.73968722445062e-10,
+ 7.748673369611936e-10,
+ 7.740979524051284e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.253111935919151e-05,
+ 6.160666288224093e-08,
+ 5.0236756976573815e-08,
+ 4.957355770329741e-08,
+ 4.9483450226261994e-08
+ ],
+ "gamma_dfa": -0.04545678128488362,
+ "acc_eval": 0.103515625,
+ "loss_eval": 8.447563171386719,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 53471.4609375,
+ 90755416.0,
+ 74424576.0,
+ 58527500.0,
+ 11383908.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.481268392619313e-08,
+ 7.485803088513876e-10,
+ 7.380538402657066e-10,
+ 7.38905825414804e-10,
+ 7.384990952097326e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.8782606023014523e-05,
+ 5.679364178945434e-08,
+ 4.747649740011184e-08,
+ 4.686737042902678e-08,
+ 4.6776307272011763e-08
+ ],
+ "gamma_dfa": -0.04577424196759239,
+ "acc_eval": 0.10546875,
+ "loss_eval": 8.63510513305664,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 54526.26171875,
+ 96224200.0,
+ 79402688.0,
+ 62338148.0,
+ 11946441.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.414058155243765e-08,
+ 7.102119448099131e-10,
+ 7.013249980758474e-10,
+ 7.021335179935306e-10,
+ 7.017796899155826e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.6797888494911604e-05,
+ 5.262990754317798e-08,
+ 4.363804251283909e-08,
+ 4.31665583278118e-08,
+ 4.308598633429028e-08
+ ],
+ "gamma_dfa": -0.04641679968335666,
+ "acc_eval": 0.10546875,
+ "loss_eval": 8.730607986450195,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 55583.125,
+ 101480040.0,
+ 83697192.0,
+ 66218348.0,
+ 12538905.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.47181035826361e-08,
+ 6.868624002898116e-10,
+ 6.774021343858294e-10,
+ 6.77987721520168e-10,
+ 6.776118000040299e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.6024237740784883e-05,
+ 5.0800426976138624e-08,
+ 4.1874233858152365e-08,
+ 4.15037817447228e-08,
+ 4.1430755715055056e-08
+ ],
+ "gamma_dfa": -0.04637146886670962,
+ "acc_eval": 0.10546875,
+ "loss_eval": 8.87772274017334,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 56556.95703125,
+ 107073544.0,
+ 88369376.0,
+ 69716112.0,
+ 13102132.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.377198040283474e-08,
+ 6.585805234493591e-10,
+ 6.487251291709129e-10,
+ 6.49616194170477e-10,
+ 6.491358561788729e-10
+ ],
+ "bp_grad_norms_F": [
+ 3.484269473119639e-05,
+ 7.467966156582406e-08,
+ 4.40217604591453e-08,
+ 4.3712645947380224e-08,
+ 4.352901683546406e-08
+ ],
+ "gamma_dfa": -0.04681209813861642,
+ "acc_eval": 0.10546875,
+ "loss_eval": 9.053573608398438,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 57504.6875,
+ 113131968.0,
+ 93389736.0,
+ 73651392.0,
+ 13735091.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.427740366163562e-08,
+ 6.312518285866986e-10,
+ 6.225254756131449e-10,
+ 6.232416249751793e-10,
+ 6.229293747495035e-10
+ ],
+ "bp_grad_norms_F": [
+ 0.00021013167861383408,
+ 5.526797508537129e-07,
+ 5.349095744122678e-08,
+ 4.9017671699402854e-08,
+ 4.773081840880877e-08
+ ],
+ "gamma_dfa": -0.047232568118488416,
+ "acc_eval": 0.10546875,
+ "loss_eval": 9.214558601379395,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 58472.46875,
+ 118762648.0,
+ 98279872.0,
+ 77365656.0,
+ 14248840.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.310819137908766e-08,
+ 6.046827483174866e-10,
+ 5.995566820793385e-10,
+ 6.004566288630997e-10,
+ 5.99891414321263e-10
+ ],
+ "bp_grad_norms_F": [
+ 0.00010149624722544104,
+ 2.533984684305324e-07,
+ 4.4013567901401984e-08,
+ 4.291897326424987e-08,
+ 4.2505401864900705e-08
+ ],
+ "gamma_dfa": -0.04764813384099398,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 9.217700958251953,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 59401.03125,
+ 124607344.0,
+ 103250600.0,
+ 81130456.0,
+ 14810775.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.245275833791311e-08,
+ 5.824435378443127e-10,
+ 5.769146271816794e-10,
+ 5.777631706394004e-10,
+ 5.772260447400868e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.0584909584140405e-05,
+ 9.203435524796078e-08,
+ 3.4605545096155765e-08,
+ 3.4145575256161464e-08,
+ 3.4092256129270027e-08
+ ],
+ "gamma_dfa": -0.04794895404484123,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 9.390031814575195,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 60278.7890625,
+ 130581952.0,
+ 108096264.0,
+ 85136336.0,
+ 15405965.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.3390447375441e-08,
+ 5.630300670134147e-10,
+ 5.5805338128323e-10,
+ 5.588779439236191e-10,
+ 5.583465911840335e-10
+ ],
+ "bp_grad_norms_F": [
+ 4.781157258548774e-05,
+ 1.0881421275144021e-07,
+ 3.3062310222931046e-08,
+ 3.248984370429753e-08,
+ 3.2446724418377926e-08
+ ],
+ "gamma_dfa": -0.04778411969891749,
+ "acc_eval": 0.10546875,
+ "loss_eval": 9.621635437011719,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 61138.51171875,
+ 136691760.0,
+ 113402280.0,
+ 88772512.0,
+ 15993850.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.273151135857916e-08,
+ 5.43037670386326e-10,
+ 5.421059157129093e-10,
+ 5.42630551603196e-10,
+ 5.423762550194056e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.6410325517645106e-05,
+ 4.767177586018079e-08,
+ 3.172428364450752e-08,
+ 3.129938974666402e-08,
+ 3.1260690036560845e-08
+ ],
+ "gamma_dfa": -0.04829322246951051,
+ "acc_eval": 0.099609375,
+ "loss_eval": 9.733180046081543,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 61988.87890625,
+ 142480176.0,
+ 118613440.0,
+ 92755400.0,
+ 16660659.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.238209486284177e-08,
+ 5.250901380371431e-10,
+ 5.242600242816309e-10,
+ 5.243941947341568e-10,
+ 5.243331879789537e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.4320243028341793e-05,
+ 4.237628559167206e-08,
+ 3.048009489248216e-08,
+ 3.0116801497115375e-08,
+ 3.0080638424578865e-08
+ ],
+ "gamma_dfa": -0.048452052724314854,
+ "acc_eval": 0.0986328125,
+ "loss_eval": 9.875200271606445,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 62831.0078125,
+ 148088512.0,
+ 124018112.0,
+ 96570944.0,
+ 17294454.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.218231866725546e-08,
+ 5.094495381108288e-10,
+ 5.088939269981552e-10,
+ 5.090234345139777e-10,
+ 5.089637600264041e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.273459904245101e-05,
+ 3.8132583313199575e-08,
+ 2.9463127049211835e-08,
+ 2.9154062275438264e-08,
+ 2.9119732403160015e-08
+ ],
+ "gamma_dfa": -0.04870791392750107,
+ "acc_eval": 0.1015625,
+ "loss_eval": 9.965906143188477,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 63619.36328125,
+ 153924256.0,
+ 129021120.0,
+ 100401856.0,
+ 17813234.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.170297232685698e-08,
+ 4.942196096813234e-10,
+ 4.92394736095747e-10,
+ 4.925179708514804e-10,
+ 4.924622931667955e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.1741494492744096e-05,
+ 3.567927819858596e-08,
+ 2.843704471899855e-08,
+ 2.816011068773605e-08,
+ 2.812711485944419e-08
+ ],
+ "gamma_dfa": -0.049255506150075234,
+ "acc_eval": 0.1025390625,
+ "loss_eval": 9.984619140625,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 64400.26171875,
+ 159789408.0,
+ 134080160.0,
+ 104244408.0,
+ 18432430.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.070604534144877e-08,
+ 4.78996176056512e-10,
+ 4.780518758629171e-10,
+ 4.781712803492155e-10,
+ 4.781176565771261e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.1263931557768956e-05,
+ 3.437593676380857e-08,
+ 2.7499025279098532e-08,
+ 2.7248480805042163e-08,
+ 2.7216600528845447e-08
+ ],
+ "gamma_dfa": -0.04910894545173505,
+ "acc_eval": 0.0986328125,
+ "loss_eval": 10.146781921386719,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 65147.40234375,
+ 165462976.0,
+ 138862000.0,
+ 107834176.0,
+ 19038348.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.061706407464953e-08,
+ 4.668093134263529e-10,
+ 4.645184237261901e-10,
+ 4.6463269343099967e-10,
+ 4.6457995783732997e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.0052335457876325e-05,
+ 3.337338227993314e-08,
+ 2.6690587517919084e-08,
+ 2.646976504649956e-08,
+ 2.64381352366172e-08
+ ],
+ "gamma_dfa": -0.04920872090588091,
+ "acc_eval": 0.0966796875,
+ "loss_eval": 10.281063079833984,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 65863.96875,
+ 171261072.0,
+ 143810992.0,
+ 111834848.0,
+ 19625576.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.099313302840528e-08,
+ 4.5625103695101643e-10,
+ 4.524729202426414e-10,
+ 4.5258219394384014e-10,
+ 4.5253126246258546e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.9101036741631106e-05,
+ 3.2813989747637606e-08,
+ 2.5957119120789685e-08,
+ 2.5756730082093782e-08,
+ 2.572607549211625e-08
+ ],
+ "gamma_dfa": -0.04933306630846346,
+ "acc_eval": 0.0986328125,
+ "loss_eval": 10.349817276000977,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 66593.8203125,
+ 176983552.0,
+ 149183712.0,
+ 115646976.0,
+ 20178866.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.1175948568889e-08,
+ 4.444306589412861e-10,
+ 4.412468168624173e-10,
+ 4.4135325949490323e-10,
+ 4.413052423490882e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.852569039328955e-05,
+ 3.21252677792927e-08,
+ 2.5265682879194173e-08,
+ 2.5077683929453087e-08,
+ 2.5048496610224902e-08
+ ],
+ "gamma_dfa": -0.04927207152650226,
+ "acc_eval": 0.1015625,
+ "loss_eval": 10.515829086303711,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 67302.6328125,
+ 182834976.0,
+ 154352272.0,
+ 119312168.0,
+ 20747826.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.146700818973841e-08,
+ 4.3625753010090307e-10,
+ 4.31810531775767e-10,
+ 4.319128388274862e-10,
+ 4.3186304532483177e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.817524571379181e-05,
+ 3.176044671704403e-08,
+ 2.468624060725233e-08,
+ 2.4515436791716638e-08,
+ 2.4487377459081472e-08
+ ],
+ "gamma_dfa": -0.04947220539179398,
+ "acc_eval": 0.1015625,
+ "loss_eval": 10.631593704223633,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 67943.6640625,
+ 188557808.0,
+ 159066528.0,
+ 122911296.0,
+ 21287842.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.120569188780792e-08,
+ 4.2657519183642023e-10,
+ 4.219723181986268e-10,
+ 4.220687410683155e-10,
+ 4.220172822311241e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.8009301129495725e-05,
+ 3.077772348092367e-08,
+ 2.4100344830912945e-08,
+ 2.3935520232498675e-08,
+ 2.390864395351855e-08
+ ],
+ "gamma_dfa": -0.04969306073326152,
+ "acc_eval": 0.1025390625,
+ "loss_eval": 10.66339111328125,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 68579.2578125,
+ 193996528.0,
+ 163940560.0,
+ 126448000.0,
+ 21766094.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.058499728098468e-08,
+ 4.1539605089013776e-10,
+ 4.1060946309734447e-10,
+ 4.1091324787245753e-10,
+ 4.10790096383451e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5884443200775422e-05,
+ 2.8224185655290057e-08,
+ 2.346608596326405e-08,
+ 2.3316024666542035e-08,
+ 2.328991399735969e-08
+ ],
+ "gamma_dfa": -0.04980730817624135,
+ "acc_eval": 0.0986328125,
+ "loss_eval": 10.783552169799805,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 69203.796875,
+ 199460144.0,
+ 168890016.0,
+ 129780784.0,
+ 22302874.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.078585350152935e-08,
+ 4.0699738024230214e-10,
+ 4.025394462203735e-10,
+ 4.0283623659043144e-10,
+ 4.027146949248106e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5867637557676062e-05,
+ 2.8422073583556084e-08,
+ 2.300496149132414e-08,
+ 2.2864167448233275e-08,
+ 2.2838495539190262e-08
+ ],
+ "gamma_dfa": -0.04992603903519921,
+ "acc_eval": 0.09765625,
+ "loss_eval": 10.859743118286133,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 69791.453125,
+ 204736432.0,
+ 173582192.0,
+ 133232672.0,
+ 22820996.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.066331330132016e-08,
+ 3.96910615485524e-10,
+ 3.925613167865549e-10,
+ 3.926495240058614e-10,
+ 3.9260561468523747e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.4505669241771102e-05,
+ 2.6905636829610557e-08,
+ 2.2510086239435623e-08,
+ 2.2376122288392253e-08,
+ 2.235119467286495e-08
+ ],
+ "gamma_dfa": -0.04994637455092743,
+ "acc_eval": 0.0986328125,
+ "loss_eval": 10.989320755004883,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 70371.9375,
+ 210191472.0,
+ 178149376.0,
+ 136544128.0,
+ 23324878.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.057572469828301e-08,
+ 3.849987550985645e-10,
+ 3.8476868913228657e-10,
+ 3.8500982957323515e-10,
+ 3.8497979804041904e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.4466082575381733e-05,
+ 2.6583837353655326e-08,
+ 2.2064293503376575e-08,
+ 2.1934541294399423e-08,
+ 2.191077008717457e-08
+ ],
+ "gamma_dfa": -0.05017502269765828,
+ "acc_eval": 0.1015625,
+ "loss_eval": 11.14348030090332,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 70926.1171875,
+ 215072384.0,
+ 182463952.0,
+ 139682864.0,
+ 23765930.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.095985831208964e-08,
+ 3.789666913611711e-10,
+ 3.7876501934874796e-10,
+ 3.788162006301832e-10,
+ 3.7878628011966953e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5613211871823296e-05,
+ 2.6332656943850452e-08,
+ 2.168836488181114e-08,
+ 2.1559124263603735e-08,
+ 2.1535397465299866e-08
+ ],
+ "gamma_dfa": -0.05026113349595107,
+ "acc_eval": 0.1015625,
+ "loss_eval": 11.245050430297852,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 71444.5078125,
+ 220139504.0,
+ 186860912.0,
+ 142962752.0,
+ 24235874.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.007455048504198e-08,
+ 3.741315868222017e-10,
+ 3.7062136692966874e-10,
+ 3.705513118568149e-10,
+ 3.7064074032144845e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.3456123017240316e-05,
+ 2.666844878262964e-08,
+ 2.1298749430798125e-08,
+ 2.1137482875133173e-08,
+ 2.1113727655119874e-08
+ ],
+ "gamma_dfa": -0.050498483098635916,
+ "acc_eval": 0.095703125,
+ "loss_eval": 11.284198760986328,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 71960.484375,
+ 225013808.0,
+ 190973296.0,
+ 145961232.0,
+ 24784322.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.034386749817713e-08,
+ 3.658137681661344e-10,
+ 3.6446287654534615e-10,
+ 3.645108936911612e-10,
+ 3.6448208340367216e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.785225660772994e-05,
+ 2.5983931450923592e-08,
+ 2.1029784136317176e-08,
+ 2.0842044534674642e-08,
+ 2.0818688994950207e-08
+ ],
+ "gamma_dfa": -0.05046346641029231,
+ "acc_eval": 0.0986328125,
+ "loss_eval": 11.392132759094238,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 72430.8359375,
+ 229851040.0,
+ 195010560.0,
+ 149020912.0,
+ 25253220.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.096932984675732e-08,
+ 3.608093823714853e-10,
+ 3.5983932500371907e-10,
+ 3.600989784136033e-10,
+ 3.599919529140294e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.763499469438102e-05,
+ 2.5544034443214514e-08,
+ 2.0638090347802063e-08,
+ 2.0451848214975143e-08,
+ 2.0428588598520037e-08
+ ],
+ "gamma_dfa": -0.050787233689334244,
+ "acc_eval": 0.091796875,
+ "loss_eval": 11.378694534301758,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 72896.0234375,
+ 234300800.0,
+ 198948976.0,
+ 152100720.0,
+ 25625868.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.0542243924574e-08,
+ 3.557290573219518e-10,
+ 3.5249042573681777e-10,
+ 3.5253552854719317e-10,
+ 3.5250652397067483e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.9849852580809966e-05,
+ 2.5036932527200406e-08,
+ 2.0406586642707225e-08,
+ 2.020845712991104e-08,
+ 2.0186647020636883e-08
+ ],
+ "gamma_dfa": -0.05070546226488659,
+ "acc_eval": 0.095703125,
+ "loss_eval": 11.479286193847656,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 73328.34375,
+ 238316288.0,
+ 202586032.0,
+ 155039648.0,
+ 26024600.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.105094989081408e-08,
+ 3.510710333554101e-10,
+ 3.495781997209235e-10,
+ 3.500161271929869e-10,
+ 3.499118772509746e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.91574870061595e-05,
+ 2.4413550292479158e-08,
+ 2.0145231260926266e-08,
+ 1.9952185681404444e-08,
+ 1.9931007955165114e-08
+ ],
+ "gamma_dfa": -0.05086314045183826,
+ "acc_eval": 0.0908203125,
+ "loss_eval": 11.489895820617676,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 73748.5859375,
+ 242733616.0,
+ 206386528.0,
+ 157821696.0,
+ 26465746.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.082241803071156e-08,
+ 3.460224329288053e-10,
+ 3.438662687926808e-10,
+ 3.4428762618610165e-10,
+ 3.442592599878225e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.8733484214171767e-05,
+ 2.375874608162576e-08,
+ 1.9914560667189107e-08,
+ 1.971613627915758e-08,
+ 1.969561402859199e-08
+ ],
+ "gamma_dfa": -0.05102878155594226,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 11.548040390014648,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 74135.421875,
+ 246595824.0,
+ 209988560.0,
+ 160289792.0,
+ 26835076.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.098909714566616e-08,
+ 3.4202959908746777e-10,
+ 3.378679835908116e-10,
+ 3.3727598491850586e-10,
+ 3.370834167348846e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.7568949008127674e-05,
+ 2.2366455354472237e-08,
+ 1.9751842827986366e-08,
+ 1.955501183203978e-08,
+ 1.9534347472927038e-08
+ ],
+ "gamma_dfa": -0.05096771135140443,
+ "acc_eval": 0.091796875,
+ "loss_eval": 11.69294548034668,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 74519.4609375,
+ 250496496.0,
+ 213470016.0,
+ 163034096.0,
+ 27224026.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.081137619659785e-08,
+ 3.371838919186132e-10,
+ 3.34856059547306e-10,
+ 3.351785793359596e-10,
+ 3.353441968556581e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.4417575332336128e-05,
+ 2.182440006492925e-08,
+ 1.9469752032819088e-08,
+ 1.9279319474208023e-08,
+ 1.925921822021337e-08
+ ],
+ "gamma_dfa": -0.051001671119593084,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 11.729022026062012,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 74894.3515625,
+ 254264416.0,
+ 216871648.0,
+ 165452496.0,
+ 27605496.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.085709962164401e-08,
+ 3.3377053898497877e-10,
+ 3.3198219173691257e-10,
+ 3.3151825729049733e-10,
+ 3.3171596025560746e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.2483380234916694e-05,
+ 2.14983302271321e-08,
+ 1.9263785233647468e-08,
+ 1.9080003355043118e-08,
+ 1.9060196976283805e-08
+ ],
+ "gamma_dfa": -0.050941091212735046,
+ "acc_eval": 0.087890625,
+ "loss_eval": 11.798931121826172,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 75242.4609375,
+ 257808672.0,
+ 219912720.0,
+ 167826688.0,
+ 27928376.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.091576913533572e-08,
+ 3.2881539158147177e-10,
+ 3.263028736100182e-10,
+ 3.2664609905808106e-10,
+ 3.264644665712524e-10
+ ],
+ "bp_grad_norms_F": [
+ 2.127209518221207e-05,
+ 2.0985540416518234e-08,
+ 1.9050151678356997e-08,
+ 1.8875326190936903e-08,
+ 1.8856361805319466e-08
+ ],
+ "gamma_dfa": -0.05089846828195732,
+ "acc_eval": 0.091796875,
+ "loss_eval": 11.895479202270508,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 75572.1171875,
+ 261119824.0,
+ 222742832.0,
+ 169876672.0,
+ 28198556.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.057247041255323e-08,
+ 3.278008420259937e-10,
+ 3.249100710700503e-10,
+ 3.242202339936995e-10,
+ 3.244049195938459e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.884793528006412e-05,
+ 2.07159356335751e-08,
+ 1.889556244805135e-08,
+ 1.8724394479363582e-08,
+ 1.8705017978959404e-08
+ ],
+ "gamma_dfa": -0.05079331841261592,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 11.890766143798828,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 75874.0546875,
+ 264210176.0,
+ 225470416.0,
+ 172025616.0,
+ 28547836.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.025038849586053e-08,
+ 3.2404043337486144e-10,
+ 3.204363163700208e-10,
+ 3.2077221434612113e-10,
+ 3.205906651260193e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.7337119061267003e-05,
+ 2.020676426184309e-08,
+ 1.872472488173571e-08,
+ 1.8554693781425158e-08,
+ 1.853570097409829e-08
+ ],
+ "gamma_dfa": -0.05096161225810647,
+ "acc_eval": 0.0849609375,
+ "loss_eval": 11.900531768798828,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 76155.671875,
+ 267008752.0,
+ 228187344.0,
+ 173959248.0,
+ 28788394.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.046407711821303e-08,
+ 3.195448350368224e-10,
+ 3.1774499698045133e-10,
+ 3.1807836919917065e-10,
+ 3.179001784037183e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.667224569246173e-05,
+ 2.00564560515204e-08,
+ 1.8585067707022063e-08,
+ 1.8417832592376726e-08,
+ 1.8399065382368462e-08
+ ],
+ "gamma_dfa": -0.05094757055485388,
+ "acc_eval": 0.087890625,
+ "loss_eval": 11.944206237792969,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 76421.0625,
+ 269839616.0,
+ 230674688.0,
+ 175791728.0,
+ 29094570.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 9.012642010475247e-08,
+ 3.166587547731581e-10,
+ 3.1469221672963954e-10,
+ 3.1502128683413844e-10,
+ 3.1484426177286196e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6745894754421897e-05,
+ 1.9875857404372255e-08,
+ 1.840698438115851e-08,
+ 1.8240543298020384e-08,
+ 1.822207096324746e-08
+ ],
+ "gamma_dfa": -0.05100561307335738,
+ "acc_eval": 0.0859375,
+ "loss_eval": 11.99311637878418,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 76664.2734375,
+ 272336768.0,
+ 232959216.0,
+ 177609664.0,
+ 29323556.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.990726030333462e-08,
+ 3.1504263087178686e-10,
+ 3.12906783817013e-10,
+ 3.131215564611267e-10,
+ 3.1305841252660116e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6934929590206593e-05,
+ 1.98417797747652e-08,
+ 1.8281056668456586e-08,
+ 1.8116447009219883e-08,
+ 1.8098068821359448e-08
+ ],
+ "gamma_dfa": -0.05103835645422805,
+ "acc_eval": 0.0849609375,
+ "loss_eval": 12.02127456665039,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 76888.4921875,
+ 274732928.0,
+ 235060816.0,
+ 179132768.0,
+ 29504610.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.986659594256707e-08,
+ 3.121746194878483e-10,
+ 3.1075714224115814e-10,
+ 3.1084415597071313e-10,
+ 3.1076746731528715e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.7154834495158866e-05,
+ 1.9609577961432478e-08,
+ 1.816025729795001e-08,
+ 1.7994944201404905e-08,
+ 1.7976633515104368e-08
+ ],
+ "gamma_dfa": -0.05099774348491337,
+ "acc_eval": 0.083984375,
+ "loss_eval": 12.060166358947754,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 77091.2421875,
+ 277045280.0,
+ 237230640.0,
+ 180794320.0,
+ 29739022.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.99742147453253e-08,
+ 3.103251822178521e-10,
+ 3.08925968139917e-10,
+ 3.089623279439735e-10,
+ 3.0893596014713864e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.679581509961281e-05,
+ 1.951891448470633e-08,
+ 1.803828730828627e-08,
+ 1.787446990419994e-08,
+ 1.785628889194868e-08
+ ],
+ "gamma_dfa": -0.050966299066203646,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.12912654876709,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 77280.328125,
+ 279085056.0,
+ 239194416.0,
+ 182229856.0,
+ 29919720.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.955728958426334e-08,
+ 3.0862179478674534e-10,
+ 3.06326686239089e-10,
+ 3.067510134791007e-10,
+ 3.0670044282032904e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6653601051075384e-05,
+ 1.913345748505435e-08,
+ 1.7934322471546693e-08,
+ 1.7773432503531694e-08,
+ 1.7755372283545512e-08
+ ],
+ "gamma_dfa": -0.050885657081380486,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.196252822875977,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 77464.84375,
+ 281044160.0,
+ 241080400.0,
+ 183481632.0,
+ 30118970.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.968549281007654e-08,
+ 3.077238464044285e-10,
+ 3.0509625381647254e-10,
+ 3.05251185439559e-10,
+ 3.0514471505149743e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6696472812327556e-05,
+ 1.9041245025164244e-08,
+ 1.7839029808897067e-08,
+ 1.767946500308426e-08,
+ 1.766149004822637e-08
+ ],
+ "gamma_dfa": -0.05102008958783699,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.193323135375977,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 77630.7734375,
+ 282858400.0,
+ 242823728.0,
+ 184645696.0,
+ 30321804.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.95526710564809e-08,
+ 3.0606236989250135e-10,
+ 3.0359312286343254e-10,
+ 3.0362826142216193e-10,
+ 3.0360203240320516e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.670894562266767e-05,
+ 1.8970476745039377e-08,
+ 1.7750505065805555e-08,
+ 1.7592398648957897e-08,
+ 1.7574748767401616e-08
+ ],
+ "gamma_dfa": -0.05112272154656239,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.226293563842773,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 77779.6484375,
+ 284380192.0,
+ 244252416.0,
+ 185749600.0,
+ 30452270.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.966701159351942e-08,
+ 3.0471447587387956e-10,
+ 3.022795902474229e-10,
+ 3.0231497860633283e-10,
+ 3.022894989879177e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6740978026064113e-05,
+ 1.889440781610574e-08,
+ 1.7666355489609487e-08,
+ 1.7510158656364183e-08,
+ 1.749260469807723e-08
+ ],
+ "gamma_dfa": -0.05107468220376177,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.260065078735352,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 77920.109375,
+ 285895104.0,
+ 245542864.0,
+ 186746576.0,
+ 30585936.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.98649830105569e-08,
+ 3.0335337020126474e-10,
+ 3.010065807718121e-10,
+ 3.0114838400763233e-10,
+ 3.010563187633153e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6312769730575383e-05,
+ 1.8841578963701977e-08,
+ 1.7605929159003608e-08,
+ 1.7449115929935033e-08,
+ 1.7431389665034658e-08
+ ],
+ "gamma_dfa": -0.051095581700792536,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.283187866210938,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 78045.9765625,
+ 287308480.0,
+ 246744592.0,
+ 187657408.0,
+ 30732464.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.991665367830137e-08,
+ 3.023456207618125e-10,
+ 3.001092707677344e-10,
+ 3.002506299143448e-10,
+ 3.001580373140911e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6261117707472295e-05,
+ 1.8763861575621377e-08,
+ 1.7538225094426707e-08,
+ 1.73831011807124e-08,
+ 1.7365564985993842e-08
+ ],
+ "gamma_dfa": -0.05111259325349238,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.312464714050293,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 78157.4453125,
+ 288495296.0,
+ 247894048.0,
+ 188423328.0,
+ 30852564.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.983852950450455e-08,
+ 3.0117680571706273e-10,
+ 2.9906743748142617e-10,
+ 2.9920824151652425e-10,
+ 2.991159819831779e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6263733414234594e-05,
+ 1.8713789629032362e-08,
+ 1.7478631875178507e-08,
+ 1.7324792267459088e-08,
+ 1.730730758708887e-08
+ ],
+ "gamma_dfa": -0.05116538004585891,
+ "acc_eval": 0.0849609375,
+ "loss_eval": 12.31210994720459,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 78262.0234375,
+ 289603808.0,
+ 248882656.0,
+ 189149776.0,
+ 30956266.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.960672204239017e-08,
+ 3.0011432228249646e-10,
+ 2.9822597169548715e-10,
+ 2.9836624837464853e-10,
+ 2.9827409986360465e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.631741542951204e-05,
+ 1.8692462688818523e-08,
+ 1.7431661447631086e-08,
+ 1.7277525188319487e-08,
+ 1.725989662304528e-08
+ ],
+ "gamma_dfa": -0.05115435087645892,
+ "acc_eval": 0.083984375,
+ "loss_eval": 12.336039543151855,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 78353.1171875,
+ 290648000.0,
+ 249810592.0,
+ 189809696.0,
+ 31040388.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.986083344098006e-08,
+ 2.995071968214802e-10,
+ 2.9758684405578606e-10,
+ 2.977268154236157e-10,
+ 2.9763422282336194e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6262692952295765e-05,
+ 1.849162600819909e-08,
+ 1.73968519590062e-08,
+ 1.7244063954535704e-08,
+ 1.7226579274165488e-08
+ ],
+ "gamma_dfa": -0.05118084823334357,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.381507873535156,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 78431.15625,
+ 291523168.0,
+ 250644688.0,
+ 190386224.0,
+ 31126390.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.970421561116382e-08,
+ 2.984960056906516e-10,
+ 2.967268375453358e-10,
+ 2.968662538016531e-10,
+ 2.967753265359363e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6223337297560647e-05,
+ 1.8457278372352448e-08,
+ 1.7345271885460534e-08,
+ 1.7192725465520198e-08,
+ 1.717533315570563e-08
+ ],
+ "gamma_dfa": -0.05117447574957623,
+ "acc_eval": 0.0849609375,
+ "loss_eval": 12.38785171508789,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 78499.1484375,
+ 292312512.0,
+ 251365920.0,
+ 190918880.0,
+ 31200688.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.988487110173082e-08,
+ 2.980244662165177e-10,
+ 2.966143997085169e-10,
+ 2.96407148825395e-10,
+ 2.965439005464532e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.627574602025561e-05,
+ 1.8460895034877467e-08,
+ 1.7314020439584965e-08,
+ 1.7161701393320072e-08,
+ 1.714437836142224e-08
+ ],
+ "gamma_dfa": -0.05115793484583264,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.419504165649414,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 78560.8984375,
+ 292944192.0,
+ 251977760.0,
+ 191372272.0,
+ 31263360.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.973138676537928e-08,
+ 2.973402635220168e-10,
+ 2.9567431836241553e-10,
+ 2.958131239960693e-10,
+ 2.957224187749574e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.628614336368628e-05,
+ 1.8427853021307783e-08,
+ 1.72794418773492e-08,
+ 1.7127625540069857e-08,
+ 1.7110302508172026e-08
+ ],
+ "gamma_dfa": -0.0511754965664295,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.422038078308105,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 78610.8515625,
+ 293507168.0,
+ 252467824.0,
+ 191746752.0,
+ 31315682.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.979492349681095e-08,
+ 2.9698124515142865e-10,
+ 2.9562619019429803e-10,
+ 2.9538149703967065e-10,
+ 2.9551999736199264e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.631640589039307e-05,
+ 1.8418628400240777e-08,
+ 1.726077947239446e-08,
+ 1.710880859207009e-08,
+ 1.709145003303547e-08
+ ],
+ "gamma_dfa": -0.051156919635104714,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.428571701049805,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 78652.9921875,
+ 293964640.0,
+ 252896208.0,
+ 192039472.0,
+ 31369200.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.969335141273405e-08,
+ 2.9646449184461687e-10,
+ 2.949255561990327e-10,
+ 2.949690214304468e-10,
+ 2.9487870478739353e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.6324445823556744e-05,
+ 1.8399745727037953e-08,
+ 1.7238173555256253e-08,
+ 1.7086200898575044e-08,
+ 1.7068817470544673e-08
+ ],
+ "gamma_dfa": -0.051174478845496196,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.429685592651367,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 78686.6953125,
+ 294364864.0,
+ 253268672.0,
+ 192287472.0,
+ 31404650.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.964375552977799e-08,
+ 2.960394152040635e-10,
+ 2.9448907201690133e-10,
+ 2.9462729478346716e-10,
+ 2.9453686711811145e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5716021152911708e-05,
+ 1.8335738261043844e-08,
+ 1.7222946624428914e-08,
+ 1.7072181890398497e-08,
+ 1.7054745171662944e-08
+ ],
+ "gamma_dfa": -0.05117890803012415,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.430795669555664,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 78715.6640625,
+ 294704960.0,
+ 253580416.0,
+ 192507984.0,
+ 31439268.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.966816267275135e-08,
+ 2.9585070504545286e-10,
+ 2.9467184248233025e-10,
+ 2.944416099825986e-10,
+ 2.943854882087038e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.575841633894015e-05,
+ 1.832342988450364e-08,
+ 1.7211402081329652e-08,
+ 1.7061056567513333e-08,
+ 1.704364827048721e-08
+ ],
+ "gamma_dfa": -0.05119702904630685,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.439577102661133,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 78736.21875,
+ 294950432.0,
+ 253812928.0,
+ 192667952.0,
+ 31460118.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.969291798166523e-08,
+ 2.956498934558738e-10,
+ 2.9448718463775947e-10,
+ 2.947934119035267e-10,
+ 2.946275168280721e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5731959138065577e-05,
+ 1.8296260506645012e-08,
+ 1.719953068857194e-08,
+ 1.7050359346626465e-08,
+ 1.703298835309397e-08
+ ],
+ "gamma_dfa": -0.05120327511394862,
+ "acc_eval": 0.0888671875,
+ "loss_eval": 12.4466552734375,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 78753.203125,
+ 295147232.0,
+ 253989200.0,
+ 192796160.0,
+ 31479312.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.963842645925979e-08,
+ 2.9541508128616556e-10,
+ 2.9437702275814104e-10,
+ 2.943085775086729e-10,
+ 2.9446245441988594e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.573332519910764e-05,
+ 1.8288872638549947e-08,
+ 1.718973052788897e-08,
+ 1.7040525435163545e-08,
+ 1.7023159770701568e-08
+ ],
+ "gamma_dfa": -0.051216166342783254,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.445267677307129,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 78765.84375,
+ 295294944.0,
+ 254123440.0,
+ 192894032.0,
+ 31493604.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.965194098209395e-08,
+ 2.9531932455029164e-10,
+ 2.942409649264732e-10,
+ 2.945468868809087e-10,
+ 2.943810750721809e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5746687495266087e-05,
+ 1.8289329162257673e-08,
+ 1.7184650147328284e-08,
+ 1.703533136776514e-08,
+ 1.7017976361444198e-08
+ ],
+ "gamma_dfa": -0.0512156481272541,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.449201583862305,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 78774.0859375,
+ 295388160.0,
+ 254208896.0,
+ 192955280.0,
+ 31502434.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.963444741993953e-08,
+ 2.9521793343256775e-10,
+ 2.941772103692841e-10,
+ 2.944521015901813e-10,
+ 2.9431723724826497e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.574558154970873e-05,
+ 1.8287312997244953e-08,
+ 1.7180775913061552e-08,
+ 1.7031513976917267e-08,
+ 1.7014160746953166e-08
+ ],
+ "gamma_dfa": -0.051216532388934866,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.451032638549805,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 78778.2109375,
+ 295438176.0,
+ 254253040.0,
+ 192987616.0,
+ 31507318.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.962313557958623e-08,
+ 2.951474897816553e-10,
+ 2.9410018864695076e-10,
+ 2.9431876380492383e-10,
+ 2.9424027103708283e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5746518329251558e-05,
+ 1.8286739233985827e-08,
+ 1.717829789527059e-08,
+ 1.7028938259500137e-08,
+ 1.7011583253179197e-08
+ ],
+ "gamma_dfa": -0.051216747364378534,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.451074600219727,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 78782.125,
+ 295481568.0,
+ 254291456.0,
+ 193016112.0,
+ 31511684.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.962148712043927e-08,
+ 2.9511454391339953e-10,
+ 2.9406876933535386e-10,
+ 2.942796561988814e-10,
+ 2.9420885172548594e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.574746784172021e-05,
+ 1.8285794212147266e-08,
+ 1.7176807531882332e-08,
+ 1.7027431908900326e-08,
+ 1.7010076902579385e-08
+ ],
+ "gamma_dfa": -0.05121716375651886,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.451665878295898,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 78783.9921875,
+ 295502592.0,
+ 254310320.0,
+ 193029024.0,
+ 31513524.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.961931285966784e-08,
+ 2.950964195225225e-10,
+ 2.940539201023995e-10,
+ 2.942680543682741e-10,
+ 2.941940024925316e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5747409634059295e-05,
+ 1.8284790570533005e-08,
+ 1.717580744298175e-08,
+ 1.702643714907026e-08,
+ 1.700908214274932e-08
+ ],
+ "gamma_dfa": -0.05121721836621873,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.452173233032227,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 78784.0078125,
+ 295502688.0,
+ 254310576.0,
+ 193029360.0,
+ 31513636.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.96192702271037e-08,
+ 2.9509686361173237e-10,
+ 2.940537813245214e-10,
+ 2.9426569514434675e-10,
+ 2.941938359590779e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.5747655197628774e-05,
+ 1.8284845637595026e-08,
+ 1.7175850075545895e-08,
+ 1.7026476228920728e-08,
+ 1.7009122998956627e-08
+ ],
+ "gamma_dfa": -0.05121716100984486,
+ "acc_eval": 0.087890625,
+ "loss_eval": 12.452241897583008,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file