diff options
Diffstat (limited to 'results/h2_no_residual_full_s123/snapshot_evolution_s123.json')
| -rw-r--r-- | results/h2_no_residual_full_s123/snapshot_evolution_s123.json | 2749 |
1 files changed, 2749 insertions, 0 deletions
diff --git a/results/h2_no_residual_full_s123/snapshot_evolution_s123.json b/results/h2_no_residual_full_s123/snapshot_evolution_s123.json new file mode 100644 index 0000000..cbad0e4 --- /dev/null +++ b/results/h2_no_residual_full_s123/snapshot_evolution_s123.json @@ -0,0 +1,2749 @@ +{ + "config": { + "output_dir": "results/h2_no_residual_full_s123", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 123, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5, + "random_targets": false, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.690464973449707, + 42.59831619262695, + 44.3453369140625, + 42.22452926635742, + 42.9206428527832 + ], + "bp_grad_norms_per_sample_med": [ + 0.001107031712308526, + 0.00020295626018196344, + 0.00014012052270118147, + 0.00011155186803080142, + 9.737444634083658e-05 + ], + "bp_grad_norms_F": [ + 0.03999145328998566, + 0.006603884976357222, + 0.004542526323348284, + 0.0036035836674273014, + 0.003130683209747076 + ], + "gamma_dfa": 0.014937716419808567, + "acc_eval": 0.1025390625, + "loss_eval": 2.4329679012298584, + "epoch": 0 + }, + { + "hidden_norms": [ + 1439.9598388671875, + 6195.9453125, + 9461.9462890625, + 7636.810546875, + 4633.29296875 + ], + "bp_grad_norms_per_sample_med": [ + 9.333700745628448e-07, + 6.382089736689522e-07, + 6.313390485956916e-07, + 6.29996520729037e-07, + 6.307979560915555e-07 + ], + "bp_grad_norms_F": [ + 5.84688204980921e-05, + 4.571088356897235e-05, + 4.522907693171874e-05, + 4.505911419983022e-05, + 4.481491123442538e-05 + ], + "gamma_dfa": 0.029066061251796782, + "acc_eval": 0.0888671875, + "loss_eval": 2.4298276901245117, + "epoch": 1 + }, + { + "hidden_norms": [ + 3191.640380859375, + 44469.08984375, + 64403.30859375, + 40298.74609375, + 20860.859375 + ], + "bp_grad_norms_per_sample_med": [ + 2.3425519657394034e-07, + 1.0419660867455605e-07, + 1.0399938332739112e-07, + 1.0393744531711491e-07, + 1.040296524479345e-07 + ], + "bp_grad_norms_F": [ + 2.9355647711781785e-05, + 1.3215229955676477e-05, + 1.2938599866174627e-05, + 1.2853749467467424e-05, + 1.2806296581402421e-05 + ], + "gamma_dfa": 0.026177803985774517, + "acc_eval": 0.0849609375, + "loss_eval": 2.450077533721924, + "epoch": 2 + }, + { + "hidden_norms": [ + 5072.8369140625, + 136290.921875, + 174667.984375, + 99872.765625, + 48604.14453125 + ], + "bp_grad_norms_per_sample_med": [ + 1.2239583213613514e-07, + 3.922263758227018e-08, + 3.8977361782599473e-08, + 3.902984602177639e-08, + 3.902538381339582e-08 + ], + "bp_grad_norms_F": [ + 2.021085128944833e-05, + 5.516366400115658e-06, + 5.3598869271809235e-06, + 5.317293016560143e-06, + 5.302062618284253e-06 + ], + "gamma_dfa": 0.025070607429370284, + "acc_eval": 0.1298828125, + "loss_eval": 2.470280170440674, + "epoch": 3 + }, + { + "hidden_norms": [ + 6908.81494140625, + 300140.625, + 335781.1875, + 194737.578125, + 91168.953125 + ], + "bp_grad_norms_per_sample_med": [ + 8.2960639247176e-08, + 2.020572686944888e-08, + 2.0147625789945778e-08, + 2.017927869246705e-08, + 2.0169572678696568e-08 + ], + "bp_grad_norms_F": [ + 1.5067237654875498e-05, + 3.154973455821164e-06, + 2.890229097829433e-06, + 2.8368178845994407e-06, + 2.826985564752249e-06 + ], + "gamma_dfa": 0.0266711818985641, + "acc_eval": 0.125, + "loss_eval": 2.5050950050354004, + "epoch": 4 + }, + { + "hidden_norms": [ + 8695.44140625, + 543316.5625, + 567899.375, + 335584.25, + 145692.765625 + ], + "bp_grad_norms_per_sample_med": [ + 6.380926009796895e-08, + 1.238302882455855e-08, + 1.2337157073716298e-08, + 1.2354545830817187e-08, + 1.2352338707444233e-08 + ], + "bp_grad_norms_F": [ + 1.2898051863885485e-05, + 1.8491266473574797e-06, + 1.7919940091815079e-06, + 1.7602286561668734e-06, + 1.7506840777059551e-06 + ], + "gamma_dfa": 0.022991596721112728, + "acc_eval": 0.115234375, + "loss_eval": 2.5430097579956055, + "epoch": 5 + }, + { + "hidden_norms": [ + 10453.0947265625, + 880568.0625, + 851994.125, + 518617.03125, + 211486.65625 + ], + "bp_grad_norms_per_sample_med": [ + 5.6784926982800243e-08, + 8.739263535062491e-09, + 8.721374733511311e-09, + 8.72691785502866e-09, + 8.722811806194386e-09 + ], + "bp_grad_norms_F": [ + 1.2415013770805672e-05, + 1.2789794254786102e-06, + 1.2444495496310992e-06, + 1.2192489293738618e-06, + 1.2128068647143664e-06 + ], + "gamma_dfa": 0.01671441923826933, + "acc_eval": 0.109375, + "loss_eval": 2.6205759048461914, + "epoch": 6 + }, + { + "hidden_norms": [ + 12133.5908203125, + 1301136.875, + 1213412.0, + 761869.4375, + 299099.96875 + ], + "bp_grad_norms_per_sample_med": [ + 5.181741613569102e-08, + 6.701867505398695e-09, + 6.663806839668496e-09, + 6.668138485821373e-09, + 6.665318963428035e-09 + ], + "bp_grad_norms_F": [ + 1.4586516044801101e-05, + 9.615758926884155e-07, + 9.358571446682618e-07, + 9.15065527351544e-07, + 9.087396506402001e-07 + ], + "gamma_dfa": 0.009791500167921185, + "acc_eval": 0.1103515625, + "loss_eval": 2.687662363052368, + "epoch": 7 + }, + { + "hidden_norms": [ + 13778.3701171875, + 1831990.625, + 1660265.5, + 1070697.0, + 405510.90625 + ], + "bp_grad_norms_per_sample_med": [ + 4.950679510784539e-08, + 5.247439816002952e-09, + 5.240861966626653e-09, + 5.241989065041253e-09, + 5.2364685920736065e-09 + ], + "bp_grad_norms_F": [ + 2.731455424509477e-05, + 7.950770282150188e-07, + 7.47014951230085e-07, + 7.077854888848378e-07, + 7.019767735982896e-07 + ], + "gamma_dfa": 0.002645118860527873, + "acc_eval": 0.1083984375, + "loss_eval": 2.749309539794922, + "epoch": 8 + }, + { + "hidden_norms": [ + 15423.7236328125, + 2441876.0, + 2156981.0, + 1456388.625, + 514814.78125 + ], + "bp_grad_norms_per_sample_med": [ + 4.9704105720138614e-08, + 4.314747670264296e-09, + 4.316281554395118e-09, + 4.3085655043739735e-09, + 4.306641265827693e-09 + ], + "bp_grad_norms_F": [ + 1.53065484482795e-05, + 5.914198482059874e-07, + 5.698148015653715e-07, + 5.564911020883301e-07, + 5.521175125977607e-07 + ], + "gamma_dfa": -0.004648297093808651, + "acc_eval": 0.087890625, + "loss_eval": 2.819417953491211, + "epoch": 9 + }, + { + "hidden_norms": [ + 17014.275390625, + 3299996.25, + 2739406.75, + 1924564.5, + 645257.125 + ], + "bp_grad_norms_per_sample_med": [ + 5.217410503632891e-08, + 3.7931444651917445e-09, + 3.791894354066017e-09, + 3.787997471249582e-09, + 3.786980062869816e-09 + ], + "bp_grad_norms_F": [ + 1.8386483134236187e-05, + 5.170510917196225e-07, + 4.828122541766788e-07, + 4.6214248072828923e-07, + 4.5809062498847197e-07 + ], + "gamma_dfa": -0.008237186702899635, + "acc_eval": 0.0771484375, + "loss_eval": 2.8880226612091064, + "epoch": 10 + }, + { + "hidden_norms": [ + 18615.341796875, + 4327781.5, + 3460663.0, + 2493429.0, + 811358.25 + ], + "bp_grad_norms_per_sample_med": [ + 5.4753250822159316e-08, + 3.4849005903225816e-09, + 3.4845948349016e-09, + 3.4844236385112026e-09, + 3.4833074202822445e-09 + ], + "bp_grad_norms_F": [ + 1.760143095452804e-05, + 4.3398881643952336e-07, + 4.0691622871236177e-07, + 3.9397295381604636e-07, + 3.9136793361649325e-07 + ], + "gamma_dfa": -0.013480214809533209, + "acc_eval": 0.107421875, + "loss_eval": 3.0378975868225098, + "epoch": 11 + }, + { + "hidden_norms": [ + 20197.244140625, + 5361947.0, + 4309913.5, + 3117389.0, + 986810.625 + ], + "bp_grad_norms_per_sample_med": [ + 6.110099803890989e-08, + 3.3039087021791147e-09, + 3.3079554651038734e-09, + 3.309411411578367e-09, + 3.3057334647423886e-09 + ], + "bp_grad_norms_F": [ + 1.7853921235655434e-05, + 3.920526410183811e-07, + 3.4606765098033065e-07, + 3.4065161003127287e-07, + 3.3874636073960573e-07 + ], + "gamma_dfa": -0.017087776213884354, + "acc_eval": 0.1005859375, + "loss_eval": 3.226945161819458, + "epoch": 12 + }, + { + "hidden_norms": [ + 21745.060546875, + 6626533.5, + 5288037.5, + 3845802.25, + 1183958.5 + ], + "bp_grad_norms_per_sample_med": [ + 6.904146232500352e-08, + 3.0698867892198223e-09, + 3.072165188910958e-09, + 3.0722313582032257e-09, + 3.0718891874670362e-09 + ], + "bp_grad_norms_F": [ + 9.694533218862489e-05, + 1.2521383041530498e-06, + 3.6304524542174477e-07, + 3.428452259868209e-07, + 3.3693893897179805e-07 + ], + "gamma_dfa": -0.02254341426305473, + "acc_eval": 0.0888671875, + "loss_eval": 3.4535317420959473, + "epoch": 13 + }, + { + "hidden_norms": [ + 23268.326171875, + 8059270.5, + 6347708.5, + 4634334.0, + 1389795.375 + ], + "bp_grad_norms_per_sample_med": [ + 7.468641882724114e-08, + 3.0219813318410615e-09, + 3.0241904536154607e-09, + 3.0243862969570046e-09, + 3.0241051884871695e-09 + ], + "bp_grad_norms_F": [ + 3.818523691734299e-05, + 3.265660666329495e-07, + 2.885882395275985e-07, + 2.7603223884398176e-07, + 2.7437968697086035e-07 + ], + "gamma_dfa": -0.024787384318187833, + "acc_eval": 0.0830078125, + "loss_eval": 3.7082602977752686, + "epoch": 14 + }, + { + "hidden_norms": [ + 24769.162109375, + 9503637.0, + 7524496.0, + 5577708.5, + 1619056.75 + ], + "bp_grad_norms_per_sample_med": [ + 8.079865665422403e-08, + 2.885043093314721e-09, + 2.8850699607119168e-09, + 2.885329752899679e-09, + 2.885090166770965e-09 + ], + "bp_grad_norms_F": [ + 3.172496144543402e-05, + 2.7863097784575075e-07, + 2.5604617803764995e-07, + 2.4778245233392227e-07, + 2.465397699324967e-07 + ], + "gamma_dfa": -0.028090000618249178, + "acc_eval": 0.09765625, + "loss_eval": 3.9940719604492188, + "epoch": 15 + }, + { + "hidden_norms": [ + 26297.634765625, + 11348280.0, + 8835018.0, + 6709572.0, + 1860997.375 + ], + "bp_grad_norms_per_sample_med": [ + 8.416654395659862e-08, + 2.716076252795574e-09, + 2.708202995194142e-09, + 2.713108182561541e-09, + 2.710037305675428e-09 + ], + "bp_grad_norms_F": [ + 6.21284925728105e-05, + 2.910503269504261e-07, + 2.3999916720640613e-07, + 2.286197116063704e-07, + 2.275272947827034e-07 + ], + "gamma_dfa": -0.0305853869067505, + "acc_eval": 0.10546875, + "loss_eval": 4.280234336853027, + "epoch": 16 + }, + { + "hidden_norms": [ + 27796.267578125, + 13131638.0, + 10275209.0, + 7908104.0, + 2124187.75 + ], + "bp_grad_norms_per_sample_med": [ + 8.618104629931622e-08, + 2.527688947040474e-09, + 2.5195041608583324e-09, + 2.5170519002415404e-09, + 2.5167292694305843e-09 + ], + "bp_grad_norms_F": [ + 2.9607001124531962e-05, + 2.280380755337319e-07, + 2.1368994396198104e-07, + 2.0886261609120993e-07, + 2.0800932531983563e-07 + ], + "gamma_dfa": -0.032157177105546, + "acc_eval": 0.1064453125, + "loss_eval": 4.584749221801758, + "epoch": 17 + }, + { + "hidden_norms": [ + 29261.162109375, + 15093201.0, + 11924527.0, + 9201859.0, + 2398880.25 + ], + "bp_grad_norms_per_sample_med": [ + 8.982802057744266e-08, + 2.362436024583303e-09, + 2.3667561244167246e-09, + 2.3683257577289396e-09, + 2.3661459458423906e-09 + ], + "bp_grad_norms_F": [ + 1.4750239643035457e-05, + 2.0303163239532296e-07, + 1.9652848948226165e-07, + 1.9512303595092817e-07, + 1.9424047081884055e-07 + ], + "gamma_dfa": -0.033276769798249006, + "acc_eval": 0.1064453125, + "loss_eval": 4.833416938781738, + "epoch": 18 + }, + { + "hidden_norms": [ + 30654.640625, + 17198064.0, + 13711921.0, + 10622219.0, + 2733435.75 + ], + "bp_grad_norms_per_sample_med": [ + 9.140238432792103e-08, + 2.218417227695113e-09, + 2.217410255411778e-09, + 2.2205985938938966e-09, + 2.2187365278369953e-09 + ], + "bp_grad_norms_F": [ + 2.2792535673943348e-05, + 2.101570970580724e-07, + 1.8281718894286314e-07, + 1.770977462456358e-07, + 1.7618602043967257e-07 + ], + "gamma_dfa": -0.0334639239590615, + "acc_eval": 0.1064453125, + "loss_eval": 5.091382026672363, + "epoch": 19 + }, + { + "hidden_norms": [ + 32095.28125, + 19561478.0, + 15722807.0, + 12287095.0, + 3104931.75 + ], + "bp_grad_norms_per_sample_med": [ + 9.42815958637766e-08, + 2.0783239573773926e-09, + 2.0685115842411506e-09, + 2.072532145902528e-09, + 2.069893811906809e-09 + ], + "bp_grad_norms_F": [ + 2.035827492363751e-05, + 1.7020983023030567e-07, + 1.504546105479676e-07, + 1.4846344242869236e-07, + 1.4791994829010946e-07 + ], + "gamma_dfa": -0.03437755152117461, + "acc_eval": 0.1044921875, + "loss_eval": 5.338113784790039, + "epoch": 20 + }, + { + "hidden_norms": [ + 33549.3515625, + 22241236.0, + 17865768.0, + 13953577.0, + 3455886.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.694593927633832e-08, + 1.9436505738212873e-09, + 1.932475734989225e-09, + 1.9355790303876574e-09, + 1.9334791545588814e-09 + ], + "bp_grad_norms_F": [ + 1.946108568517957e-05, + 1.476916224874003e-07, + 1.3395830933404795e-07, + 1.3276194010813924e-07, + 1.323410430131844e-07 + ], + "gamma_dfa": -0.035225782776251435, + "acc_eval": 0.1044921875, + "loss_eval": 5.639235496520996, + "epoch": 21 + }, + { + "hidden_norms": [ + 35003.625, + 25199516.0, + 20151382.0, + 15868719.0, + 3834722.75 + ], + "bp_grad_norms_per_sample_med": [ + 9.815706647486877e-08, + 1.8191292916469592e-09, + 1.812876404549968e-09, + 1.8141808055816e-09, + 1.813302730191424e-09 + ], + "bp_grad_norms_F": [ + 1.900309871416539e-05, + 1.3126974351962417e-07, + 1.2148075256845914e-07, + 1.204552404487913e-07, + 1.2008344185687747e-07 + ], + "gamma_dfa": -0.036192891420796514, + "acc_eval": 0.1044921875, + "loss_eval": 5.912903785705566, + "epoch": 22 + }, + { + "hidden_norms": [ + 36385.25390625, + 28323954.0, + 22925044.0, + 17971546.0, + 4269257.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.902030484454372e-08, + 1.6868005880965597e-09, + 1.6695808069400186e-09, + 1.6706477312666834e-09, + 1.6698925575653334e-09 + ], + "bp_grad_norms_F": [ + 1.7624819520278834e-05, + 1.1903176755367895e-07, + 1.1061406013368469e-07, + 1.0976869191381411e-07, + 1.094643096166692e-07 + ], + "gamma_dfa": -0.037227407563477755, + "acc_eval": 0.1044921875, + "loss_eval": 6.16106653213501, + "epoch": 23 + }, + { + "hidden_norms": [ + 37805.91796875, + 31593894.0, + 25615532.0, + 20113868.0, + 4713793.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.859636662667981e-08, + 1.5704177958042465e-09, + 1.5608032644109926e-09, + 1.5628717209281717e-09, + 1.5616322679434802e-09 + ], + "bp_grad_norms_F": [ + 1.6187867004191503e-05, + 1.0865824151551351e-07, + 1.0160825070215651e-07, + 1.008768109045377e-07, + 1.0061884125889264e-07 + ], + "gamma_dfa": -0.03782000340288505, + "acc_eval": 0.1044921875, + "loss_eval": 6.406368732452393, + "epoch": 24 + }, + { + "hidden_norms": [ + 39138.39453125, + 34956036.0, + 28542170.0, + 22404560.0, + 5139918.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.837745551521948e-08, + 1.4733757547347182e-09, + 1.4583911855936549e-09, + 1.4602866693635974e-09, + 1.4591743369152255e-09 + ], + "bp_grad_norms_F": [ + 1.768167749105487e-05, + 1.015666910575419e-07, + 9.354967289709748e-08, + 9.288694968745403e-08, + 9.264899603067533e-08 + ], + "gamma_dfa": -0.03860464284662157, + "acc_eval": 0.1044921875, + "loss_eval": 6.634061813354492, + "epoch": 25 + }, + { + "hidden_norms": [ + 40505.18359375, + 38650996.0, + 31492410.0, + 24792780.0, + 5620949.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.942911560756329e-08, + 1.3685884647784974e-09, + 1.3593203229689266e-09, + 1.3602377002541743e-09, + 1.3594056991195202e-09 + ], + "bp_grad_norms_F": [ + 2.0700817913166247e-05, + 9.837697945158652e-08, + 8.757055525165924e-08, + 8.689728048238976e-08, + 8.669941564676265e-08 + ], + "gamma_dfa": -0.03959248901810497, + "acc_eval": 0.1044921875, + "loss_eval": 6.7737202644348145, + "epoch": 26 + }, + { + "hidden_norms": [ + 41849.203125, + 42830568.0, + 34648896.0, + 27355716.0, + 6044684.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.865106420647862e-08, + 1.28658228515377e-09, + 1.2788612391290144e-09, + 1.2804906024399543e-09, + 1.2795147164013088e-09 + ], + "bp_grad_norms_F": [ + 2.3165159291238524e-05, + 9.389359689748744e-08, + 8.146788132989968e-08, + 8.082054137048544e-08, + 8.063241097033824e-08 + ], + "gamma_dfa": -0.040185014018788934, + "acc_eval": 0.1044921875, + "loss_eval": 6.946921348571777, + "epoch": 27 + }, + { + "hidden_norms": [ + 43129.56640625, + 47054352.0, + 37982196.0, + 29955390.0, + 6540964.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0036384878731042e-07, + 1.2043249730808725e-09, + 1.2007507210753943e-09, + 1.2010574756970982e-09, + 1.2009065963880516e-09 + ], + "bp_grad_norms_F": [ + 2.413927359157242e-05, + 8.847878518736252e-08, + 7.592807094169984e-08, + 7.532069901117211e-08, + 7.515143352065934e-08 + ], + "gamma_dfa": -0.04085268918424845, + "acc_eval": 0.1044921875, + "loss_eval": 7.133134841918945, + "epoch": 28 + }, + { + "hidden_norms": [ + 44368.93359375, + 51374800.0, + 41470788.0, + 32761826.0, + 6998702.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.0049345178231306e-07, + 1.1348291195645288e-09, + 1.132080207355557e-09, + 1.1335333782724888e-09, + 1.1326910520637057e-09 + ], + "bp_grad_norms_F": [ + 2.53067773883231e-05, + 8.518416905189952e-08, + 7.111059119324636e-08, + 7.048716810231781e-08, + 7.034290661067644e-08 + ], + "gamma_dfa": -0.04143569804728031, + "acc_eval": 0.1044921875, + "loss_eval": 7.306489944458008, + "epoch": 29 + }, + { + "hidden_norms": [ + 45540.84375, + 55799284.0, + 44925840.0, + 35576004.0, + 7506460.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.999683214800825e-08, + 1.0682152939978096e-09, + 1.0609697564945009e-09, + 1.0612235534779302e-09, + 1.0610903267149752e-09 + ], + "bp_grad_norms_F": [ + 1.843971222115215e-05, + 8.002744067425738e-08, + 6.616264869307997e-08, + 6.571565336344065e-08, + 6.558265397416108e-08 + ], + "gamma_dfa": -0.04231115654692985, + "acc_eval": 0.1044921875, + "loss_eval": 7.393707752227783, + "epoch": 30 + }, + { + "hidden_norms": [ + 46740.3125, + 60156548.0, + 48609568.0, + 38622656.0, + 7923887.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.801681954968444e-08, + 1.007545269438026e-09, + 1.0030560826379542e-09, + 1.0032202846232963e-09, + 1.003132132915141e-09 + ], + "bp_grad_norms_F": [ + 2.0189601855236106e-05, + 7.754985631436284e-08, + 6.295730514693787e-08, + 6.247479689136526e-08, + 6.235500649154346e-08 + ], + "gamma_dfa": -0.042783402430359274, + "acc_eval": 0.1044921875, + "loss_eval": 7.513785362243652, + "epoch": 31 + }, + { + "hidden_norms": [ + 47946.2578125, + 65027368.0, + 52475872.0, + 41636652.0, + 8527125.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.764004715862029e-08, + 9.540165324395389e-10, + 9.49443301756503e-10, + 9.49665124316823e-10, + 9.49536671512874e-10 + ], + "bp_grad_norms_F": [ + 2.2026428268873133e-05, + 7.400986135053245e-08, + 5.9516974459938865e-08, + 5.903561017817083e-08, + 5.892941956631148e-08 + ], + "gamma_dfa": -0.04377710592234507, + "acc_eval": 0.1044921875, + "loss_eval": 7.666411876678467, + "epoch": 32 + }, + { + "hidden_norms": [ + 49101.84765625, + 70129512.0, + 56707888.0, + 44883068.0, + 9051192.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.715147086808429e-08, + 9.088669261636539e-10, + 8.977363297191232e-10, + 8.978853771601791e-10, + 8.978119914182514e-10 + ], + "bp_grad_norms_F": [ + 2.6852110750041902e-05, + 7.312536354220356e-08, + 5.6589971819676066e-08, + 5.605170372291468e-08, + 5.593761187583368e-08 + ], + "gamma_dfa": -0.04420170868979767, + "acc_eval": 0.1044921875, + "loss_eval": 7.917013645172119, + "epoch": 33 + }, + { + "hidden_norms": [ + 50205.94921875, + 75218112.0, + 61038472.0, + 48316120.0, + 9560446.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.637748377144817e-08, + 8.535361861738977e-10, + 8.499229653402551e-10, + 8.501254145087955e-10, + 8.500238846131936e-10 + ], + "bp_grad_norms_F": [ + 2.704818507481832e-05, + 6.82247573990935e-08, + 5.427460791906924e-08, + 5.371628120087735e-08, + 5.360957899824825e-08 + ], + "gamma_dfa": -0.0447281262895558, + "acc_eval": 0.1064453125, + "loss_eval": 7.9629034996032715, + "epoch": 34 + }, + { + "hidden_norms": [ + 51283.7109375, + 79971480.0, + 65131160.0, + 51675436.0, + 10150061.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.52169543211312e-08, + 8.244336879847936e-10, + 8.130549011831079e-10, + 8.13186962211887e-10, + 8.13120237808107e-10 + ], + "bp_grad_norms_F": [ + 3.043289871129673e-05, + 6.438099831029831e-08, + 5.208626419062057e-08, + 5.1470838258182994e-08, + 5.136259773053098e-08 + ], + "gamma_dfa": -0.04496103324345313, + "acc_eval": 0.1064453125, + "loss_eval": 8.225072860717773, + "epoch": 35 + }, + { + "hidden_norms": [ + 52391.31640625, + 85212368.0, + 69690088.0, + 54922688.0, + 10724330.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.460915606496201e-08, + 7.854291661502089e-10, + 7.73968722445062e-10, + 7.748673369611936e-10, + 7.740979524051284e-10 + ], + "bp_grad_norms_F": [ + 3.253111935919151e-05, + 6.160666288224093e-08, + 5.0236756976573815e-08, + 4.957355770329741e-08, + 4.9483450226261994e-08 + ], + "gamma_dfa": -0.04545678128488362, + "acc_eval": 0.103515625, + "loss_eval": 8.447563171386719, + "epoch": 36 + }, + { + "hidden_norms": [ + 53471.4609375, + 90755416.0, + 74424576.0, + 58527500.0, + 11383908.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.481268392619313e-08, + 7.485803088513876e-10, + 7.380538402657066e-10, + 7.38905825414804e-10, + 7.384990952097326e-10 + ], + "bp_grad_norms_F": [ + 2.8782606023014523e-05, + 5.679364178945434e-08, + 4.747649740011184e-08, + 4.686737042902678e-08, + 4.6776307272011763e-08 + ], + "gamma_dfa": -0.04577424196759239, + "acc_eval": 0.10546875, + "loss_eval": 8.63510513305664, + "epoch": 37 + }, + { + "hidden_norms": [ + 54526.26171875, + 96224200.0, + 79402688.0, + 62338148.0, + 11946441.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.414058155243765e-08, + 7.102119448099131e-10, + 7.013249980758474e-10, + 7.021335179935306e-10, + 7.017796899155826e-10 + ], + "bp_grad_norms_F": [ + 2.6797888494911604e-05, + 5.262990754317798e-08, + 4.363804251283909e-08, + 4.31665583278118e-08, + 4.308598633429028e-08 + ], + "gamma_dfa": -0.04641679968335666, + "acc_eval": 0.10546875, + "loss_eval": 8.730607986450195, + "epoch": 38 + }, + { + "hidden_norms": [ + 55583.125, + 101480040.0, + 83697192.0, + 66218348.0, + 12538905.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.47181035826361e-08, + 6.868624002898116e-10, + 6.774021343858294e-10, + 6.77987721520168e-10, + 6.776118000040299e-10 + ], + "bp_grad_norms_F": [ + 2.6024237740784883e-05, + 5.0800426976138624e-08, + 4.1874233858152365e-08, + 4.15037817447228e-08, + 4.1430755715055056e-08 + ], + "gamma_dfa": -0.04637146886670962, + "acc_eval": 0.10546875, + "loss_eval": 8.87772274017334, + "epoch": 39 + }, + { + "hidden_norms": [ + 56556.95703125, + 107073544.0, + 88369376.0, + 69716112.0, + 13102132.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.377198040283474e-08, + 6.585805234493591e-10, + 6.487251291709129e-10, + 6.49616194170477e-10, + 6.491358561788729e-10 + ], + "bp_grad_norms_F": [ + 3.484269473119639e-05, + 7.467966156582406e-08, + 4.40217604591453e-08, + 4.3712645947380224e-08, + 4.352901683546406e-08 + ], + "gamma_dfa": -0.04681209813861642, + "acc_eval": 0.10546875, + "loss_eval": 9.053573608398438, + "epoch": 40 + }, + { + "hidden_norms": [ + 57504.6875, + 113131968.0, + 93389736.0, + 73651392.0, + 13735091.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.427740366163562e-08, + 6.312518285866986e-10, + 6.225254756131449e-10, + 6.232416249751793e-10, + 6.229293747495035e-10 + ], + "bp_grad_norms_F": [ + 0.00021013167861383408, + 5.526797508537129e-07, + 5.349095744122678e-08, + 4.9017671699402854e-08, + 4.773081840880877e-08 + ], + "gamma_dfa": -0.047232568118488416, + "acc_eval": 0.10546875, + "loss_eval": 9.214558601379395, + "epoch": 41 + }, + { + "hidden_norms": [ + 58472.46875, + 118762648.0, + 98279872.0, + 77365656.0, + 14248840.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.310819137908766e-08, + 6.046827483174866e-10, + 5.995566820793385e-10, + 6.004566288630997e-10, + 5.99891414321263e-10 + ], + "bp_grad_norms_F": [ + 0.00010149624722544104, + 2.533984684305324e-07, + 4.4013567901401984e-08, + 4.291897326424987e-08, + 4.2505401864900705e-08 + ], + "gamma_dfa": -0.04764813384099398, + "acc_eval": 0.1044921875, + "loss_eval": 9.217700958251953, + "epoch": 42 + }, + { + "hidden_norms": [ + 59401.03125, + 124607344.0, + 103250600.0, + 81130456.0, + 14810775.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.245275833791311e-08, + 5.824435378443127e-10, + 5.769146271816794e-10, + 5.777631706394004e-10, + 5.772260447400868e-10 + ], + "bp_grad_norms_F": [ + 4.0584909584140405e-05, + 9.203435524796078e-08, + 3.4605545096155765e-08, + 3.4145575256161464e-08, + 3.4092256129270027e-08 + ], + "gamma_dfa": -0.04794895404484123, + "acc_eval": 0.1064453125, + "loss_eval": 9.390031814575195, + "epoch": 43 + }, + { + "hidden_norms": [ + 60278.7890625, + 130581952.0, + 108096264.0, + 85136336.0, + 15405965.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.3390447375441e-08, + 5.630300670134147e-10, + 5.5805338128323e-10, + 5.588779439236191e-10, + 5.583465911840335e-10 + ], + "bp_grad_norms_F": [ + 4.781157258548774e-05, + 1.0881421275144021e-07, + 3.3062310222931046e-08, + 3.248984370429753e-08, + 3.2446724418377926e-08 + ], + "gamma_dfa": -0.04778411969891749, + "acc_eval": 0.10546875, + "loss_eval": 9.621635437011719, + "epoch": 44 + }, + { + "hidden_norms": [ + 61138.51171875, + 136691760.0, + 113402280.0, + 88772512.0, + 15993850.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.273151135857916e-08, + 5.43037670386326e-10, + 5.421059157129093e-10, + 5.42630551603196e-10, + 5.423762550194056e-10 + ], + "bp_grad_norms_F": [ + 2.6410325517645106e-05, + 4.767177586018079e-08, + 3.172428364450752e-08, + 3.129938974666402e-08, + 3.1260690036560845e-08 + ], + "gamma_dfa": -0.04829322246951051, + "acc_eval": 0.099609375, + "loss_eval": 9.733180046081543, + "epoch": 45 + }, + { + "hidden_norms": [ + 61988.87890625, + 142480176.0, + 118613440.0, + 92755400.0, + 16660659.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.238209486284177e-08, + 5.250901380371431e-10, + 5.242600242816309e-10, + 5.243941947341568e-10, + 5.243331879789537e-10 + ], + "bp_grad_norms_F": [ + 2.4320243028341793e-05, + 4.237628559167206e-08, + 3.048009489248216e-08, + 3.0116801497115375e-08, + 3.0080638424578865e-08 + ], + "gamma_dfa": -0.048452052724314854, + "acc_eval": 0.0986328125, + "loss_eval": 9.875200271606445, + "epoch": 46 + }, + { + "hidden_norms": [ + 62831.0078125, + 148088512.0, + 124018112.0, + 96570944.0, + 17294454.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.218231866725546e-08, + 5.094495381108288e-10, + 5.088939269981552e-10, + 5.090234345139777e-10, + 5.089637600264041e-10 + ], + "bp_grad_norms_F": [ + 2.273459904245101e-05, + 3.8132583313199575e-08, + 2.9463127049211835e-08, + 2.9154062275438264e-08, + 2.9119732403160015e-08 + ], + "gamma_dfa": -0.04870791392750107, + "acc_eval": 0.1015625, + "loss_eval": 9.965906143188477, + "epoch": 47 + }, + { + "hidden_norms": [ + 63619.36328125, + 153924256.0, + 129021120.0, + 100401856.0, + 17813234.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.170297232685698e-08, + 4.942196096813234e-10, + 4.92394736095747e-10, + 4.925179708514804e-10, + 4.924622931667955e-10 + ], + "bp_grad_norms_F": [ + 2.1741494492744096e-05, + 3.567927819858596e-08, + 2.843704471899855e-08, + 2.816011068773605e-08, + 2.812711485944419e-08 + ], + "gamma_dfa": -0.049255506150075234, + "acc_eval": 0.1025390625, + "loss_eval": 9.984619140625, + "epoch": 48 + }, + { + "hidden_norms": [ + 64400.26171875, + 159789408.0, + 134080160.0, + 104244408.0, + 18432430.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.070604534144877e-08, + 4.78996176056512e-10, + 4.780518758629171e-10, + 4.781712803492155e-10, + 4.781176565771261e-10 + ], + "bp_grad_norms_F": [ + 2.1263931557768956e-05, + 3.437593676380857e-08, + 2.7499025279098532e-08, + 2.7248480805042163e-08, + 2.7216600528845447e-08 + ], + "gamma_dfa": -0.04910894545173505, + "acc_eval": 0.0986328125, + "loss_eval": 10.146781921386719, + "epoch": 49 + }, + { + "hidden_norms": [ + 65147.40234375, + 165462976.0, + 138862000.0, + 107834176.0, + 19038348.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.061706407464953e-08, + 4.668093134263529e-10, + 4.645184237261901e-10, + 4.6463269343099967e-10, + 4.6457995783732997e-10 + ], + "bp_grad_norms_F": [ + 2.0052335457876325e-05, + 3.337338227993314e-08, + 2.6690587517919084e-08, + 2.646976504649956e-08, + 2.64381352366172e-08 + ], + "gamma_dfa": -0.04920872090588091, + "acc_eval": 0.0966796875, + "loss_eval": 10.281063079833984, + "epoch": 50 + }, + { + "hidden_norms": [ + 65863.96875, + 171261072.0, + 143810992.0, + 111834848.0, + 19625576.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.099313302840528e-08, + 4.5625103695101643e-10, + 4.524729202426414e-10, + 4.5258219394384014e-10, + 4.5253126246258546e-10 + ], + "bp_grad_norms_F": [ + 1.9101036741631106e-05, + 3.2813989747637606e-08, + 2.5957119120789685e-08, + 2.5756730082093782e-08, + 2.572607549211625e-08 + ], + "gamma_dfa": -0.04933306630846346, + "acc_eval": 0.0986328125, + "loss_eval": 10.349817276000977, + "epoch": 51 + }, + { + "hidden_norms": [ + 66593.8203125, + 176983552.0, + 149183712.0, + 115646976.0, + 20178866.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.1175948568889e-08, + 4.444306589412861e-10, + 4.412468168624173e-10, + 4.4135325949490323e-10, + 4.413052423490882e-10 + ], + "bp_grad_norms_F": [ + 1.852569039328955e-05, + 3.21252677792927e-08, + 2.5265682879194173e-08, + 2.5077683929453087e-08, + 2.5048496610224902e-08 + ], + "gamma_dfa": -0.04927207152650226, + "acc_eval": 0.1015625, + "loss_eval": 10.515829086303711, + "epoch": 52 + }, + { + "hidden_norms": [ + 67302.6328125, + 182834976.0, + 154352272.0, + 119312168.0, + 20747826.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.146700818973841e-08, + 4.3625753010090307e-10, + 4.31810531775767e-10, + 4.319128388274862e-10, + 4.3186304532483177e-10 + ], + "bp_grad_norms_F": [ + 1.817524571379181e-05, + 3.176044671704403e-08, + 2.468624060725233e-08, + 2.4515436791716638e-08, + 2.4487377459081472e-08 + ], + "gamma_dfa": -0.04947220539179398, + "acc_eval": 0.1015625, + "loss_eval": 10.631593704223633, + "epoch": 53 + }, + { + "hidden_norms": [ + 67943.6640625, + 188557808.0, + 159066528.0, + 122911296.0, + 21287842.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.120569188780792e-08, + 4.2657519183642023e-10, + 4.219723181986268e-10, + 4.220687410683155e-10, + 4.220172822311241e-10 + ], + "bp_grad_norms_F": [ + 1.8009301129495725e-05, + 3.077772348092367e-08, + 2.4100344830912945e-08, + 2.3935520232498675e-08, + 2.390864395351855e-08 + ], + "gamma_dfa": -0.04969306073326152, + "acc_eval": 0.1025390625, + "loss_eval": 10.66339111328125, + "epoch": 54 + }, + { + "hidden_norms": [ + 68579.2578125, + 193996528.0, + 163940560.0, + 126448000.0, + 21766094.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.058499728098468e-08, + 4.1539605089013776e-10, + 4.1060946309734447e-10, + 4.1091324787245753e-10, + 4.10790096383451e-10 + ], + "bp_grad_norms_F": [ + 1.5884443200775422e-05, + 2.8224185655290057e-08, + 2.346608596326405e-08, + 2.3316024666542035e-08, + 2.328991399735969e-08 + ], + "gamma_dfa": -0.04980730817624135, + "acc_eval": 0.0986328125, + "loss_eval": 10.783552169799805, + "epoch": 55 + }, + { + "hidden_norms": [ + 69203.796875, + 199460144.0, + 168890016.0, + 129780784.0, + 22302874.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.078585350152935e-08, + 4.0699738024230214e-10, + 4.025394462203735e-10, + 4.0283623659043144e-10, + 4.027146949248106e-10 + ], + "bp_grad_norms_F": [ + 1.5867637557676062e-05, + 2.8422073583556084e-08, + 2.300496149132414e-08, + 2.2864167448233275e-08, + 2.2838495539190262e-08 + ], + "gamma_dfa": -0.04992603903519921, + "acc_eval": 0.09765625, + "loss_eval": 10.859743118286133, + "epoch": 56 + }, + { + "hidden_norms": [ + 69791.453125, + 204736432.0, + 173582192.0, + 133232672.0, + 22820996.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.066331330132016e-08, + 3.96910615485524e-10, + 3.925613167865549e-10, + 3.926495240058614e-10, + 3.9260561468523747e-10 + ], + "bp_grad_norms_F": [ + 1.4505669241771102e-05, + 2.6905636829610557e-08, + 2.2510086239435623e-08, + 2.2376122288392253e-08, + 2.235119467286495e-08 + ], + "gamma_dfa": -0.04994637455092743, + "acc_eval": 0.0986328125, + "loss_eval": 10.989320755004883, + "epoch": 57 + }, + { + "hidden_norms": [ + 70371.9375, + 210191472.0, + 178149376.0, + 136544128.0, + 23324878.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.057572469828301e-08, + 3.849987550985645e-10, + 3.8476868913228657e-10, + 3.8500982957323515e-10, + 3.8497979804041904e-10 + ], + "bp_grad_norms_F": [ + 1.4466082575381733e-05, + 2.6583837353655326e-08, + 2.2064293503376575e-08, + 2.1934541294399423e-08, + 2.191077008717457e-08 + ], + "gamma_dfa": -0.05017502269765828, + "acc_eval": 0.1015625, + "loss_eval": 11.14348030090332, + "epoch": 58 + }, + { + "hidden_norms": [ + 70926.1171875, + 215072384.0, + 182463952.0, + 139682864.0, + 23765930.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.095985831208964e-08, + 3.789666913611711e-10, + 3.7876501934874796e-10, + 3.788162006301832e-10, + 3.7878628011966953e-10 + ], + "bp_grad_norms_F": [ + 1.5613211871823296e-05, + 2.6332656943850452e-08, + 2.168836488181114e-08, + 2.1559124263603735e-08, + 2.1535397465299866e-08 + ], + "gamma_dfa": -0.05026113349595107, + "acc_eval": 0.1015625, + "loss_eval": 11.245050430297852, + "epoch": 59 + }, + { + "hidden_norms": [ + 71444.5078125, + 220139504.0, + 186860912.0, + 142962752.0, + 24235874.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.007455048504198e-08, + 3.741315868222017e-10, + 3.7062136692966874e-10, + 3.705513118568149e-10, + 3.7064074032144845e-10 + ], + "bp_grad_norms_F": [ + 2.3456123017240316e-05, + 2.666844878262964e-08, + 2.1298749430798125e-08, + 2.1137482875133173e-08, + 2.1113727655119874e-08 + ], + "gamma_dfa": -0.050498483098635916, + "acc_eval": 0.095703125, + "loss_eval": 11.284198760986328, + "epoch": 60 + }, + { + "hidden_norms": [ + 71960.484375, + 225013808.0, + 190973296.0, + 145961232.0, + 24784322.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.034386749817713e-08, + 3.658137681661344e-10, + 3.6446287654534615e-10, + 3.645108936911612e-10, + 3.6448208340367216e-10 + ], + "bp_grad_norms_F": [ + 2.785225660772994e-05, + 2.5983931450923592e-08, + 2.1029784136317176e-08, + 2.0842044534674642e-08, + 2.0818688994950207e-08 + ], + "gamma_dfa": -0.05046346641029231, + "acc_eval": 0.0986328125, + "loss_eval": 11.392132759094238, + "epoch": 61 + }, + { + "hidden_norms": [ + 72430.8359375, + 229851040.0, + 195010560.0, + 149020912.0, + 25253220.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.096932984675732e-08, + 3.608093823714853e-10, + 3.5983932500371907e-10, + 3.600989784136033e-10, + 3.599919529140294e-10 + ], + "bp_grad_norms_F": [ + 2.763499469438102e-05, + 2.5544034443214514e-08, + 2.0638090347802063e-08, + 2.0451848214975143e-08, + 2.0428588598520037e-08 + ], + "gamma_dfa": -0.050787233689334244, + "acc_eval": 0.091796875, + "loss_eval": 11.378694534301758, + "epoch": 62 + }, + { + "hidden_norms": [ + 72896.0234375, + 234300800.0, + 198948976.0, + 152100720.0, + 25625868.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.0542243924574e-08, + 3.557290573219518e-10, + 3.5249042573681777e-10, + 3.5253552854719317e-10, + 3.5250652397067483e-10 + ], + "bp_grad_norms_F": [ + 2.9849852580809966e-05, + 2.5036932527200406e-08, + 2.0406586642707225e-08, + 2.020845712991104e-08, + 2.0186647020636883e-08 + ], + "gamma_dfa": -0.05070546226488659, + "acc_eval": 0.095703125, + "loss_eval": 11.479286193847656, + "epoch": 63 + }, + { + "hidden_norms": [ + 73328.34375, + 238316288.0, + 202586032.0, + 155039648.0, + 26024600.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.105094989081408e-08, + 3.510710333554101e-10, + 3.495781997209235e-10, + 3.500161271929869e-10, + 3.499118772509746e-10 + ], + "bp_grad_norms_F": [ + 2.91574870061595e-05, + 2.4413550292479158e-08, + 2.0145231260926266e-08, + 1.9952185681404444e-08, + 1.9931007955165114e-08 + ], + "gamma_dfa": -0.05086314045183826, + "acc_eval": 0.0908203125, + "loss_eval": 11.489895820617676, + "epoch": 64 + }, + { + "hidden_norms": [ + 73748.5859375, + 242733616.0, + 206386528.0, + 157821696.0, + 26465746.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.082241803071156e-08, + 3.460224329288053e-10, + 3.438662687926808e-10, + 3.4428762618610165e-10, + 3.442592599878225e-10 + ], + "bp_grad_norms_F": [ + 2.8733484214171767e-05, + 2.375874608162576e-08, + 1.9914560667189107e-08, + 1.971613627915758e-08, + 1.969561402859199e-08 + ], + "gamma_dfa": -0.05102878155594226, + "acc_eval": 0.0888671875, + "loss_eval": 11.548040390014648, + "epoch": 65 + }, + { + "hidden_norms": [ + 74135.421875, + 246595824.0, + 209988560.0, + 160289792.0, + 26835076.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.098909714566616e-08, + 3.4202959908746777e-10, + 3.378679835908116e-10, + 3.3727598491850586e-10, + 3.370834167348846e-10 + ], + "bp_grad_norms_F": [ + 2.7568949008127674e-05, + 2.2366455354472237e-08, + 1.9751842827986366e-08, + 1.955501183203978e-08, + 1.9534347472927038e-08 + ], + "gamma_dfa": -0.05096771135140443, + "acc_eval": 0.091796875, + "loss_eval": 11.69294548034668, + "epoch": 66 + }, + { + "hidden_norms": [ + 74519.4609375, + 250496496.0, + 213470016.0, + 163034096.0, + 27224026.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.081137619659785e-08, + 3.371838919186132e-10, + 3.34856059547306e-10, + 3.351785793359596e-10, + 3.353441968556581e-10 + ], + "bp_grad_norms_F": [ + 2.4417575332336128e-05, + 2.182440006492925e-08, + 1.9469752032819088e-08, + 1.9279319474208023e-08, + 1.925921822021337e-08 + ], + "gamma_dfa": -0.051001671119593084, + "acc_eval": 0.0888671875, + "loss_eval": 11.729022026062012, + "epoch": 67 + }, + { + "hidden_norms": [ + 74894.3515625, + 254264416.0, + 216871648.0, + 165452496.0, + 27605496.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.085709962164401e-08, + 3.3377053898497877e-10, + 3.3198219173691257e-10, + 3.3151825729049733e-10, + 3.3171596025560746e-10 + ], + "bp_grad_norms_F": [ + 2.2483380234916694e-05, + 2.14983302271321e-08, + 1.9263785233647468e-08, + 1.9080003355043118e-08, + 1.9060196976283805e-08 + ], + "gamma_dfa": -0.050941091212735046, + "acc_eval": 0.087890625, + "loss_eval": 11.798931121826172, + "epoch": 68 + }, + { + "hidden_norms": [ + 75242.4609375, + 257808672.0, + 219912720.0, + 167826688.0, + 27928376.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.091576913533572e-08, + 3.2881539158147177e-10, + 3.263028736100182e-10, + 3.2664609905808106e-10, + 3.264644665712524e-10 + ], + "bp_grad_norms_F": [ + 2.127209518221207e-05, + 2.0985540416518234e-08, + 1.9050151678356997e-08, + 1.8875326190936903e-08, + 1.8856361805319466e-08 + ], + "gamma_dfa": -0.05089846828195732, + "acc_eval": 0.091796875, + "loss_eval": 11.895479202270508, + "epoch": 69 + }, + { + "hidden_norms": [ + 75572.1171875, + 261119824.0, + 222742832.0, + 169876672.0, + 28198556.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.057247041255323e-08, + 3.278008420259937e-10, + 3.249100710700503e-10, + 3.242202339936995e-10, + 3.244049195938459e-10 + ], + "bp_grad_norms_F": [ + 1.884793528006412e-05, + 2.07159356335751e-08, + 1.889556244805135e-08, + 1.8724394479363582e-08, + 1.8705017978959404e-08 + ], + "gamma_dfa": -0.05079331841261592, + "acc_eval": 0.0888671875, + "loss_eval": 11.890766143798828, + "epoch": 70 + }, + { + "hidden_norms": [ + 75874.0546875, + 264210176.0, + 225470416.0, + 172025616.0, + 28547836.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.025038849586053e-08, + 3.2404043337486144e-10, + 3.204363163700208e-10, + 3.2077221434612113e-10, + 3.205906651260193e-10 + ], + "bp_grad_norms_F": [ + 1.7337119061267003e-05, + 2.020676426184309e-08, + 1.872472488173571e-08, + 1.8554693781425158e-08, + 1.853570097409829e-08 + ], + "gamma_dfa": -0.05096161225810647, + "acc_eval": 0.0849609375, + "loss_eval": 11.900531768798828, + "epoch": 71 + }, + { + "hidden_norms": [ + 76155.671875, + 267008752.0, + 228187344.0, + 173959248.0, + 28788394.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.046407711821303e-08, + 3.195448350368224e-10, + 3.1774499698045133e-10, + 3.1807836919917065e-10, + 3.179001784037183e-10 + ], + "bp_grad_norms_F": [ + 1.667224569246173e-05, + 2.00564560515204e-08, + 1.8585067707022063e-08, + 1.8417832592376726e-08, + 1.8399065382368462e-08 + ], + "gamma_dfa": -0.05094757055485388, + "acc_eval": 0.087890625, + "loss_eval": 11.944206237792969, + "epoch": 72 + }, + { + "hidden_norms": [ + 76421.0625, + 269839616.0, + 230674688.0, + 175791728.0, + 29094570.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.012642010475247e-08, + 3.166587547731581e-10, + 3.1469221672963954e-10, + 3.1502128683413844e-10, + 3.1484426177286196e-10 + ], + "bp_grad_norms_F": [ + 1.6745894754421897e-05, + 1.9875857404372255e-08, + 1.840698438115851e-08, + 1.8240543298020384e-08, + 1.822207096324746e-08 + ], + "gamma_dfa": -0.05100561307335738, + "acc_eval": 0.0859375, + "loss_eval": 11.99311637878418, + "epoch": 73 + }, + { + "hidden_norms": [ + 76664.2734375, + 272336768.0, + 232959216.0, + 177609664.0, + 29323556.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.990726030333462e-08, + 3.1504263087178686e-10, + 3.12906783817013e-10, + 3.131215564611267e-10, + 3.1305841252660116e-10 + ], + "bp_grad_norms_F": [ + 1.6934929590206593e-05, + 1.98417797747652e-08, + 1.8281056668456586e-08, + 1.8116447009219883e-08, + 1.8098068821359448e-08 + ], + "gamma_dfa": -0.05103835645422805, + "acc_eval": 0.0849609375, + "loss_eval": 12.02127456665039, + "epoch": 74 + }, + { + "hidden_norms": [ + 76888.4921875, + 274732928.0, + 235060816.0, + 179132768.0, + 29504610.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.986659594256707e-08, + 3.121746194878483e-10, + 3.1075714224115814e-10, + 3.1084415597071313e-10, + 3.1076746731528715e-10 + ], + "bp_grad_norms_F": [ + 1.7154834495158866e-05, + 1.9609577961432478e-08, + 1.816025729795001e-08, + 1.7994944201404905e-08, + 1.7976633515104368e-08 + ], + "gamma_dfa": -0.05099774348491337, + "acc_eval": 0.083984375, + "loss_eval": 12.060166358947754, + "epoch": 75 + }, + { + "hidden_norms": [ + 77091.2421875, + 277045280.0, + 237230640.0, + 180794320.0, + 29739022.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.99742147453253e-08, + 3.103251822178521e-10, + 3.08925968139917e-10, + 3.089623279439735e-10, + 3.0893596014713864e-10 + ], + "bp_grad_norms_F": [ + 1.679581509961281e-05, + 1.951891448470633e-08, + 1.803828730828627e-08, + 1.787446990419994e-08, + 1.785628889194868e-08 + ], + "gamma_dfa": -0.050966299066203646, + "acc_eval": 0.087890625, + "loss_eval": 12.12912654876709, + "epoch": 76 + }, + { + "hidden_norms": [ + 77280.328125, + 279085056.0, + 239194416.0, + 182229856.0, + 29919720.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.955728958426334e-08, + 3.0862179478674534e-10, + 3.06326686239089e-10, + 3.067510134791007e-10, + 3.0670044282032904e-10 + ], + "bp_grad_norms_F": [ + 1.6653601051075384e-05, + 1.913345748505435e-08, + 1.7934322471546693e-08, + 1.7773432503531694e-08, + 1.7755372283545512e-08 + ], + "gamma_dfa": -0.050885657081380486, + "acc_eval": 0.0888671875, + "loss_eval": 12.196252822875977, + "epoch": 77 + }, + { + "hidden_norms": [ + 77464.84375, + 281044160.0, + 241080400.0, + 183481632.0, + 30118970.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.968549281007654e-08, + 3.077238464044285e-10, + 3.0509625381647254e-10, + 3.05251185439559e-10, + 3.0514471505149743e-10 + ], + "bp_grad_norms_F": [ + 1.6696472812327556e-05, + 1.9041245025164244e-08, + 1.7839029808897067e-08, + 1.767946500308426e-08, + 1.766149004822637e-08 + ], + "gamma_dfa": -0.05102008958783699, + "acc_eval": 0.0888671875, + "loss_eval": 12.193323135375977, + "epoch": 78 + }, + { + "hidden_norms": [ + 77630.7734375, + 282858400.0, + 242823728.0, + 184645696.0, + 30321804.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.95526710564809e-08, + 3.0606236989250135e-10, + 3.0359312286343254e-10, + 3.0362826142216193e-10, + 3.0360203240320516e-10 + ], + "bp_grad_norms_F": [ + 1.670894562266767e-05, + 1.8970476745039377e-08, + 1.7750505065805555e-08, + 1.7592398648957897e-08, + 1.7574748767401616e-08 + ], + "gamma_dfa": -0.05112272154656239, + "acc_eval": 0.087890625, + "loss_eval": 12.226293563842773, + "epoch": 79 + }, + { + "hidden_norms": [ + 77779.6484375, + 284380192.0, + 244252416.0, + 185749600.0, + 30452270.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.966701159351942e-08, + 3.0471447587387956e-10, + 3.022795902474229e-10, + 3.0231497860633283e-10, + 3.022894989879177e-10 + ], + "bp_grad_norms_F": [ + 1.6740978026064113e-05, + 1.889440781610574e-08, + 1.7666355489609487e-08, + 1.7510158656364183e-08, + 1.749260469807723e-08 + ], + "gamma_dfa": -0.05107468220376177, + "acc_eval": 0.0888671875, + "loss_eval": 12.260065078735352, + "epoch": 80 + }, + { + "hidden_norms": [ + 77920.109375, + 285895104.0, + 245542864.0, + 186746576.0, + 30585936.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.98649830105569e-08, + 3.0335337020126474e-10, + 3.010065807718121e-10, + 3.0114838400763233e-10, + 3.010563187633153e-10 + ], + "bp_grad_norms_F": [ + 1.6312769730575383e-05, + 1.8841578963701977e-08, + 1.7605929159003608e-08, + 1.7449115929935033e-08, + 1.7431389665034658e-08 + ], + "gamma_dfa": -0.051095581700792536, + "acc_eval": 0.087890625, + "loss_eval": 12.283187866210938, + "epoch": 81 + }, + { + "hidden_norms": [ + 78045.9765625, + 287308480.0, + 246744592.0, + 187657408.0, + 30732464.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.991665367830137e-08, + 3.023456207618125e-10, + 3.001092707677344e-10, + 3.002506299143448e-10, + 3.001580373140911e-10 + ], + "bp_grad_norms_F": [ + 1.6261117707472295e-05, + 1.8763861575621377e-08, + 1.7538225094426707e-08, + 1.73831011807124e-08, + 1.7365564985993842e-08 + ], + "gamma_dfa": -0.05111259325349238, + "acc_eval": 0.0888671875, + "loss_eval": 12.312464714050293, + "epoch": 82 + }, + { + "hidden_norms": [ + 78157.4453125, + 288495296.0, + 247894048.0, + 188423328.0, + 30852564.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.983852950450455e-08, + 3.0117680571706273e-10, + 2.9906743748142617e-10, + 2.9920824151652425e-10, + 2.991159819831779e-10 + ], + "bp_grad_norms_F": [ + 1.6263733414234594e-05, + 1.8713789629032362e-08, + 1.7478631875178507e-08, + 1.7324792267459088e-08, + 1.730730758708887e-08 + ], + "gamma_dfa": -0.05116538004585891, + "acc_eval": 0.0849609375, + "loss_eval": 12.31210994720459, + "epoch": 83 + }, + { + "hidden_norms": [ + 78262.0234375, + 289603808.0, + 248882656.0, + 189149776.0, + 30956266.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.960672204239017e-08, + 3.0011432228249646e-10, + 2.9822597169548715e-10, + 2.9836624837464853e-10, + 2.9827409986360465e-10 + ], + "bp_grad_norms_F": [ + 1.631741542951204e-05, + 1.8692462688818523e-08, + 1.7431661447631086e-08, + 1.7277525188319487e-08, + 1.725989662304528e-08 + ], + "gamma_dfa": -0.05115435087645892, + "acc_eval": 0.083984375, + "loss_eval": 12.336039543151855, + "epoch": 84 + }, + { + "hidden_norms": [ + 78353.1171875, + 290648000.0, + 249810592.0, + 189809696.0, + 31040388.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.986083344098006e-08, + 2.995071968214802e-10, + 2.9758684405578606e-10, + 2.977268154236157e-10, + 2.9763422282336194e-10 + ], + "bp_grad_norms_F": [ + 1.6262692952295765e-05, + 1.849162600819909e-08, + 1.73968519590062e-08, + 1.7244063954535704e-08, + 1.7226579274165488e-08 + ], + "gamma_dfa": -0.05118084823334357, + "acc_eval": 0.0888671875, + "loss_eval": 12.381507873535156, + "epoch": 85 + }, + { + "hidden_norms": [ + 78431.15625, + 291523168.0, + 250644688.0, + 190386224.0, + 31126390.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.970421561116382e-08, + 2.984960056906516e-10, + 2.967268375453358e-10, + 2.968662538016531e-10, + 2.967753265359363e-10 + ], + "bp_grad_norms_F": [ + 1.6223337297560647e-05, + 1.8457278372352448e-08, + 1.7345271885460534e-08, + 1.7192725465520198e-08, + 1.717533315570563e-08 + ], + "gamma_dfa": -0.05117447574957623, + "acc_eval": 0.0849609375, + "loss_eval": 12.38785171508789, + "epoch": 86 + }, + { + "hidden_norms": [ + 78499.1484375, + 292312512.0, + 251365920.0, + 190918880.0, + 31200688.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.988487110173082e-08, + 2.980244662165177e-10, + 2.966143997085169e-10, + 2.96407148825395e-10, + 2.965439005464532e-10 + ], + "bp_grad_norms_F": [ + 1.627574602025561e-05, + 1.8460895034877467e-08, + 1.7314020439584965e-08, + 1.7161701393320072e-08, + 1.714437836142224e-08 + ], + "gamma_dfa": -0.05115793484583264, + "acc_eval": 0.0888671875, + "loss_eval": 12.419504165649414, + "epoch": 87 + }, + { + "hidden_norms": [ + 78560.8984375, + 292944192.0, + 251977760.0, + 191372272.0, + 31263360.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.973138676537928e-08, + 2.973402635220168e-10, + 2.9567431836241553e-10, + 2.958131239960693e-10, + 2.957224187749574e-10 + ], + "bp_grad_norms_F": [ + 1.628614336368628e-05, + 1.8427853021307783e-08, + 1.72794418773492e-08, + 1.7127625540069857e-08, + 1.7110302508172026e-08 + ], + "gamma_dfa": -0.0511754965664295, + "acc_eval": 0.087890625, + "loss_eval": 12.422038078308105, + "epoch": 88 + }, + { + "hidden_norms": [ + 78610.8515625, + 293507168.0, + 252467824.0, + 191746752.0, + 31315682.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.979492349681095e-08, + 2.9698124515142865e-10, + 2.9562619019429803e-10, + 2.9538149703967065e-10, + 2.9551999736199264e-10 + ], + "bp_grad_norms_F": [ + 1.631640589039307e-05, + 1.8418628400240777e-08, + 1.726077947239446e-08, + 1.710880859207009e-08, + 1.709145003303547e-08 + ], + "gamma_dfa": -0.051156919635104714, + "acc_eval": 0.0888671875, + "loss_eval": 12.428571701049805, + "epoch": 89 + }, + { + "hidden_norms": [ + 78652.9921875, + 293964640.0, + 252896208.0, + 192039472.0, + 31369200.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.969335141273405e-08, + 2.9646449184461687e-10, + 2.949255561990327e-10, + 2.949690214304468e-10, + 2.9487870478739353e-10 + ], + "bp_grad_norms_F": [ + 1.6324445823556744e-05, + 1.8399745727037953e-08, + 1.7238173555256253e-08, + 1.7086200898575044e-08, + 1.7068817470544673e-08 + ], + "gamma_dfa": -0.051174478845496196, + "acc_eval": 0.087890625, + "loss_eval": 12.429685592651367, + "epoch": 90 + }, + { + "hidden_norms": [ + 78686.6953125, + 294364864.0, + 253268672.0, + 192287472.0, + 31404650.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.964375552977799e-08, + 2.960394152040635e-10, + 2.9448907201690133e-10, + 2.9462729478346716e-10, + 2.9453686711811145e-10 + ], + "bp_grad_norms_F": [ + 1.5716021152911708e-05, + 1.8335738261043844e-08, + 1.7222946624428914e-08, + 1.7072181890398497e-08, + 1.7054745171662944e-08 + ], + "gamma_dfa": -0.05117890803012415, + "acc_eval": 0.087890625, + "loss_eval": 12.430795669555664, + "epoch": 91 + }, + { + "hidden_norms": [ + 78715.6640625, + 294704960.0, + 253580416.0, + 192507984.0, + 31439268.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.966816267275135e-08, + 2.9585070504545286e-10, + 2.9467184248233025e-10, + 2.944416099825986e-10, + 2.943854882087038e-10 + ], + "bp_grad_norms_F": [ + 1.575841633894015e-05, + 1.832342988450364e-08, + 1.7211402081329652e-08, + 1.7061056567513333e-08, + 1.704364827048721e-08 + ], + "gamma_dfa": -0.05119702904630685, + "acc_eval": 0.087890625, + "loss_eval": 12.439577102661133, + "epoch": 92 + }, + { + "hidden_norms": [ + 78736.21875, + 294950432.0, + 253812928.0, + 192667952.0, + 31460118.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.969291798166523e-08, + 2.956498934558738e-10, + 2.9448718463775947e-10, + 2.947934119035267e-10, + 2.946275168280721e-10 + ], + "bp_grad_norms_F": [ + 1.5731959138065577e-05, + 1.8296260506645012e-08, + 1.719953068857194e-08, + 1.7050359346626465e-08, + 1.703298835309397e-08 + ], + "gamma_dfa": -0.05120327511394862, + "acc_eval": 0.0888671875, + "loss_eval": 12.4466552734375, + "epoch": 93 + }, + { + "hidden_norms": [ + 78753.203125, + 295147232.0, + 253989200.0, + 192796160.0, + 31479312.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.963842645925979e-08, + 2.9541508128616556e-10, + 2.9437702275814104e-10, + 2.943085775086729e-10, + 2.9446245441988594e-10 + ], + "bp_grad_norms_F": [ + 1.573332519910764e-05, + 1.8288872638549947e-08, + 1.718973052788897e-08, + 1.7040525435163545e-08, + 1.7023159770701568e-08 + ], + "gamma_dfa": -0.051216166342783254, + "acc_eval": 0.087890625, + "loss_eval": 12.445267677307129, + "epoch": 94 + }, + { + "hidden_norms": [ + 78765.84375, + 295294944.0, + 254123440.0, + 192894032.0, + 31493604.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.965194098209395e-08, + 2.9531932455029164e-10, + 2.942409649264732e-10, + 2.945468868809087e-10, + 2.943810750721809e-10 + ], + "bp_grad_norms_F": [ + 1.5746687495266087e-05, + 1.8289329162257673e-08, + 1.7184650147328284e-08, + 1.703533136776514e-08, + 1.7017976361444198e-08 + ], + "gamma_dfa": -0.0512156481272541, + "acc_eval": 0.087890625, + "loss_eval": 12.449201583862305, + "epoch": 95 + }, + { + "hidden_norms": [ + 78774.0859375, + 295388160.0, + 254208896.0, + 192955280.0, + 31502434.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.963444741993953e-08, + 2.9521793343256775e-10, + 2.941772103692841e-10, + 2.944521015901813e-10, + 2.9431723724826497e-10 + ], + "bp_grad_norms_F": [ + 1.574558154970873e-05, + 1.8287312997244953e-08, + 1.7180775913061552e-08, + 1.7031513976917267e-08, + 1.7014160746953166e-08 + ], + "gamma_dfa": -0.051216532388934866, + "acc_eval": 0.087890625, + "loss_eval": 12.451032638549805, + "epoch": 96 + }, + { + "hidden_norms": [ + 78778.2109375, + 295438176.0, + 254253040.0, + 192987616.0, + 31507318.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.962313557958623e-08, + 2.951474897816553e-10, + 2.9410018864695076e-10, + 2.9431876380492383e-10, + 2.9424027103708283e-10 + ], + "bp_grad_norms_F": [ + 1.5746518329251558e-05, + 1.8286739233985827e-08, + 1.717829789527059e-08, + 1.7028938259500137e-08, + 1.7011583253179197e-08 + ], + "gamma_dfa": -0.051216747364378534, + "acc_eval": 0.087890625, + "loss_eval": 12.451074600219727, + "epoch": 97 + }, + { + "hidden_norms": [ + 78782.125, + 295481568.0, + 254291456.0, + 193016112.0, + 31511684.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.962148712043927e-08, + 2.9511454391339953e-10, + 2.9406876933535386e-10, + 2.942796561988814e-10, + 2.9420885172548594e-10 + ], + "bp_grad_norms_F": [ + 1.574746784172021e-05, + 1.8285794212147266e-08, + 1.7176807531882332e-08, + 1.7027431908900326e-08, + 1.7010076902579385e-08 + ], + "gamma_dfa": -0.05121716375651886, + "acc_eval": 0.087890625, + "loss_eval": 12.451665878295898, + "epoch": 98 + }, + { + "hidden_norms": [ + 78783.9921875, + 295502592.0, + 254310320.0, + 193029024.0, + 31513524.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.961931285966784e-08, + 2.950964195225225e-10, + 2.940539201023995e-10, + 2.942680543682741e-10, + 2.941940024925316e-10 + ], + "bp_grad_norms_F": [ + 1.5747409634059295e-05, + 1.8284790570533005e-08, + 1.717580744298175e-08, + 1.702643714907026e-08, + 1.700908214274932e-08 + ], + "gamma_dfa": -0.05121721836621873, + "acc_eval": 0.087890625, + "loss_eval": 12.452173233032227, + "epoch": 99 + }, + { + "hidden_norms": [ + 78784.0078125, + 295502688.0, + 254310576.0, + 193029360.0, + 31513636.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.96192702271037e-08, + 2.9509686361173237e-10, + 2.940537813245214e-10, + 2.9426569514434675e-10, + 2.941938359590779e-10 + ], + "bp_grad_norms_F": [ + 1.5747655197628774e-05, + 1.8284845637595026e-08, + 1.7175850075545895e-08, + 1.7026476228920728e-08, + 1.7009122998956627e-08 + ], + "gamma_dfa": -0.05121716100984486, + "acc_eval": 0.087890625, + "loss_eval": 12.452241897583008, + "epoch": 100 + } + ] +}
\ No newline at end of file |
