summaryrefslogtreecommitdiff
path: root/results/h2_no_residual_full_s456/snapshot_evolution_s456.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/h2_no_residual_full_s456/snapshot_evolution_s456.json')
-rw-r--r--results/h2_no_residual_full_s456/snapshot_evolution_s456.json2749
1 files changed, 2749 insertions, 0 deletions
diff --git a/results/h2_no_residual_full_s456/snapshot_evolution_s456.json b/results/h2_no_residual_full_s456/snapshot_evolution_s456.json
new file mode 100644
index 0000000..4070eaa
--- /dev/null
+++ b/results/h2_no_residual_full_s456/snapshot_evolution_s456.json
@@ -0,0 +1,2749 @@
+{
+ "config": {
+ "output_dir": "results/h2_no_residual_full_s456",
+ "epochs": 100,
+ "lr": 0.001,
+ "wd": 0.01,
+ "seed": 456,
+ "depth": 4,
+ "d_hidden": 256,
+ "log_every": 1,
+ "no_residual_add": true,
+ "w2_std": 0.5,
+ "random_targets": false,
+ "skip_bp": true
+ },
+ "depth": 4,
+ "d_hidden": 256,
+ "num_classes": 10,
+ "bp_log": null,
+ "dfa_log": [
+ {
+ "hidden_norms": [
+ 8.696551322937012,
+ 42.47159957885742,
+ 42.67432403564453,
+ 45.272701263427734,
+ 43.449092864990234
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011182057205587626,
+ 0.00021166827355045825,
+ 0.00014748115791007876,
+ 0.00011803740198956802,
+ 0.00010102539090439677
+ ],
+ "bp_grad_norms_F": [
+ 0.039927296340465546,
+ 0.006882709916681051,
+ 0.004750067833811045,
+ 0.00377994985319674,
+ 0.0032426300458610058
+ ],
+ "gamma_dfa": 0.012312270817346871,
+ "acc_eval": 0.1142578125,
+ "loss_eval": 2.3956005573272705,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 1556.684814453125,
+ 6497.32177734375,
+ 10603.298828125,
+ 15776.048828125,
+ 9974.5771484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.715180458944815e-07,
+ 4.893955178886245e-07,
+ 4.84326051264361e-07,
+ 4.838655058847507e-07,
+ 4.83024962250056e-07
+ ],
+ "bp_grad_norms_F": [
+ 4.703722152044065e-05,
+ 2.927827154053375e-05,
+ 2.886639595089946e-05,
+ 2.8710121114272624e-05,
+ 2.851033423212357e-05
+ ],
+ "gamma_dfa": 0.018546399660408497,
+ "acc_eval": 0.111328125,
+ "loss_eval": 2.356113910675049,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 3438.555908203125,
+ 41675.72265625,
+ 66460.0234375,
+ 84792.1875,
+ 42575.42578125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.2151462530928256e-07,
+ 8.604414603041732e-08,
+ 8.536036233408595e-08,
+ 8.52630037684321e-08,
+ 8.530036410547837e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.8386168449069373e-05,
+ 6.961788585613249e-06,
+ 6.748253326804843e-06,
+ 6.721136742271483e-06,
+ 6.674351880064933e-06
+ ],
+ "gamma_dfa": 0.017316466895863414,
+ "acc_eval": 0.1005859375,
+ "loss_eval": 2.356572151184082,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 5372.435546875,
+ 121188.546875,
+ 174809.4375,
+ 203405.859375,
+ 95077.4609375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.2532444770840812e-07,
+ 3.495903300176906e-08,
+ 3.4808731896873724e-08,
+ 3.474917420476231e-08,
+ 3.4685903926856554e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.1882418220920954e-05,
+ 2.7211688120587496e-06,
+ 2.6087484457093524e-06,
+ 2.602359927550424e-06,
+ 2.590174972283421e-06
+ ],
+ "gamma_dfa": 0.014974067453294992,
+ "acc_eval": 0.080078125,
+ "loss_eval": 2.381472110748291,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 7225.4375,
+ 258499.359375,
+ 333575.4375,
+ 364076.25,
+ 168464.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.640306248253182e-08,
+ 1.9808053863812347e-08,
+ 1.9682946827970227e-08,
+ 1.9666908102067282e-08,
+ 1.967319640527876e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.1042752703360748e-05,
+ 1.5015855296951486e-06,
+ 1.3234410971563193e-06,
+ 1.3206722542236093e-06,
+ 1.314130940954783e-06
+ ],
+ "gamma_dfa": 0.020775633631274104,
+ "acc_eval": 0.0654296875,
+ "loss_eval": 2.458400249481201,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 8934.6435546875,
+ 470048.6875,
+ 549725.375,
+ 586957.8125,
+ 270350.28125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.15417982632971e-08,
+ 1.303753727199819e-08,
+ 1.2938533799911056e-08,
+ 1.2922544811999614e-08,
+ 1.2902905410783205e-08
+ ],
+ "bp_grad_norms_F": [
+ 9.721887181513011e-06,
+ 9.336578727925371e-07,
+ 8.095747716652113e-07,
+ 8.079554731921235e-07,
+ 8.037279712880263e-07
+ ],
+ "gamma_dfa": 0.023886571638286114,
+ "acc_eval": 0.0732421875,
+ "loss_eval": 2.553205966949463,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 10581.7958984375,
+ 749584.4375,
+ 812141.0,
+ 857193.1875,
+ 400190.71875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.321820222865426e-08,
+ 9.664934630393418e-09,
+ 9.634317343909515e-09,
+ 9.620791274755902e-09,
+ 9.613222218263218e-09
+ ],
+ "bp_grad_norms_F": [
+ 7.260930487973383e-06,
+ 5.95286962834507e-07,
+ 5.624330583486881e-07,
+ 5.61392937470373e-07,
+ 5.576875423685124e-07
+ ],
+ "gamma_dfa": 0.024110323167406023,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 2.702815532684326,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 12157.236328125,
+ 1101113.5,
+ 1131608.625,
+ 1175579.75,
+ 556328.5625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.076628977780274e-08,
+ 7.990832884274823e-09,
+ 7.954333192117247e-09,
+ 7.956207248582814e-09,
+ 7.94490695454897e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.092925211007241e-06,
+ 4.779853952641133e-07,
+ 4.453321764685825e-07,
+ 4.4446503011386085e-07,
+ 4.4091100903642655e-07
+ ],
+ "gamma_dfa": 0.029227681923657656,
+ "acc_eval": 0.1123046875,
+ "loss_eval": 2.943108558654785,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 13644.7734375,
+ 1553127.5,
+ 1514848.5,
+ 1594542.125,
+ 760487.4375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.183345391264083e-08,
+ 6.574770061718027e-09,
+ 6.521708506568302e-09,
+ 6.522410611609075e-09,
+ 6.511657879570976e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.052718380378792e-05,
+ 3.7946443853797973e-07,
+ 3.55582386646347e-07,
+ 3.546880407157005e-07,
+ 3.51142261934001e-07
+ ],
+ "gamma_dfa": 0.031233762740157545,
+ "acc_eval": 0.115234375,
+ "loss_eval": 3.18121600151062,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 15180.75,
+ 2118332.5,
+ 1971916.0,
+ 2126576.75,
+ 1010951.875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.837856147967614e-08,
+ 5.575389039336187e-09,
+ 5.5562221490390584e-09,
+ 5.548445258796164e-09,
+ 5.536703984176938e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.100128883990692e-05,
+ 3.2698190466362576e-07,
+ 3.031300082056987e-07,
+ 3.0168610010150587e-07,
+ 2.9835959480806196e-07
+ ],
+ "gamma_dfa": 0.03483391250483692,
+ "acc_eval": 0.1162109375,
+ "loss_eval": 3.5671467781066895,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 16599.55078125,
+ 2766443.75,
+ 2507868.5,
+ 2746855.25,
+ 1307418.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.16296781888559e-08,
+ 4.753268889601259e-09,
+ 4.731485869768903e-09,
+ 4.728840874435036e-09,
+ 4.7213348786101506e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1134686246805359e-05,
+ 2.7916473754885374e-07,
+ 2.561137080192566e-07,
+ 2.54354034723292e-07,
+ 2.5102386302933155e-07
+ ],
+ "gamma_dfa": 0.04032926296349615,
+ "acc_eval": 0.115234375,
+ "loss_eval": 3.8605642318725586,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 18096.76171875,
+ 3487919.0,
+ 3098858.25,
+ 3488545.25,
+ 1643380.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.39422816309343e-08,
+ 4.142685749997099e-09,
+ 4.12689660223009e-09,
+ 4.106536444226094e-09,
+ 4.097727934748718e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2028808669128921e-05,
+ 2.466808268763998e-07,
+ 2.2443308012043417e-07,
+ 2.2274194577676099e-07,
+ 2.1958824447665393e-07
+ ],
+ "gamma_dfa": 0.04084749217145145,
+ "acc_eval": 0.1162109375,
+ "loss_eval": 4.266114234924316,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 19581.2265625,
+ 4300652.5,
+ 3764740.75,
+ 4282907.0,
+ 2046749.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.486859487926267e-08,
+ 3.5559581945676655e-09,
+ 3.521152702745667e-09,
+ 3.5090488292865984e-09,
+ 3.507678369985001e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1329559129080735e-05,
+ 2.097379336873928e-07,
+ 1.916048546490856e-07,
+ 1.900083077543968e-07,
+ 1.8724767869571224e-07
+ ],
+ "gamma_dfa": 0.041128118813503534,
+ "acc_eval": 0.1123046875,
+ "loss_eval": 4.545563220977783,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 21009.037109375,
+ 5305093.0,
+ 4626911.0,
+ 5321710.0,
+ 2528971.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.575832938755411e-08,
+ 3.0991811339475817e-09,
+ 3.0681037710422743e-09,
+ 3.060007136568288e-09,
+ 3.054509534194949e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.31506558318506e-05,
+ 1.8260404033298983e-07,
+ 1.6721619999771065e-07,
+ 1.6574335859331768e-07,
+ 1.6327113883107813e-07
+ ],
+ "gamma_dfa": 0.04362456756643951,
+ "acc_eval": 0.1142578125,
+ "loss_eval": 5.006200790405273,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 22418.66015625,
+ 6455876.5,
+ 5546792.0,
+ 6434348.0,
+ 3069372.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.665693146918784e-08,
+ 2.6803985697654298e-09,
+ 2.6608955039364446e-09,
+ 2.655886177649336e-09,
+ 2.650993424779813e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1598707715165801e-05,
+ 1.584767090889727e-07,
+ 1.4540981396748975e-07,
+ 1.442050745481538e-07,
+ 1.419812747371907e-07
+ ],
+ "gamma_dfa": 0.043382189120166004,
+ "acc_eval": 0.115234375,
+ "loss_eval": 5.284748077392578,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 23927.9296875,
+ 7772545.0,
+ 6605308.0,
+ 7661779.0,
+ 3671957.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.622067954571321e-08,
+ 2.3548620831093103e-09,
+ 2.3399049364769553e-09,
+ 2.3347188626843263e-09,
+ 2.3328083909035513e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2071202945662662e-05,
+ 1.4146635862744006e-07,
+ 1.285337845047252e-07,
+ 1.2724865428026533e-07,
+ 1.2524400005986536e-07
+ ],
+ "gamma_dfa": 0.045932179084047675,
+ "acc_eval": 0.1123046875,
+ "loss_eval": 5.692019462585449,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 25385.748046875,
+ 9261487.0,
+ 7775942.0,
+ 8990953.0,
+ 4363130.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.712851868291182e-08,
+ 2.1066282052117913e-09,
+ 2.0846218085068813e-09,
+ 2.0782020548892888e-09,
+ 2.0737342953935922e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.4093741810938809e-05,
+ 1.278412895544534e-07,
+ 1.1472226901787508e-07,
+ 1.1351045259289094e-07,
+ 1.1163785273993199e-07
+ ],
+ "gamma_dfa": 0.04430226338445209,
+ "acc_eval": 0.1103515625,
+ "loss_eval": 6.133723258972168,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 26846.431640625,
+ 10875826.0,
+ 9052473.0,
+ 10511219.0,
+ 5116002.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.701503079715621e-08,
+ 1.8753321118225585e-09,
+ 1.861700571481606e-09,
+ 1.8542083424222255e-09,
+ 1.8551130631649926e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3089967978885397e-05,
+ 1.156644771072024e-07,
+ 1.0296086117023151e-07,
+ 1.0183324405943495e-07,
+ 1.0014894513687977e-07
+ ],
+ "gamma_dfa": 0.04534357553347945,
+ "acc_eval": 0.103515625,
+ "loss_eval": 6.548648834228516,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 28266.26953125,
+ 12742770.0,
+ 10505442.0,
+ 12262496.0,
+ 5946980.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.75791733076403e-08,
+ 1.6816592562918231e-09,
+ 1.6644484679417815e-09,
+ 1.662164628157825e-09,
+ 1.6569644545327833e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3716629837290384e-05,
+ 1.0489808488500785e-07,
+ 9.319560234644086e-08,
+ 9.210800300252231e-08,
+ 9.0522433993101e-08
+ ],
+ "gamma_dfa": 0.04543712313170545,
+ "acc_eval": 0.0859375,
+ "loss_eval": 6.933040618896484,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 29640.484375,
+ 14788877.0,
+ 12157201.0,
+ 14095277.0,
+ 6799392.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.606816865290966e-08,
+ 1.512424963046044e-09,
+ 1.495692236730406e-09,
+ 1.4903339673466576e-09,
+ 1.4848139384682213e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3458115063258447e-05,
+ 9.697606628833455e-08,
+ 8.518442484728439e-08,
+ 8.402660256479066e-08,
+ 8.255508987531357e-08
+ ],
+ "gamma_dfa": 0.044778631010558456,
+ "acc_eval": 0.076171875,
+ "loss_eval": 7.425451278686523,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 31005.751953125,
+ 17043824.0,
+ 13942765.0,
+ 16095532.0,
+ 7803190.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.645277122492189e-08,
+ 1.3731507042535895e-09,
+ 1.3549177335647755e-09,
+ 1.3525375264222816e-09,
+ 1.3489699357549512e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2845624951296486e-05,
+ 8.864368084005037e-08,
+ 7.73182620150692e-08,
+ 7.621348885322732e-08,
+ 7.483793496021462e-08
+ ],
+ "gamma_dfa": 0.045761530549498275,
+ "acc_eval": 0.080078125,
+ "loss_eval": 7.776348114013672,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 32358.83984375,
+ 19344688.0,
+ 15897992.0,
+ 18375228.0,
+ 8836651.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.644052146815739e-08,
+ 1.2519073555594673e-09,
+ 1.235606394978106e-09,
+ 1.2283364325682555e-09,
+ 1.2260956694376546e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3093407687847503e-05,
+ 8.157029185440479e-08,
+ 7.093318998840914e-08,
+ 6.988454259726495e-08,
+ 6.859116297164292e-08
+ ],
+ "gamma_dfa": 0.04580485462793149,
+ "acc_eval": 0.0927734375,
+ "loss_eval": 8.182464599609375,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 33740.52734375,
+ 21987014.0,
+ 17933020.0,
+ 20700014.0,
+ 9927617.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.858014328121499e-08,
+ 1.141782890456966e-09,
+ 1.131721383273998e-09,
+ 1.1269319921680676e-09,
+ 1.1228904472915247e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2902617527288385e-05,
+ 7.599386009360387e-08,
+ 6.517191053490023e-08,
+ 6.410991915117847e-08,
+ 6.290429155342281e-08
+ ],
+ "gamma_dfa": 0.046245397155871615,
+ "acc_eval": 0.1044921875,
+ "loss_eval": 8.578572273254395,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 35055.48828125,
+ 24700796.0,
+ 20204280.0,
+ 23173254.0,
+ 11098732.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.840032623107618e-08,
+ 1.054925813370744e-09,
+ 1.0381229209599496e-09,
+ 1.033837571107199e-09,
+ 1.0320241328187763e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3013632269576192e-05,
+ 7.11033791844784e-08,
+ 6.033156552121e-08,
+ 5.929242519187028e-08,
+ 5.8144280501437606e-08
+ ],
+ "gamma_dfa": 0.04646674945252016,
+ "acc_eval": 0.10546875,
+ "loss_eval": 8.944098472595215,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 36405.48046875,
+ 27759312.0,
+ 22467726.0,
+ 25750832.0,
+ 12358187.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 7.77747288793762e-08,
+ 9.745112494741193e-10,
+ 9.61777768537786e-10,
+ 9.57246060195871e-10,
+ 9.547377333163354e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.3124400538799819e-05,
+ 6.744348723941584e-08,
+ 5.6144159543691785e-08,
+ 5.510578660050669e-08,
+ 5.4037375463167336e-08
+ ],
+ "gamma_dfa": 0.04619356358307414,
+ "acc_eval": 0.10546875,
+ "loss_eval": 9.376721382141113,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 37680.57421875,
+ 30906478.0,
+ 24827362.0,
+ 28558372.0,
+ 13662978.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.0997551776818e-08,
+ 9.035370229781847e-10,
+ 8.898414227687113e-10,
+ 8.862885980676083e-10,
+ 8.829543207689028e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.3445563126879279e-05,
+ 6.41164845660569e-08,
+ 5.240685041485449e-08,
+ 5.135610692263981e-08,
+ 5.02956822856504e-08
+ ],
+ "gamma_dfa": 0.046825854369672015,
+ "acc_eval": 0.10546875,
+ "loss_eval": 9.577943801879883,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 38936.06640625,
+ 34144420.0,
+ 27240194.0,
+ 31329912.0,
+ 14997002.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.190059475055023e-08,
+ 8.378591709323757e-10,
+ 8.267845297282861e-10,
+ 8.228125403242359e-10,
+ 8.203847046139856e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2998734746361151e-05,
+ 6.114981232485661e-08,
+ 4.876913095586133e-08,
+ 4.772548578557689e-08,
+ 4.673227849139039e-08
+ ],
+ "gamma_dfa": 0.047515806669252925,
+ "acc_eval": 0.10546875,
+ "loss_eval": 9.88414478302002,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 40155.01953125,
+ 37508168.0,
+ 29749186.0,
+ 34078604.0,
+ 16502834.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.168245813067188e-08,
+ 7.775868282600129e-10,
+ 7.702881665849759e-10,
+ 7.661091205868331e-10,
+ 7.637669940940839e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.3017543096793815e-05,
+ 5.765622645981239e-08,
+ 4.5165805317992636e-08,
+ 4.418279431206429e-08,
+ 4.329486813503536e-08
+ ],
+ "gamma_dfa": 0.047424486168893054,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 10.275530815124512,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 41438.58203125,
+ 41153480.0,
+ 32568028.0,
+ 37348624.0,
+ 18107524.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.174999521770587e-08,
+ 7.312160876793428e-10,
+ 7.228238008138987e-10,
+ 7.196194196090744e-10,
+ 7.171208626921555e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2991866242373362e-05,
+ 5.5619945982243735e-08,
+ 4.266198772029384e-08,
+ 4.1693596131153754e-08,
+ 4.083043592117974e-08
+ ],
+ "gamma_dfa": 0.04726689399103634,
+ "acc_eval": 0.10546875,
+ "loss_eval": 10.532907485961914,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 42610.61328125,
+ 44767372.0,
+ 35250536.0,
+ 40433388.0,
+ 19648566.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.25098211976183e-08,
+ 6.862435619758855e-10,
+ 6.773137606330693e-10,
+ 6.743952063459346e-10,
+ 6.720446421581983e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2943252841068897e-05,
+ 5.273594538834914e-08,
+ 4.00670607803022e-08,
+ 3.916983715157585e-08,
+ 3.8364525778433745e-08
+ ],
+ "gamma_dfa": 0.04717689534300007,
+ "acc_eval": 0.10546875,
+ "loss_eval": 10.889819145202637,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 43802.12109375,
+ 48777580.0,
+ 38250948.0,
+ 43905160.0,
+ 21394392.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.3824673424715e-08,
+ 6.459773826961168e-10,
+ 6.385393880314894e-10,
+ 6.341404623633196e-10,
+ 6.317291689761362e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2702556887234095e-05,
+ 4.966772237935402e-08,
+ 3.767947376331904e-08,
+ 3.682788829451056e-08,
+ 3.60615324268565e-08
+ ],
+ "gamma_dfa": 0.04775475192582235,
+ "acc_eval": 0.10546875,
+ "loss_eval": 11.143190383911133,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 44971.96484375,
+ 53001532.0,
+ 41286860.0,
+ 47327540.0,
+ 23064180.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.44017193912805e-08,
+ 6.083171188997483e-10,
+ 6.001447672154825e-10,
+ 5.973078143206578e-10,
+ 5.949598036458781e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2565969882416539e-05,
+ 4.7034244943233716e-08,
+ 3.557239125484557e-08,
+ 3.4768806500551364e-08,
+ 3.403641457566664e-08
+ ],
+ "gamma_dfa": 0.04808254592353478,
+ "acc_eval": 0.10546875,
+ "loss_eval": 11.375898361206055,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 46135.65234375,
+ 57315672.0,
+ 44360792.0,
+ 51011808.0,
+ 24900550.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.566909315277371e-08,
+ 5.749250520103999e-10,
+ 5.675590553089194e-10,
+ 5.655514945246409e-10,
+ 5.63264157538157e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2200253877381328e-05,
+ 4.4094601747701745e-08,
+ 3.3572575830476126e-08,
+ 3.2811797723297786e-08,
+ 3.210490717719949e-08
+ ],
+ "gamma_dfa": 0.04755272905458696,
+ "acc_eval": 0.1064453125,
+ "loss_eval": 11.584449768066406,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 47265.27734375,
+ 61919976.0,
+ 47722620.0,
+ 54844944.0,
+ 26929922.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.478352953034118e-08,
+ 5.391301294288553e-10,
+ 5.344974463028507e-10,
+ 5.308364858791492e-10,
+ 5.291052596057e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.2009260899503715e-05,
+ 4.1767787450908145e-08,
+ 3.1745546635875144e-08,
+ 3.102580947711431e-08,
+ 3.037316531617762e-08
+ ],
+ "gamma_dfa": 0.0475847675697878,
+ "acc_eval": 0.10546875,
+ "loss_eval": 11.923343658447266,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 48342.62109375,
+ 66327300.0,
+ 51030320.0,
+ 58382808.0,
+ 28803830.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.630867398551345e-08,
+ 5.130093017058357e-10,
+ 5.057400054298e-10,
+ 5.023059190811807e-10,
+ 5.003696346150832e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1836677003884688e-05,
+ 3.972920481487563e-08,
+ 3.016906902075789e-08,
+ 2.9483924635087533e-08,
+ 2.8860545953079964e-08
+ ],
+ "gamma_dfa": 0.04806397232459858,
+ "acc_eval": 0.10546875,
+ "loss_eval": 12.134788513183594,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 49438.7734375,
+ 70923576.0,
+ 54371588.0,
+ 62839076.0,
+ 30745350.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.529716666316745e-08,
+ 4.881638981935055e-10,
+ 4.826159472059999e-10,
+ 4.801878894511447e-10,
+ 4.785546958707698e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1614155482675415e-05,
+ 3.7715466305598966e-08,
+ 2.8843189170402184e-08,
+ 2.8193024803613298e-08,
+ 2.7588850315396485e-08
+ ],
+ "gamma_dfa": 0.047784373455215245,
+ "acc_eval": 0.10546875,
+ "loss_eval": 12.365730285644531,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 50484.30859375,
+ 75708880.0,
+ 57946872.0,
+ 66924284.0,
+ 32685426.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.612364865712152e-08,
+ 4.650996809907326e-10,
+ 4.5824133376726195e-10,
+ 4.5511036605994093e-10,
+ 4.534528585953268e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1689081475196872e-05,
+ 3.617047283910324e-08,
+ 2.7491989129657668e-08,
+ 2.6862345237077534e-08,
+ 2.6283149878736367e-08
+ ],
+ "gamma_dfa": 0.04781174083473161,
+ "acc_eval": 0.10546875,
+ "loss_eval": 12.582022666931152,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 51533.140625,
+ 80717000.0,
+ 61608756.0,
+ 71031448.0,
+ 34583536.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.646285465374604e-08,
+ 4.4203954385757527e-10,
+ 4.369871131615355e-10,
+ 4.329318292750628e-10,
+ 4.319989088674703e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1521507985889912e-05,
+ 3.4413087490747785e-08,
+ 2.619959005301098e-08,
+ 2.5601275766007348e-08,
+ 2.505496254912032e-08
+ ],
+ "gamma_dfa": 0.04798329665209167,
+ "acc_eval": 0.10546875,
+ "loss_eval": 12.857856750488281,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 52583.0859375,
+ 85961416.0,
+ 65257552.0,
+ 74859152.0,
+ 36629052.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.666147977010041e-08,
+ 4.2343398232169704e-10,
+ 4.1782510784571514e-10,
+ 4.1457998145588704e-10,
+ 4.136685161082454e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1553073818504345e-05,
+ 3.306437434957843e-08,
+ 2.515412056425248e-08,
+ 2.4584762670087912e-08,
+ 2.405546162265182e-08
+ ],
+ "gamma_dfa": 0.04809549875790253,
+ "acc_eval": 0.10546875,
+ "loss_eval": 13.005304336547852,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 53574.21875,
+ 91233752.0,
+ 68912136.0,
+ 78801432.0,
+ 38771888.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.665335116120332e-08,
+ 4.0339676043998907e-10,
+ 4.0027073322512763e-10,
+ 3.982228713450553e-10,
+ 3.9690134512326836e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1503744644869585e-05,
+ 3.151562921743789e-08,
+ 2.405471910549295e-08,
+ 2.3515880798186117e-08,
+ 2.3014273153876275e-08
+ ],
+ "gamma_dfa": 0.04791133257094771,
+ "acc_eval": 0.10546875,
+ "loss_eval": 13.310943603515625,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 54515.76953125,
+ 96143688.0,
+ 72537432.0,
+ 83291584.0,
+ 40846320.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.742490109625578e-08,
+ 3.8639558219699666e-10,
+ 3.8376418709518134e-10,
+ 3.813957205611729e-10,
+ 3.8053543649496646e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1331952919135801e-05,
+ 3.0162087938379045e-08,
+ 2.3133726045898584e-08,
+ 2.2621049922122438e-08,
+ 2.2133153976255926e-08
+ ],
+ "gamma_dfa": 0.0483476699446328,
+ "acc_eval": 0.10546875,
+ "loss_eval": 13.509955406188965,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 55471.92578125,
+ 101352504.0,
+ 76262640.0,
+ 87893288.0,
+ 43005752.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.776105886454388e-08,
+ 3.722072094980433e-10,
+ 3.6970662642410446e-10,
+ 3.67776836762701e-10,
+ 3.6656577773186427e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1259300663368776e-05,
+ 2.921965247537628e-08,
+ 2.22886100686992e-08,
+ 2.178610181147178e-08,
+ 2.1311375775212582e-08
+ ],
+ "gamma_dfa": 0.04882028384599835,
+ "acc_eval": 0.10546875,
+ "loss_eval": 13.669061660766602,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 56406.1796875,
+ 106503480.0,
+ 80309328.0,
+ 92335120.0,
+ 45272116.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.741802304257362e-08,
+ 3.5817968035978254e-10,
+ 3.546553328792612e-10,
+ 3.5286135124934503e-10,
+ 3.517087177051792e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.1156203981954604e-05,
+ 2.829144030158659e-08,
+ 2.1501875835383544e-08,
+ 2.1014004758512783e-08,
+ 2.056106396253199e-08
+ ],
+ "gamma_dfa": 0.04876198567217216,
+ "acc_eval": 0.10546875,
+ "loss_eval": 13.882933616638184,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 57307.2421875,
+ 111696136.0,
+ 84071088.0,
+ 96859240.0,
+ 47347232.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.675155527271272e-08,
+ 3.451815777655298e-10,
+ 3.4170632989827254e-10,
+ 3.399925063707343e-10,
+ 3.38884892370217e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.105228056985652e-05,
+ 2.731184522986041e-08,
+ 2.0790139387827367e-08,
+ 2.0321502702813632e-08,
+ 1.9881698065660203e-08
+ ],
+ "gamma_dfa": 0.04874728451250121,
+ "acc_eval": 0.10546875,
+ "loss_eval": 14.110960960388184,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 58201.1015625,
+ 116915912.0,
+ 88056232.0,
+ 101457736.0,
+ 49574372.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.81610304759306e-08,
+ 3.3262503862374615e-10,
+ 3.28719912401354e-10,
+ 3.270855530868033e-10,
+ 3.2694977281089166e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.09774755401304e-05,
+ 2.6502128491756594e-08,
+ 2.010280297781719e-08,
+ 1.964214924043972e-08,
+ 1.9215420365981117e-08
+ ],
+ "gamma_dfa": 0.049133426626212895,
+ "acc_eval": 0.10546875,
+ "loss_eval": 14.251358985900879,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 59057.046875,
+ 122526296.0,
+ 92035232.0,
+ 106073072.0,
+ 51524732.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.615387514510076e-08,
+ 3.1993208082781166e-10,
+ 3.1755734153371407e-10,
+ 3.1527228050443057e-10,
+ 3.1427349611590216e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0898848813667428e-05,
+ 2.5704085970801316e-08,
+ 1.941714167230657e-08,
+ 1.896907697584993e-08,
+ 1.8563016013217748e-08
+ ],
+ "gamma_dfa": 0.04926633776631206,
+ "acc_eval": 0.10546875,
+ "loss_eval": 14.543952941894531,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 59915.00390625,
+ 128059208.0,
+ 95767408.0,
+ 110314168.0,
+ 53699800.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.616160585006583e-08,
+ 3.10205972020583e-10,
+ 3.0786348470535074e-10,
+ 3.0548555352005735e-10,
+ 3.044886287550952e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0854326319531538e-05,
+ 2.4907375717475588e-08,
+ 1.8864984241417915e-08,
+ 1.8437393833892202e-08,
+ 1.8046192096221603e-08
+ ],
+ "gamma_dfa": 0.04898433407652192,
+ "acc_eval": 0.10546875,
+ "loss_eval": 14.763640403747559,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 60732.77734375,
+ 133044840.0,
+ 99449000.0,
+ 114745104.0,
+ 55794780.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.66734808369074e-08,
+ 3.0199040490508366e-10,
+ 2.984798519456433e-10,
+ 2.9689897762530393e-10,
+ 2.9609348306536276e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0869742254726589e-05,
+ 2.4187817970755532e-08,
+ 1.8320044148367742e-08,
+ 1.79040302583644e-08,
+ 1.7519981909686067e-08
+ ],
+ "gamma_dfa": 0.049695645982865244,
+ "acc_eval": 0.10546875,
+ "loss_eval": 14.853147506713867,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 61537.2265625,
+ 138238256.0,
+ 103294888.0,
+ 119079736.0,
+ 57875032.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.672164852896458e-08,
+ 2.937747545228575e-10,
+ 2.90239082767485e-10,
+ 2.8853816558260803e-10,
+ 2.880042870856414e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0855384971364401e-05,
+ 2.3642215296604263e-08,
+ 1.78662986627387e-08,
+ 1.745818423160017e-08,
+ 1.7085612924461202e-08
+ ],
+ "gamma_dfa": 0.04945674288319424,
+ "acc_eval": 0.10546875,
+ "loss_eval": 15.014139175415039,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 62318.859375,
+ 143781376.0,
+ 107295080.0,
+ 123266280.0,
+ 60009076.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.63586393506921e-08,
+ 2.853322023099736e-10,
+ 2.819139366394552e-10,
+ 2.8051430622788587e-10,
+ 2.796505249591519e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0763029422378168e-05,
+ 2.2983703829027036e-08,
+ 1.7385014317028435e-08,
+ 1.699019236411914e-08,
+ 1.662707127536578e-08
+ ],
+ "gamma_dfa": 0.04949341545579955,
+ "acc_eval": 0.10546875,
+ "loss_eval": 15.234472274780273,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 63084.12109375,
+ 148953776.0,
+ 111167488.0,
+ 127493184.0,
+ 62116584.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.690788888543466e-08,
+ 2.77830092265674e-10,
+ 2.7401189650611e-10,
+ 2.7265251167918336e-10,
+ 2.71903860538103e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0762613783299457e-05,
+ 2.2435919788676983e-08,
+ 1.6915544520657022e-08,
+ 1.65265419127536e-08,
+ 1.6172732486552377e-08
+ ],
+ "gamma_dfa": 0.04998577304650098,
+ "acc_eval": 0.10546875,
+ "loss_eval": 15.356475830078125,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 63822.42578125,
+ 153887120.0,
+ 114903200.0,
+ 131868160.0,
+ 64092768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.741512402821172e-08,
+ 2.695783041239963e-10,
+ 2.676055765871155e-10,
+ 2.6572444244976623e-10,
+ 2.649161723322635e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.07648411358241e-05,
+ 2.1865258048592295e-08,
+ 1.6514658085498013e-08,
+ 1.6137914116143293e-08,
+ 1.5790037721785666e-08
+ ],
+ "gamma_dfa": 0.050343112263362855,
+ "acc_eval": 0.10546875,
+ "loss_eval": 15.516284942626953,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 64467.453125,
+ 158904000.0,
+ 118881072.0,
+ 136114000.0,
+ 66111872.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.664627415555515e-08,
+ 2.624416239882521e-10,
+ 2.6058996627220665e-10,
+ 2.5911758849694877e-10,
+ 2.584663871818549e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0719203601183835e-05,
+ 2.1336076017064443e-08,
+ 1.6169177996516737e-08,
+ 1.5802571695644474e-08,
+ 1.546756678294514e-08
+ ],
+ "gamma_dfa": 0.04984566644998267,
+ "acc_eval": 0.10546875,
+ "loss_eval": 15.6607084274292,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 65120.73828125,
+ 163883856.0,
+ 122702472.0,
+ 140198928.0,
+ 68242560.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.641593041147644e-08,
+ 2.5804472447710225e-10,
+ 2.5353724675269973e-10,
+ 2.5259389024867573e-10,
+ 2.520264275052142e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0724111234594602e-05,
+ 2.0917026333222566e-08,
+ 1.5751618676063117e-08,
+ 1.5394757468811804e-08,
+ 1.5069018033386783e-08
+ ],
+ "gamma_dfa": 0.05030635162256658,
+ "acc_eval": 0.10546875,
+ "loss_eval": 15.901081085205078,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 65754.40625,
+ 168991232.0,
+ 126758528.0,
+ 144376592.0,
+ 70329568.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.677351104324771e-08,
+ 2.5239485501593606e-10,
+ 2.4832783052097795e-10,
+ 2.4752053184862177e-10,
+ 2.4696938938362223e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0669472430890892e-05,
+ 2.0359754770993277e-08,
+ 1.542808725218947e-08,
+ 1.5080953374990713e-08,
+ 1.4761029731857889e-08
+ ],
+ "gamma_dfa": 0.05062760764849372,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.04940414428711,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 66360.1953125,
+ 173885088.0,
+ 130550672.0,
+ 148377456.0,
+ 72298680.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.759133862668023e-08,
+ 2.4686536148621485e-10,
+ 2.4284077526637304e-10,
+ 2.4196153414202115e-10,
+ 2.414988486965086e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0671456038835458e-05,
+ 1.9936877038162493e-08,
+ 1.5118750695819472e-08,
+ 1.4775524803667395e-08,
+ 1.4458762187530283e-08
+ ],
+ "gamma_dfa": 0.050650376273551956,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.173294067382812,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 66955.3671875,
+ 179032416.0,
+ 134152312.0,
+ 152335472.0,
+ 74150016.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.732155265533947e-08,
+ 2.4187768454808634e-10,
+ 2.378792995916257e-10,
+ 2.3684243455335263e-10,
+ 2.3630350454162397e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0680658306227997e-05,
+ 1.9686593688561516e-08,
+ 1.484478495683561e-08,
+ 1.4507179457723396e-08,
+ 1.4196978703751029e-08
+ ],
+ "gamma_dfa": 0.05082969422801398,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.27086639404297,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 67549.515625,
+ 183555840.0,
+ 137880064.0,
+ 156240624.0,
+ 75989536.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.660003913973924e-08,
+ 2.357370687544602e-10,
+ 2.33779245961685e-10,
+ 2.3301963136823645e-10,
+ 2.3250262826124413e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0663774446584284e-05,
+ 1.9352745184164633e-08,
+ 1.4566153616613065e-08,
+ 1.423444206949398e-08,
+ 1.3932280218398319e-08
+ ],
+ "gamma_dfa": 0.05084921311936341,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.451187133789062,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 68104.8046875,
+ 188812128.0,
+ 141342304.0,
+ 160268688.0,
+ 77916768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.660642691893372e-08,
+ 2.327093101550659e-10,
+ 2.2930106424734475e-10,
+ 2.2855875525529257e-10,
+ 2.2804760857475515e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0613769518386107e-05,
+ 1.899090662504932e-08,
+ 1.4301366313418384e-08,
+ 1.3975586021786057e-08,
+ 1.3677930787991954e-08
+ ],
+ "gamma_dfa": 0.05096889057313092,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.63678741455078,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 68657.515625,
+ 193258416.0,
+ 144614160.0,
+ 164019216.0,
+ 79742168.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.68742304760417e-08,
+ 2.289267664323802e-10,
+ 2.2474513916570515e-10,
+ 2.2393865928282963e-10,
+ 2.2451285275337796e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0620946341077797e-05,
+ 1.866202836708908e-08,
+ 1.4068830544999855e-08,
+ 1.3749051674949442e-08,
+ 1.3455515812665908e-08
+ ],
+ "gamma_dfa": 0.05113464401802048,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.70541763305664,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 69158.5,
+ 197991056.0,
+ 148074896.0,
+ 168001296.0,
+ 81613432.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.685481134307338e-08,
+ 2.244555652453073e-10,
+ 2.21766327523909e-10,
+ 2.2105835217889336e-10,
+ 2.2056727277952604e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0557047062320635e-05,
+ 1.836115792741566e-08,
+ 1.3819986932617212e-08,
+ 1.35067770301589e-08,
+ 1.3220035732786073e-08
+ ],
+ "gamma_dfa": 0.05133810767438263,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.83820915222168,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 69652.15625,
+ 202764272.0,
+ 151440416.0,
+ 171388720.0,
+ 83290960.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.682473406906865e-08,
+ 2.209017690990578e-10,
+ 2.178418834208884e-10,
+ 2.1715784725984122e-10,
+ 2.166662266267494e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0563057912804652e-05,
+ 1.8060584139334424e-08,
+ 1.3589187553009197e-08,
+ 1.3282591027063972e-08,
+ 1.300101715173696e-08
+ ],
+ "gamma_dfa": 0.051503602182492614,
+ "acc_eval": 0.10546875,
+ "loss_eval": 16.996952056884766,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 70119.3046875,
+ 207371568.0,
+ 154513392.0,
+ 174693904.0,
+ 84899272.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.754268776556273e-08,
+ 2.177768798627966e-10,
+ 2.1394505611560533e-10,
+ 2.1310755937697934e-10,
+ 2.1278181994155432e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0583677067188546e-05,
+ 1.7867773038915402e-08,
+ 1.3404712007059061e-08,
+ 1.3099571205543725e-08,
+ 1.281919193019121e-08
+ ],
+ "gamma_dfa": 0.05178222866379656,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.03223419189453,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 70571.765625,
+ 211695824.0,
+ 157515872.0,
+ 178129360.0,
+ 86545024.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.717323396467691e-08,
+ 2.1452814524813846e-10,
+ 2.1192504695566328e-10,
+ 2.1126832228102188e-10,
+ 2.1079131495849168e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0588292752800044e-05,
+ 1.7631437643217396e-08,
+ 1.3229322526342457e-08,
+ 1.2929083581525447e-08,
+ 1.2654436609693676e-08
+ ],
+ "gamma_dfa": 0.0517645905201789,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.17680549621582,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 71016.2734375,
+ 216131392.0,
+ 160371248.0,
+ 181552016.0,
+ 88083200.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.714041399571215e-08,
+ 2.1204836497812352e-10,
+ 2.0845919435075189e-10,
+ 2.0772163156212997e-10,
+ 2.0731850958188858e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0558523172221612e-05,
+ 1.7396088125565257e-08,
+ 1.3074124005640897e-08,
+ 1.2776619762178143e-08,
+ 1.2503839741384581e-08
+ ],
+ "gamma_dfa": 0.05190763485734351,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.230438232421875,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 71423.875,
+ 220276432.0,
+ 163188992.0,
+ 184901952.0,
+ 89669880.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.695663922253516e-08,
+ 2.089625000811779e-10,
+ 2.0665336109004784e-10,
+ 2.060027565198297e-10,
+ 2.0553812818402406e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.054474341799505e-05,
+ 1.720214015676902e-08,
+ 1.2905923441053346e-08,
+ 1.2612286326429967e-08,
+ 1.2343328137376375e-08
+ ],
+ "gamma_dfa": 0.0516790475230664,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.364524841308594,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 71819.7265625,
+ 224240896.0,
+ 165905760.0,
+ 188025680.0,
+ 91055744.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.707031184940206e-08,
+ 2.0619655982656582e-10,
+ 2.0404426759323968e-10,
+ 2.0340489015335805e-10,
+ 2.0294699254463922e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0510210813663434e-05,
+ 1.6987915074651028e-08,
+ 1.2752495948120668e-08,
+ 1.2462213483388496e-08,
+ 1.2196251120144552e-08
+ ],
+ "gamma_dfa": 0.05187035645940341,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.464691162109375,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 72184.1796875,
+ 228069632.0,
+ 168371744.0,
+ 190844528.0,
+ 92434920.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.708528298484453e-08,
+ 2.0398974176494278e-10,
+ 2.0165806524641283e-10,
+ 2.0102944309208226e-10,
+ 2.0057676353157916e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0452381502545904e-05,
+ 1.678668404281325e-08,
+ 1.2599208787378302e-08,
+ 1.2311685892996138e-08,
+ 1.2049306441497265e-08
+ ],
+ "gamma_dfa": 0.052035300293937325,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.54598045349121,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 72520.546875,
+ 231382032.0,
+ 170794656.0,
+ 193581264.0,
+ 93730880.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.673346485466027e-08,
+ 2.0163908043269174e-10,
+ 1.9945969875756475e-10,
+ 1.988337966496445e-10,
+ 1.983077452250015e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.041769064613618e-05,
+ 1.6600257168875032e-08,
+ 1.2470060539726546e-08,
+ 1.218627776466974e-08,
+ 1.1927684617774048e-08
+ ],
+ "gamma_dfa": 0.052122256805887446,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.622678756713867,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 72848.296875,
+ 234345168.0,
+ 172920208.0,
+ 196159376.0,
+ 94861664.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.68633378559025e-08,
+ 1.9926535421710412e-10,
+ 1.9748097601635095e-10,
+ 1.9686471897095714e-10,
+ 1.9632170888961298e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0410145478090271e-05,
+ 1.6476832342959824e-08,
+ 1.2349259392863132e-08,
+ 1.2067844501473246e-08,
+ 1.1810766586961563e-08
+ ],
+ "gamma_dfa": 0.05221144680399448,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.67215347290039,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 73156.28125,
+ 237693904.0,
+ 175292576.0,
+ 198663152.0,
+ 96070024.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.698025766307182e-08,
+ 1.9732028511132427e-10,
+ 1.9561376130017294e-10,
+ 1.950042072262903e-10,
+ 1.9452565946931344e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0408021807961632e-05,
+ 1.6299335214853272e-08,
+ 1.224471191108023e-08,
+ 1.1966841739763368e-08,
+ 1.1711744463127616e-08
+ ],
+ "gamma_dfa": 0.05207514451467432,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.708881378173828,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 73450.0390625,
+ 240668752.0,
+ 177333776.0,
+ 200832576.0,
+ 97232808.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.750691904424457e-08,
+ 1.9538150264342136e-10,
+ 1.937518478989375e-10,
+ 1.9322175803804242e-10,
+ 1.9261021944050327e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0387684596935287e-05,
+ 1.614511546677022e-08,
+ 1.2127667758932148e-08,
+ 1.1853135362116518e-08,
+ 1.1600380211973516e-08
+ ],
+ "gamma_dfa": 0.052143561391858384,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.803735733032227,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 73722.7890625,
+ 243140912.0,
+ 179223280.0,
+ 203119056.0,
+ 98179728.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.777691107297869e-08,
+ 1.936056454043822e-10,
+ 1.921051789866013e-10,
+ 1.9142704088537243e-10,
+ 1.908224411817372e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0383127118984703e-05,
+ 1.6032700500545616e-08,
+ 1.2034083063383605e-08,
+ 1.1761529528087067e-08,
+ 1.1511005482134351e-08
+ ],
+ "gamma_dfa": 0.0522310700325761,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.871017456054688,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 73977.796875,
+ 245601744.0,
+ 181134272.0,
+ 205298592.0,
+ 99248704.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.645526605732812e-08,
+ 1.9214441149273398e-10,
+ 1.908457003541031e-10,
+ 1.8958104530675257e-10,
+ 1.891580642121582e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0368045877839904e-05,
+ 1.593527443333187e-08,
+ 1.1956020173897741e-08,
+ 1.1683961353980976e-08,
+ 1.1433988866826894e-08
+ ],
+ "gamma_dfa": 0.05229719865019433,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.842838287353516,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 74210.2890625,
+ 248047296.0,
+ 183004848.0,
+ 207310784.0,
+ 100283200.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.702664189286224e-08,
+ 1.9067503131964259e-10,
+ 1.8910681354178394e-10,
+ 1.886194395117613e-10,
+ 1.8805811075051082e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0340887456550263e-05,
+ 1.5766524086302525e-08,
+ 1.1852850256843794e-08,
+ 1.1584752712678892e-08,
+ 1.1337309757664116e-08
+ ],
+ "gamma_dfa": 0.05227879187441431,
+ "acc_eval": 0.10546875,
+ "loss_eval": 17.977331161499023,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 74442.2578125,
+ 250302768.0,
+ 184669344.0,
+ 209343920.0,
+ 101168016.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.73824319569394e-08,
+ 1.8929384448806985e-10,
+ 1.8772923493504123e-10,
+ 1.8724671813075133e-10,
+ 1.8670247292629227e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0353242942073848e-05,
+ 1.5672505071506748e-08,
+ 1.1772779195950989e-08,
+ 1.1506068098299238e-08,
+ 1.1260493870679511e-08
+ ],
+ "gamma_dfa": 0.05237349838716909,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.03546905517578,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 74647.3203125,
+ 252406032.0,
+ 186061376.0,
+ 211037200.0,
+ 101960680.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.6925361131307e-08,
+ 1.881417382998407e-10,
+ 1.867033888602876e-10,
+ 1.8579758565007154e-10,
+ 1.8538144630486642e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0341693268856034e-05,
+ 1.5606824277369924e-08,
+ 1.1714643477489517e-08,
+ 1.1449987624700952e-08,
+ 1.1205665728653003e-08
+ ],
+ "gamma_dfa": 0.05233656561176758,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.052072525024414,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 74842.0859375,
+ 254511632.0,
+ 187492928.0,
+ 212704224.0,
+ 102757816.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.698394537987042e-08,
+ 1.8709332694211156e-10,
+ 1.8572142435058225e-10,
+ 1.8484298813792321e-10,
+ 1.8442962435027965e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0342246241634712e-05,
+ 1.552284167871676e-08,
+ 1.1652745435242196e-08,
+ 1.1389352572166445e-08,
+ 1.114572434346428e-08
+ ],
+ "gamma_dfa": 0.05241188171203248,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.086322784423828,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 75024.015625,
+ 256539408.0,
+ 188878192.0,
+ 214226816.0,
+ 103471288.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.701635323404844e-08,
+ 1.8604462415083844e-10,
+ 1.84622400700718e-10,
+ 1.8390608480522985e-10,
+ 1.834675189549273e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.032539876177907e-05,
+ 1.5453247570462736e-08,
+ 1.1593147775101897e-08,
+ 1.133172844447472e-08,
+ 1.1090729223894868e-08
+ ],
+ "gamma_dfa": 0.05239276264910586,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.168014526367188,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 75180.9609375,
+ 258451104.0,
+ 190004976.0,
+ 215740128.0,
+ 104133768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.704767395784074e-08,
+ 1.8524454192814233e-10,
+ 1.8379993360628788e-10,
+ 1.8304618931708205e-10,
+ 1.8256345046818723e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0337872481613886e-05,
+ 1.5379262308101715e-08,
+ 1.1539456501452605e-08,
+ 1.127898041630715e-08,
+ 1.103767743870776e-08
+ ],
+ "gamma_dfa": 0.052515600953483954,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.164344787597656,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 75327.796875,
+ 260127200.0,
+ 191027072.0,
+ 216985472.0,
+ 104684240.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.744654422798703e-08,
+ 1.8438454929547987e-10,
+ 1.8290086112315862e-10,
+ 1.8214722785625526e-10,
+ 1.8167076176744956e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.032766067510238e-05,
+ 1.5304989275932712e-08,
+ 1.14842633180956e-08,
+ 1.122501380734775e-08,
+ 1.098510349351045e-08
+ ],
+ "gamma_dfa": 0.05257981286558788,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.223249435424805,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 75454.5703125,
+ 261646176.0,
+ 192111600.0,
+ 218110816.0,
+ 105216432.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.775589321885491e-08,
+ 1.8362063258781092e-10,
+ 1.8213851260551195e-10,
+ 1.8139376112280559e-10,
+ 1.809180305567537e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.032176169246668e-05,
+ 1.5236809147722852e-08,
+ 1.1438899605309416e-08,
+ 1.1181004566651609e-08,
+ 1.0941747952131209e-08
+ ],
+ "gamma_dfa": 0.052668574411654845,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.2590389251709,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 75578.140625,
+ 263041184.0,
+ 193033856.0,
+ 219211776.0,
+ 105729752.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.755376512681323e-08,
+ 1.830409435132907e-10,
+ 1.8150429770269483e-10,
+ 1.807565902511854e-10,
+ 1.8044568617092693e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0324319191568065e-05,
+ 1.5187332280675037e-08,
+ 1.1401711574876572e-08,
+ 1.1144490663639317e-08,
+ 1.0905955249995714e-08
+ ],
+ "gamma_dfa": 0.05269488821795676,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.284685134887695,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 75686.9765625,
+ 264364192.0,
+ 193939856.0,
+ 220289456.0,
+ 106222280.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.723260691567702e-08,
+ 1.8233220488994561e-10,
+ 1.808086180776769e-10,
+ 1.8018871117408963e-10,
+ 1.7971832355634376e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0300875146640465e-05,
+ 1.5149137055914252e-08,
+ 1.1367639274340036e-08,
+ 1.1110781628076438e-08,
+ 1.0873751676854226e-08
+ ],
+ "gamma_dfa": 0.05262827526894398,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.32525634765625,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 75782.5703125,
+ 265506368.0,
+ 194623696.0,
+ 221062096.0,
+ 106625800.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.738180667933193e-08,
+ 1.8182351457785018e-10,
+ 1.8023170456071824e-10,
+ 1.796851972768465e-10,
+ 1.7919579708980393e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0303671842848416e-05,
+ 1.510927916115179e-08,
+ 1.133329874392075e-08,
+ 1.107721647741755e-08,
+ 1.0840857100902213e-08
+ ],
+ "gamma_dfa": 0.0526832842733711,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.358993530273438,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 75869.921875,
+ 266527792.0,
+ 195260000.0,
+ 221772592.0,
+ 107003056.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.824529373896439e-08,
+ 1.8133940182796238e-10,
+ 1.7974224886252443e-10,
+ 1.7921185369029757e-10,
+ 1.7870449564583168e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0309514436812606e-05,
+ 1.506138680440472e-08,
+ 1.129713478320582e-08,
+ 1.1042018854823255e-08,
+ 1.080576872425354e-08
+ ],
+ "gamma_dfa": 0.052798322300077416,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.391273498535156,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 75944.28125,
+ 267298400.0,
+ 195821152.0,
+ 222463360.0,
+ 107333864.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.755981895092191e-08,
+ 1.8102987164869688e-10,
+ 1.793504234015586e-10,
+ 1.788625914045383e-10,
+ 1.7835513621555776e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0287751138093881e-05,
+ 1.502210977832874e-08,
+ 1.1278022071792293e-08,
+ 1.1023718826663753e-08,
+ 1.0788149040763528e-08
+ ],
+ "gamma_dfa": 0.05272912958753295,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.391714096069336,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 76007.421875,
+ 268045776.0,
+ 196358640.0,
+ 223064400.0,
+ 107612040.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.762406622508934e-08,
+ 1.807102384399073e-10,
+ 1.7898976745200912e-10,
+ 1.785393638487065e-10,
+ 1.7802226359719953e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0287554687238298e-05,
+ 1.4994483876762388e-08,
+ 1.1257166754319314e-08,
+ 1.1003281841226453e-08,
+ 1.0768073543943046e-08
+ ],
+ "gamma_dfa": 0.052773734016227536,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.410842895507812,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 76064.7109375,
+ 268696256.0,
+ 196819616.0,
+ 223570480.0,
+ 107852768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.758166814004653e-08,
+ 1.8037309146290426e-10,
+ 1.7866680357414566e-10,
+ 1.782173991715652e-10,
+ 1.7768413129726213e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0283758456353098e-05,
+ 1.4970940043212977e-08,
+ 1.1237919927964413e-08,
+ 1.0984368081778939e-08,
+ 1.0749558576605978e-08
+ ],
+ "gamma_dfa": 0.05277359033061657,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.423473358154297,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 76113.765625,
+ 269233728.0,
+ 197204896.0,
+ 224016384.0,
+ 108068584.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.767738535198077e-08,
+ 1.800838783649894e-10,
+ 1.7838196197939027e-10,
+ 1.7793383433328813e-10,
+ 1.7738220614571532e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0285043572366703e-05,
+ 1.4949996796076448e-08,
+ 1.1221012563567001e-08,
+ 1.096789947752086e-08,
+ 1.0733534949736168e-08
+ ],
+ "gamma_dfa": 0.05277923475659918,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.44818878173828,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 76154.09375,
+ 269669792.0,
+ 197538960.0,
+ 224391824.0,
+ 108235960.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.767518266949992e-08,
+ 1.7989677802976445e-10,
+ 1.7819240527572333e-10,
+ 1.777451658080409e-10,
+ 1.771848640030882e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.029091072268784e-05,
+ 1.4940461312562547e-08,
+ 1.1209391637123645e-08,
+ 1.0956426876873593e-08,
+ 1.0722061460910481e-08
+ ],
+ "gamma_dfa": 0.05281960548018105,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.45142364501953,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 76187.59375,
+ 270051616.0,
+ 197844384.0,
+ 224727824.0,
+ 108387672.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.763404224509941e-08,
+ 1.7972098809160286e-10,
+ 1.780089131653284e-10,
+ 1.7756210390906801e-10,
+ 1.7699951226912702e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0288421435689088e-05,
+ 1.4926607505572065e-08,
+ 1.1199507987669222e-08,
+ 1.0946849648973966e-08,
+ 1.0712753351072024e-08
+ ],
+ "gamma_dfa": 0.05281454947544262,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.456693649291992,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 76216.3125,
+ 270347840.0,
+ 198067872.0,
+ 225002016.0,
+ 108500144.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.769242754169682e-08,
+ 1.795031345785958e-10,
+ 1.7781580374798267e-10,
+ 1.773555469153365e-10,
+ 1.7679230301936855e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0288722478435375e-05,
+ 1.4910959578173788e-08,
+ 1.1187878179441668e-08,
+ 1.0935604422002143e-08,
+ 1.070183497375865e-08
+ ],
+ "gamma_dfa": 0.052812248992267996,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.479557037353516,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 76238.2890625,
+ 270583392.0,
+ 198231920.0,
+ 225197232.0,
+ 108588960.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.765692172119088e-08,
+ 1.794125820131498e-10,
+ 1.7771174809499968e-10,
+ 1.7726634049530787e-10,
+ 1.7670596930141613e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0287496479577385e-05,
+ 1.490491285949247e-08,
+ 1.1181702674889493e-08,
+ 1.0929432470163647e-08,
+ 1.0695790031434171e-08
+ ],
+ "gamma_dfa": 0.052826936458586715,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.482463836669922,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 76254.984375,
+ 270769600.0,
+ 198360864.0,
+ 225341792.0,
+ 108654560.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.761775660559579e-08,
+ 1.7933368678946238e-10,
+ 1.776363084404764e-10,
+ 1.7719105349645048e-10,
+ 1.766297247352e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0286962606187444e-05,
+ 1.4897207911701571e-08,
+ 1.1177347936097703e-08,
+ 1.0925224280811108e-08,
+ 1.0691623586467358e-08
+ ],
+ "gamma_dfa": 0.052814016249612905,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.48452377319336,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 76267.0,
+ 270906656.0,
+ 198453952.0,
+ 225448800.0,
+ 108703144.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.761757186448449e-08,
+ 1.792699738656367e-10,
+ 1.7757639803051006e-10,
+ 1.771305185860328e-10,
+ 1.7656787143494057e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0286720680596773e-05,
+ 1.4893439370666783e-08,
+ 1.1173768577066312e-08,
+ 1.0921708870625935e-08,
+ 1.0688168572414725e-08
+ ],
+ "gamma_dfa": 0.05281054192164447,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.48675537109375,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 76274.53125,
+ 270996800.0,
+ 198521872.0,
+ 225534016.0,
+ 108737184.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.757600511444252e-08,
+ 1.7921109041196814e-10,
+ 1.7751719538772193e-10,
+ 1.7707224575502778e-10,
+ 1.7651151373865304e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0285029929946177e-05,
+ 1.4889327104583572e-08,
+ 1.1170673275273657e-08,
+ 1.09186730767874e-08,
+ 1.0685286433442798e-08
+ ],
+ "gamma_dfa": 0.052804862934863195,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.492807388305664,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 76278.6171875,
+ 271041184.0,
+ 198554096.0,
+ 225570960.0,
+ 108751040.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.758564717936679e-08,
+ 1.791868459166679e-10,
+ 1.7749526848298558e-10,
+ 1.770504159948061e-10,
+ 1.7648858763319453e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.028558563120896e-05,
+ 1.4887539201424715e-08,
+ 1.1169264624300013e-08,
+ 1.091728041302531e-08,
+ 1.068388577607493e-08
+ ],
+ "gamma_dfa": 0.052804886450758204,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.49222183227539,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 76282.2109375,
+ 271081440.0,
+ 198586512.0,
+ 225606800.0,
+ 108767848.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.758451741641693e-08,
+ 1.7916516881211209e-10,
+ 1.7747517344623986e-10,
+ 1.7702975196876025e-10,
+ 1.764676044180291e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.028525730362162e-05,
+ 1.488619361111887e-08,
+ 1.1168157953989066e-08,
+ 1.0916189729925918e-08,
+ 1.0682827955577068e-08
+ ],
+ "gamma_dfa": 0.05280597397359088,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.493602752685547,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 76284.046875,
+ 271101920.0,
+ 198601280.0,
+ 225624992.0,
+ 108775912.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.758536296227248e-08,
+ 1.7915657846145905e-10,
+ 1.7746643043992094e-10,
+ 1.7702135590713652e-10,
+ 1.7645920835640538e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.028511906042695e-05,
+ 1.488560208429135e-08,
+ 1.1167605507012013e-08,
+ 1.0915637282948865e-08,
+ 1.0682285278562631e-08
+ ],
+ "gamma_dfa": 0.05280651607608888,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.494029998779297,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 76284.0703125,
+ 271101952.0,
+ 198601472.0,
+ 225625280.0,
+ 108776088.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 8.758680536402608e-08,
+ 1.7915803562917887e-10,
+ 1.7746806801888226e-10,
+ 1.7702275756370511e-10,
+ 1.7646061001297397e-10
+ ],
+ "bp_grad_norms_F": [
+ 1.0285211828886531e-05,
+ 1.488571665930749e-08,
+ 1.1167688107605045e-08,
+ 1.0915716330828218e-08,
+ 1.0682358109193046e-08
+ ],
+ "gamma_dfa": 0.052806626496021636,
+ "acc_eval": 0.10546875,
+ "loss_eval": 18.493879318237305,
+ "epoch": 100
+ }
+ ]
+} \ No newline at end of file