diff options
Diffstat (limited to 'results/h2_no_residual_full_s456/snapshot_evolution_s456.json')
| -rw-r--r-- | results/h2_no_residual_full_s456/snapshot_evolution_s456.json | 2749 |
1 files changed, 2749 insertions, 0 deletions
diff --git a/results/h2_no_residual_full_s456/snapshot_evolution_s456.json b/results/h2_no_residual_full_s456/snapshot_evolution_s456.json new file mode 100644 index 0000000..4070eaa --- /dev/null +++ b/results/h2_no_residual_full_s456/snapshot_evolution_s456.json @@ -0,0 +1,2749 @@ +{ + "config": { + "output_dir": "results/h2_no_residual_full_s456", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 456, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": true, + "w2_std": 0.5, + "random_targets": false, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.696551322937012, + 42.47159957885742, + 42.67432403564453, + 45.272701263427734, + 43.449092864990234 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011182057205587626, + 0.00021166827355045825, + 0.00014748115791007876, + 0.00011803740198956802, + 0.00010102539090439677 + ], + "bp_grad_norms_F": [ + 0.039927296340465546, + 0.006882709916681051, + 0.004750067833811045, + 0.00377994985319674, + 0.0032426300458610058 + ], + "gamma_dfa": 0.012312270817346871, + "acc_eval": 0.1142578125, + "loss_eval": 2.3956005573272705, + "epoch": 0 + }, + { + "hidden_norms": [ + 1556.684814453125, + 6497.32177734375, + 10603.298828125, + 15776.048828125, + 9974.5771484375 + ], + "bp_grad_norms_per_sample_med": [ + 7.715180458944815e-07, + 4.893955178886245e-07, + 4.84326051264361e-07, + 4.838655058847507e-07, + 4.83024962250056e-07 + ], + "bp_grad_norms_F": [ + 4.703722152044065e-05, + 2.927827154053375e-05, + 2.886639595089946e-05, + 2.8710121114272624e-05, + 2.851033423212357e-05 + ], + "gamma_dfa": 0.018546399660408497, + "acc_eval": 0.111328125, + "loss_eval": 2.356113910675049, + "epoch": 1 + }, + { + "hidden_norms": [ + 3438.555908203125, + 41675.72265625, + 66460.0234375, + 84792.1875, + 42575.42578125 + ], + "bp_grad_norms_per_sample_med": [ + 2.2151462530928256e-07, + 8.604414603041732e-08, + 8.536036233408595e-08, + 8.52630037684321e-08, + 8.530036410547837e-08 + ], + "bp_grad_norms_F": [ + 1.8386168449069373e-05, + 6.961788585613249e-06, + 6.748253326804843e-06, + 6.721136742271483e-06, + 6.674351880064933e-06 + ], + "gamma_dfa": 0.017316466895863414, + "acc_eval": 0.1005859375, + "loss_eval": 2.356572151184082, + "epoch": 2 + }, + { + "hidden_norms": [ + 5372.435546875, + 121188.546875, + 174809.4375, + 203405.859375, + 95077.4609375 + ], + "bp_grad_norms_per_sample_med": [ + 1.2532444770840812e-07, + 3.495903300176906e-08, + 3.4808731896873724e-08, + 3.474917420476231e-08, + 3.4685903926856554e-08 + ], + "bp_grad_norms_F": [ + 1.1882418220920954e-05, + 2.7211688120587496e-06, + 2.6087484457093524e-06, + 2.602359927550424e-06, + 2.590174972283421e-06 + ], + "gamma_dfa": 0.014974067453294992, + "acc_eval": 0.080078125, + "loss_eval": 2.381472110748291, + "epoch": 3 + }, + { + "hidden_norms": [ + 7225.4375, + 258499.359375, + 333575.4375, + 364076.25, + 168464.5 + ], + "bp_grad_norms_per_sample_med": [ + 8.640306248253182e-08, + 1.9808053863812347e-08, + 1.9682946827970227e-08, + 1.9666908102067282e-08, + 1.967319640527876e-08 + ], + "bp_grad_norms_F": [ + 1.1042752703360748e-05, + 1.5015855296951486e-06, + 1.3234410971563193e-06, + 1.3206722542236093e-06, + 1.314130940954783e-06 + ], + "gamma_dfa": 0.020775633631274104, + "acc_eval": 0.0654296875, + "loss_eval": 2.458400249481201, + "epoch": 4 + }, + { + "hidden_norms": [ + 8934.6435546875, + 470048.6875, + 549725.375, + 586957.8125, + 270350.28125 + ], + "bp_grad_norms_per_sample_med": [ + 7.15417982632971e-08, + 1.303753727199819e-08, + 1.2938533799911056e-08, + 1.2922544811999614e-08, + 1.2902905410783205e-08 + ], + "bp_grad_norms_F": [ + 9.721887181513011e-06, + 9.336578727925371e-07, + 8.095747716652113e-07, + 8.079554731921235e-07, + 8.037279712880263e-07 + ], + "gamma_dfa": 0.023886571638286114, + "acc_eval": 0.0732421875, + "loss_eval": 2.553205966949463, + "epoch": 5 + }, + { + "hidden_norms": [ + 10581.7958984375, + 749584.4375, + 812141.0, + 857193.1875, + 400190.71875 + ], + "bp_grad_norms_per_sample_med": [ + 6.321820222865426e-08, + 9.664934630393418e-09, + 9.634317343909515e-09, + 9.620791274755902e-09, + 9.613222218263218e-09 + ], + "bp_grad_norms_F": [ + 7.260930487973383e-06, + 5.95286962834507e-07, + 5.624330583486881e-07, + 5.61392937470373e-07, + 5.576875423685124e-07 + ], + "gamma_dfa": 0.024110323167406023, + "acc_eval": 0.1064453125, + "loss_eval": 2.702815532684326, + "epoch": 6 + }, + { + "hidden_norms": [ + 12157.236328125, + 1101113.5, + 1131608.625, + 1175579.75, + 556328.5625 + ], + "bp_grad_norms_per_sample_med": [ + 6.076628977780274e-08, + 7.990832884274823e-09, + 7.954333192117247e-09, + 7.956207248582814e-09, + 7.94490695454897e-09 + ], + "bp_grad_norms_F": [ + 9.092925211007241e-06, + 4.779853952641133e-07, + 4.453321764685825e-07, + 4.4446503011386085e-07, + 4.4091100903642655e-07 + ], + "gamma_dfa": 0.029227681923657656, + "acc_eval": 0.1123046875, + "loss_eval": 2.943108558654785, + "epoch": 7 + }, + { + "hidden_norms": [ + 13644.7734375, + 1553127.5, + 1514848.5, + 1594542.125, + 760487.4375 + ], + "bp_grad_norms_per_sample_med": [ + 6.183345391264083e-08, + 6.574770061718027e-09, + 6.521708506568302e-09, + 6.522410611609075e-09, + 6.511657879570976e-09 + ], + "bp_grad_norms_F": [ + 1.052718380378792e-05, + 3.7946443853797973e-07, + 3.55582386646347e-07, + 3.546880407157005e-07, + 3.51142261934001e-07 + ], + "gamma_dfa": 0.031233762740157545, + "acc_eval": 0.115234375, + "loss_eval": 3.18121600151062, + "epoch": 8 + }, + { + "hidden_norms": [ + 15180.75, + 2118332.5, + 1971916.0, + 2126576.75, + 1010951.875 + ], + "bp_grad_norms_per_sample_med": [ + 6.837856147967614e-08, + 5.575389039336187e-09, + 5.5562221490390584e-09, + 5.548445258796164e-09, + 5.536703984176938e-09 + ], + "bp_grad_norms_F": [ + 1.100128883990692e-05, + 3.2698190466362576e-07, + 3.031300082056987e-07, + 3.0168610010150587e-07, + 2.9835959480806196e-07 + ], + "gamma_dfa": 0.03483391250483692, + "acc_eval": 0.1162109375, + "loss_eval": 3.5671467781066895, + "epoch": 9 + }, + { + "hidden_norms": [ + 16599.55078125, + 2766443.75, + 2507868.5, + 2746855.25, + 1307418.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.16296781888559e-08, + 4.753268889601259e-09, + 4.731485869768903e-09, + 4.728840874435036e-09, + 4.7213348786101506e-09 + ], + "bp_grad_norms_F": [ + 1.1134686246805359e-05, + 2.7916473754885374e-07, + 2.561137080192566e-07, + 2.54354034723292e-07, + 2.5102386302933155e-07 + ], + "gamma_dfa": 0.04032926296349615, + "acc_eval": 0.115234375, + "loss_eval": 3.8605642318725586, + "epoch": 10 + }, + { + "hidden_norms": [ + 18096.76171875, + 3487919.0, + 3098858.25, + 3488545.25, + 1643380.75 + ], + "bp_grad_norms_per_sample_med": [ + 7.39422816309343e-08, + 4.142685749997099e-09, + 4.12689660223009e-09, + 4.106536444226094e-09, + 4.097727934748718e-09 + ], + "bp_grad_norms_F": [ + 1.2028808669128921e-05, + 2.466808268763998e-07, + 2.2443308012043417e-07, + 2.2274194577676099e-07, + 2.1958824447665393e-07 + ], + "gamma_dfa": 0.04084749217145145, + "acc_eval": 0.1162109375, + "loss_eval": 4.266114234924316, + "epoch": 11 + }, + { + "hidden_norms": [ + 19581.2265625, + 4300652.5, + 3764740.75, + 4282907.0, + 2046749.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.486859487926267e-08, + 3.5559581945676655e-09, + 3.521152702745667e-09, + 3.5090488292865984e-09, + 3.507678369985001e-09 + ], + "bp_grad_norms_F": [ + 1.1329559129080735e-05, + 2.097379336873928e-07, + 1.916048546490856e-07, + 1.900083077543968e-07, + 1.8724767869571224e-07 + ], + "gamma_dfa": 0.041128118813503534, + "acc_eval": 0.1123046875, + "loss_eval": 4.545563220977783, + "epoch": 12 + }, + { + "hidden_norms": [ + 21009.037109375, + 5305093.0, + 4626911.0, + 5321710.0, + 2528971.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.575832938755411e-08, + 3.0991811339475817e-09, + 3.0681037710422743e-09, + 3.060007136568288e-09, + 3.054509534194949e-09 + ], + "bp_grad_norms_F": [ + 1.31506558318506e-05, + 1.8260404033298983e-07, + 1.6721619999771065e-07, + 1.6574335859331768e-07, + 1.6327113883107813e-07 + ], + "gamma_dfa": 0.04362456756643951, + "acc_eval": 0.1142578125, + "loss_eval": 5.006200790405273, + "epoch": 13 + }, + { + "hidden_norms": [ + 22418.66015625, + 6455876.5, + 5546792.0, + 6434348.0, + 3069372.75 + ], + "bp_grad_norms_per_sample_med": [ + 7.665693146918784e-08, + 2.6803985697654298e-09, + 2.6608955039364446e-09, + 2.655886177649336e-09, + 2.650993424779813e-09 + ], + "bp_grad_norms_F": [ + 1.1598707715165801e-05, + 1.584767090889727e-07, + 1.4540981396748975e-07, + 1.442050745481538e-07, + 1.419812747371907e-07 + ], + "gamma_dfa": 0.043382189120166004, + "acc_eval": 0.115234375, + "loss_eval": 5.284748077392578, + "epoch": 14 + }, + { + "hidden_norms": [ + 23927.9296875, + 7772545.0, + 6605308.0, + 7661779.0, + 3671957.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.622067954571321e-08, + 2.3548620831093103e-09, + 2.3399049364769553e-09, + 2.3347188626843263e-09, + 2.3328083909035513e-09 + ], + "bp_grad_norms_F": [ + 1.2071202945662662e-05, + 1.4146635862744006e-07, + 1.285337845047252e-07, + 1.2724865428026533e-07, + 1.2524400005986536e-07 + ], + "gamma_dfa": 0.045932179084047675, + "acc_eval": 0.1123046875, + "loss_eval": 5.692019462585449, + "epoch": 15 + }, + { + "hidden_norms": [ + 25385.748046875, + 9261487.0, + 7775942.0, + 8990953.0, + 4363130.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.712851868291182e-08, + 2.1066282052117913e-09, + 2.0846218085068813e-09, + 2.0782020548892888e-09, + 2.0737342953935922e-09 + ], + "bp_grad_norms_F": [ + 1.4093741810938809e-05, + 1.278412895544534e-07, + 1.1472226901787508e-07, + 1.1351045259289094e-07, + 1.1163785273993199e-07 + ], + "gamma_dfa": 0.04430226338445209, + "acc_eval": 0.1103515625, + "loss_eval": 6.133723258972168, + "epoch": 16 + }, + { + "hidden_norms": [ + 26846.431640625, + 10875826.0, + 9052473.0, + 10511219.0, + 5116002.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.701503079715621e-08, + 1.8753321118225585e-09, + 1.861700571481606e-09, + 1.8542083424222255e-09, + 1.8551130631649926e-09 + ], + "bp_grad_norms_F": [ + 1.3089967978885397e-05, + 1.156644771072024e-07, + 1.0296086117023151e-07, + 1.0183324405943495e-07, + 1.0014894513687977e-07 + ], + "gamma_dfa": 0.04534357553347945, + "acc_eval": 0.103515625, + "loss_eval": 6.548648834228516, + "epoch": 17 + }, + { + "hidden_norms": [ + 28266.26953125, + 12742770.0, + 10505442.0, + 12262496.0, + 5946980.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.75791733076403e-08, + 1.6816592562918231e-09, + 1.6644484679417815e-09, + 1.662164628157825e-09, + 1.6569644545327833e-09 + ], + "bp_grad_norms_F": [ + 1.3716629837290384e-05, + 1.0489808488500785e-07, + 9.319560234644086e-08, + 9.210800300252231e-08, + 9.0522433993101e-08 + ], + "gamma_dfa": 0.04543712313170545, + "acc_eval": 0.0859375, + "loss_eval": 6.933040618896484, + "epoch": 18 + }, + { + "hidden_norms": [ + 29640.484375, + 14788877.0, + 12157201.0, + 14095277.0, + 6799392.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.606816865290966e-08, + 1.512424963046044e-09, + 1.495692236730406e-09, + 1.4903339673466576e-09, + 1.4848139384682213e-09 + ], + "bp_grad_norms_F": [ + 1.3458115063258447e-05, + 9.697606628833455e-08, + 8.518442484728439e-08, + 8.402660256479066e-08, + 8.255508987531357e-08 + ], + "gamma_dfa": 0.044778631010558456, + "acc_eval": 0.076171875, + "loss_eval": 7.425451278686523, + "epoch": 19 + }, + { + "hidden_norms": [ + 31005.751953125, + 17043824.0, + 13942765.0, + 16095532.0, + 7803190.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.645277122492189e-08, + 1.3731507042535895e-09, + 1.3549177335647755e-09, + 1.3525375264222816e-09, + 1.3489699357549512e-09 + ], + "bp_grad_norms_F": [ + 1.2845624951296486e-05, + 8.864368084005037e-08, + 7.73182620150692e-08, + 7.621348885322732e-08, + 7.483793496021462e-08 + ], + "gamma_dfa": 0.045761530549498275, + "acc_eval": 0.080078125, + "loss_eval": 7.776348114013672, + "epoch": 20 + }, + { + "hidden_norms": [ + 32358.83984375, + 19344688.0, + 15897992.0, + 18375228.0, + 8836651.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.644052146815739e-08, + 1.2519073555594673e-09, + 1.235606394978106e-09, + 1.2283364325682555e-09, + 1.2260956694376546e-09 + ], + "bp_grad_norms_F": [ + 1.3093407687847503e-05, + 8.157029185440479e-08, + 7.093318998840914e-08, + 6.988454259726495e-08, + 6.859116297164292e-08 + ], + "gamma_dfa": 0.04580485462793149, + "acc_eval": 0.0927734375, + "loss_eval": 8.182464599609375, + "epoch": 21 + }, + { + "hidden_norms": [ + 33740.52734375, + 21987014.0, + 17933020.0, + 20700014.0, + 9927617.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.858014328121499e-08, + 1.141782890456966e-09, + 1.131721383273998e-09, + 1.1269319921680676e-09, + 1.1228904472915247e-09 + ], + "bp_grad_norms_F": [ + 1.2902617527288385e-05, + 7.599386009360387e-08, + 6.517191053490023e-08, + 6.410991915117847e-08, + 6.290429155342281e-08 + ], + "gamma_dfa": 0.046245397155871615, + "acc_eval": 0.1044921875, + "loss_eval": 8.578572273254395, + "epoch": 22 + }, + { + "hidden_norms": [ + 35055.48828125, + 24700796.0, + 20204280.0, + 23173254.0, + 11098732.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.840032623107618e-08, + 1.054925813370744e-09, + 1.0381229209599496e-09, + 1.033837571107199e-09, + 1.0320241328187763e-09 + ], + "bp_grad_norms_F": [ + 1.3013632269576192e-05, + 7.11033791844784e-08, + 6.033156552121e-08, + 5.929242519187028e-08, + 5.8144280501437606e-08 + ], + "gamma_dfa": 0.04646674945252016, + "acc_eval": 0.10546875, + "loss_eval": 8.944098472595215, + "epoch": 23 + }, + { + "hidden_norms": [ + 36405.48046875, + 27759312.0, + 22467726.0, + 25750832.0, + 12358187.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.77747288793762e-08, + 9.745112494741193e-10, + 9.61777768537786e-10, + 9.57246060195871e-10, + 9.547377333163354e-10 + ], + "bp_grad_norms_F": [ + 1.3124400538799819e-05, + 6.744348723941584e-08, + 5.6144159543691785e-08, + 5.510578660050669e-08, + 5.4037375463167336e-08 + ], + "gamma_dfa": 0.04619356358307414, + "acc_eval": 0.10546875, + "loss_eval": 9.376721382141113, + "epoch": 24 + }, + { + "hidden_norms": [ + 37680.57421875, + 30906478.0, + 24827362.0, + 28558372.0, + 13662978.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.0997551776818e-08, + 9.035370229781847e-10, + 8.898414227687113e-10, + 8.862885980676083e-10, + 8.829543207689028e-10 + ], + "bp_grad_norms_F": [ + 1.3445563126879279e-05, + 6.41164845660569e-08, + 5.240685041485449e-08, + 5.135610692263981e-08, + 5.02956822856504e-08 + ], + "gamma_dfa": 0.046825854369672015, + "acc_eval": 0.10546875, + "loss_eval": 9.577943801879883, + "epoch": 25 + }, + { + "hidden_norms": [ + 38936.06640625, + 34144420.0, + 27240194.0, + 31329912.0, + 14997002.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.190059475055023e-08, + 8.378591709323757e-10, + 8.267845297282861e-10, + 8.228125403242359e-10, + 8.203847046139856e-10 + ], + "bp_grad_norms_F": [ + 1.2998734746361151e-05, + 6.114981232485661e-08, + 4.876913095586133e-08, + 4.772548578557689e-08, + 4.673227849139039e-08 + ], + "gamma_dfa": 0.047515806669252925, + "acc_eval": 0.10546875, + "loss_eval": 9.88414478302002, + "epoch": 26 + }, + { + "hidden_norms": [ + 40155.01953125, + 37508168.0, + 29749186.0, + 34078604.0, + 16502834.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.168245813067188e-08, + 7.775868282600129e-10, + 7.702881665849759e-10, + 7.661091205868331e-10, + 7.637669940940839e-10 + ], + "bp_grad_norms_F": [ + 1.3017543096793815e-05, + 5.765622645981239e-08, + 4.5165805317992636e-08, + 4.418279431206429e-08, + 4.329486813503536e-08 + ], + "gamma_dfa": 0.047424486168893054, + "acc_eval": 0.1064453125, + "loss_eval": 10.275530815124512, + "epoch": 27 + }, + { + "hidden_norms": [ + 41438.58203125, + 41153480.0, + 32568028.0, + 37348624.0, + 18107524.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.174999521770587e-08, + 7.312160876793428e-10, + 7.228238008138987e-10, + 7.196194196090744e-10, + 7.171208626921555e-10 + ], + "bp_grad_norms_F": [ + 1.2991866242373362e-05, + 5.5619945982243735e-08, + 4.266198772029384e-08, + 4.1693596131153754e-08, + 4.083043592117974e-08 + ], + "gamma_dfa": 0.04726689399103634, + "acc_eval": 0.10546875, + "loss_eval": 10.532907485961914, + "epoch": 28 + }, + { + "hidden_norms": [ + 42610.61328125, + 44767372.0, + 35250536.0, + 40433388.0, + 19648566.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.25098211976183e-08, + 6.862435619758855e-10, + 6.773137606330693e-10, + 6.743952063459346e-10, + 6.720446421581983e-10 + ], + "bp_grad_norms_F": [ + 1.2943252841068897e-05, + 5.273594538834914e-08, + 4.00670607803022e-08, + 3.916983715157585e-08, + 3.8364525778433745e-08 + ], + "gamma_dfa": 0.04717689534300007, + "acc_eval": 0.10546875, + "loss_eval": 10.889819145202637, + "epoch": 29 + }, + { + "hidden_norms": [ + 43802.12109375, + 48777580.0, + 38250948.0, + 43905160.0, + 21394392.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.3824673424715e-08, + 6.459773826961168e-10, + 6.385393880314894e-10, + 6.341404623633196e-10, + 6.317291689761362e-10 + ], + "bp_grad_norms_F": [ + 1.2702556887234095e-05, + 4.966772237935402e-08, + 3.767947376331904e-08, + 3.682788829451056e-08, + 3.60615324268565e-08 + ], + "gamma_dfa": 0.04775475192582235, + "acc_eval": 0.10546875, + "loss_eval": 11.143190383911133, + "epoch": 30 + }, + { + "hidden_norms": [ + 44971.96484375, + 53001532.0, + 41286860.0, + 47327540.0, + 23064180.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.44017193912805e-08, + 6.083171188997483e-10, + 6.001447672154825e-10, + 5.973078143206578e-10, + 5.949598036458781e-10 + ], + "bp_grad_norms_F": [ + 1.2565969882416539e-05, + 4.7034244943233716e-08, + 3.557239125484557e-08, + 3.4768806500551364e-08, + 3.403641457566664e-08 + ], + "gamma_dfa": 0.04808254592353478, + "acc_eval": 0.10546875, + "loss_eval": 11.375898361206055, + "epoch": 31 + }, + { + "hidden_norms": [ + 46135.65234375, + 57315672.0, + 44360792.0, + 51011808.0, + 24900550.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.566909315277371e-08, + 5.749250520103999e-10, + 5.675590553089194e-10, + 5.655514945246409e-10, + 5.63264157538157e-10 + ], + "bp_grad_norms_F": [ + 1.2200253877381328e-05, + 4.4094601747701745e-08, + 3.3572575830476126e-08, + 3.2811797723297786e-08, + 3.210490717719949e-08 + ], + "gamma_dfa": 0.04755272905458696, + "acc_eval": 0.1064453125, + "loss_eval": 11.584449768066406, + "epoch": 32 + }, + { + "hidden_norms": [ + 47265.27734375, + 61919976.0, + 47722620.0, + 54844944.0, + 26929922.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.478352953034118e-08, + 5.391301294288553e-10, + 5.344974463028507e-10, + 5.308364858791492e-10, + 5.291052596057e-10 + ], + "bp_grad_norms_F": [ + 1.2009260899503715e-05, + 4.1767787450908145e-08, + 3.1745546635875144e-08, + 3.102580947711431e-08, + 3.037316531617762e-08 + ], + "gamma_dfa": 0.0475847675697878, + "acc_eval": 0.10546875, + "loss_eval": 11.923343658447266, + "epoch": 33 + }, + { + "hidden_norms": [ + 48342.62109375, + 66327300.0, + 51030320.0, + 58382808.0, + 28803830.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.630867398551345e-08, + 5.130093017058357e-10, + 5.057400054298e-10, + 5.023059190811807e-10, + 5.003696346150832e-10 + ], + "bp_grad_norms_F": [ + 1.1836677003884688e-05, + 3.972920481487563e-08, + 3.016906902075789e-08, + 2.9483924635087533e-08, + 2.8860545953079964e-08 + ], + "gamma_dfa": 0.04806397232459858, + "acc_eval": 0.10546875, + "loss_eval": 12.134788513183594, + "epoch": 34 + }, + { + "hidden_norms": [ + 49438.7734375, + 70923576.0, + 54371588.0, + 62839076.0, + 30745350.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.529716666316745e-08, + 4.881638981935055e-10, + 4.826159472059999e-10, + 4.801878894511447e-10, + 4.785546958707698e-10 + ], + "bp_grad_norms_F": [ + 1.1614155482675415e-05, + 3.7715466305598966e-08, + 2.8843189170402184e-08, + 2.8193024803613298e-08, + 2.7588850315396485e-08 + ], + "gamma_dfa": 0.047784373455215245, + "acc_eval": 0.10546875, + "loss_eval": 12.365730285644531, + "epoch": 35 + }, + { + "hidden_norms": [ + 50484.30859375, + 75708880.0, + 57946872.0, + 66924284.0, + 32685426.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.612364865712152e-08, + 4.650996809907326e-10, + 4.5824133376726195e-10, + 4.5511036605994093e-10, + 4.534528585953268e-10 + ], + "bp_grad_norms_F": [ + 1.1689081475196872e-05, + 3.617047283910324e-08, + 2.7491989129657668e-08, + 2.6862345237077534e-08, + 2.6283149878736367e-08 + ], + "gamma_dfa": 0.04781174083473161, + "acc_eval": 0.10546875, + "loss_eval": 12.582022666931152, + "epoch": 36 + }, + { + "hidden_norms": [ + 51533.140625, + 80717000.0, + 61608756.0, + 71031448.0, + 34583536.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.646285465374604e-08, + 4.4203954385757527e-10, + 4.369871131615355e-10, + 4.329318292750628e-10, + 4.319989088674703e-10 + ], + "bp_grad_norms_F": [ + 1.1521507985889912e-05, + 3.4413087490747785e-08, + 2.619959005301098e-08, + 2.5601275766007348e-08, + 2.505496254912032e-08 + ], + "gamma_dfa": 0.04798329665209167, + "acc_eval": 0.10546875, + "loss_eval": 12.857856750488281, + "epoch": 37 + }, + { + "hidden_norms": [ + 52583.0859375, + 85961416.0, + 65257552.0, + 74859152.0, + 36629052.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.666147977010041e-08, + 4.2343398232169704e-10, + 4.1782510784571514e-10, + 4.1457998145588704e-10, + 4.136685161082454e-10 + ], + "bp_grad_norms_F": [ + 1.1553073818504345e-05, + 3.306437434957843e-08, + 2.515412056425248e-08, + 2.4584762670087912e-08, + 2.405546162265182e-08 + ], + "gamma_dfa": 0.04809549875790253, + "acc_eval": 0.10546875, + "loss_eval": 13.005304336547852, + "epoch": 38 + }, + { + "hidden_norms": [ + 53574.21875, + 91233752.0, + 68912136.0, + 78801432.0, + 38771888.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.665335116120332e-08, + 4.0339676043998907e-10, + 4.0027073322512763e-10, + 3.982228713450553e-10, + 3.9690134512326836e-10 + ], + "bp_grad_norms_F": [ + 1.1503744644869585e-05, + 3.151562921743789e-08, + 2.405471910549295e-08, + 2.3515880798186117e-08, + 2.3014273153876275e-08 + ], + "gamma_dfa": 0.04791133257094771, + "acc_eval": 0.10546875, + "loss_eval": 13.310943603515625, + "epoch": 39 + }, + { + "hidden_norms": [ + 54515.76953125, + 96143688.0, + 72537432.0, + 83291584.0, + 40846320.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.742490109625578e-08, + 3.8639558219699666e-10, + 3.8376418709518134e-10, + 3.813957205611729e-10, + 3.8053543649496646e-10 + ], + "bp_grad_norms_F": [ + 1.1331952919135801e-05, + 3.0162087938379045e-08, + 2.3133726045898584e-08, + 2.2621049922122438e-08, + 2.2133153976255926e-08 + ], + "gamma_dfa": 0.0483476699446328, + "acc_eval": 0.10546875, + "loss_eval": 13.509955406188965, + "epoch": 40 + }, + { + "hidden_norms": [ + 55471.92578125, + 101352504.0, + 76262640.0, + 87893288.0, + 43005752.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.776105886454388e-08, + 3.722072094980433e-10, + 3.6970662642410446e-10, + 3.67776836762701e-10, + 3.6656577773186427e-10 + ], + "bp_grad_norms_F": [ + 1.1259300663368776e-05, + 2.921965247537628e-08, + 2.22886100686992e-08, + 2.178610181147178e-08, + 2.1311375775212582e-08 + ], + "gamma_dfa": 0.04882028384599835, + "acc_eval": 0.10546875, + "loss_eval": 13.669061660766602, + "epoch": 41 + }, + { + "hidden_norms": [ + 56406.1796875, + 106503480.0, + 80309328.0, + 92335120.0, + 45272116.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.741802304257362e-08, + 3.5817968035978254e-10, + 3.546553328792612e-10, + 3.5286135124934503e-10, + 3.517087177051792e-10 + ], + "bp_grad_norms_F": [ + 1.1156203981954604e-05, + 2.829144030158659e-08, + 2.1501875835383544e-08, + 2.1014004758512783e-08, + 2.056106396253199e-08 + ], + "gamma_dfa": 0.04876198567217216, + "acc_eval": 0.10546875, + "loss_eval": 13.882933616638184, + "epoch": 42 + }, + { + "hidden_norms": [ + 57307.2421875, + 111696136.0, + 84071088.0, + 96859240.0, + 47347232.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.675155527271272e-08, + 3.451815777655298e-10, + 3.4170632989827254e-10, + 3.399925063707343e-10, + 3.38884892370217e-10 + ], + "bp_grad_norms_F": [ + 1.105228056985652e-05, + 2.731184522986041e-08, + 2.0790139387827367e-08, + 2.0321502702813632e-08, + 1.9881698065660203e-08 + ], + "gamma_dfa": 0.04874728451250121, + "acc_eval": 0.10546875, + "loss_eval": 14.110960960388184, + "epoch": 43 + }, + { + "hidden_norms": [ + 58201.1015625, + 116915912.0, + 88056232.0, + 101457736.0, + 49574372.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.81610304759306e-08, + 3.3262503862374615e-10, + 3.28719912401354e-10, + 3.270855530868033e-10, + 3.2694977281089166e-10 + ], + "bp_grad_norms_F": [ + 1.09774755401304e-05, + 2.6502128491756594e-08, + 2.010280297781719e-08, + 1.964214924043972e-08, + 1.9215420365981117e-08 + ], + "gamma_dfa": 0.049133426626212895, + "acc_eval": 0.10546875, + "loss_eval": 14.251358985900879, + "epoch": 44 + }, + { + "hidden_norms": [ + 59057.046875, + 122526296.0, + 92035232.0, + 106073072.0, + 51524732.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.615387514510076e-08, + 3.1993208082781166e-10, + 3.1755734153371407e-10, + 3.1527228050443057e-10, + 3.1427349611590216e-10 + ], + "bp_grad_norms_F": [ + 1.0898848813667428e-05, + 2.5704085970801316e-08, + 1.941714167230657e-08, + 1.896907697584993e-08, + 1.8563016013217748e-08 + ], + "gamma_dfa": 0.04926633776631206, + "acc_eval": 0.10546875, + "loss_eval": 14.543952941894531, + "epoch": 45 + }, + { + "hidden_norms": [ + 59915.00390625, + 128059208.0, + 95767408.0, + 110314168.0, + 53699800.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.616160585006583e-08, + 3.10205972020583e-10, + 3.0786348470535074e-10, + 3.0548555352005735e-10, + 3.044886287550952e-10 + ], + "bp_grad_norms_F": [ + 1.0854326319531538e-05, + 2.4907375717475588e-08, + 1.8864984241417915e-08, + 1.8437393833892202e-08, + 1.8046192096221603e-08 + ], + "gamma_dfa": 0.04898433407652192, + "acc_eval": 0.10546875, + "loss_eval": 14.763640403747559, + "epoch": 46 + }, + { + "hidden_norms": [ + 60732.77734375, + 133044840.0, + 99449000.0, + 114745104.0, + 55794780.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.66734808369074e-08, + 3.0199040490508366e-10, + 2.984798519456433e-10, + 2.9689897762530393e-10, + 2.9609348306536276e-10 + ], + "bp_grad_norms_F": [ + 1.0869742254726589e-05, + 2.4187817970755532e-08, + 1.8320044148367742e-08, + 1.79040302583644e-08, + 1.7519981909686067e-08 + ], + "gamma_dfa": 0.049695645982865244, + "acc_eval": 0.10546875, + "loss_eval": 14.853147506713867, + "epoch": 47 + }, + { + "hidden_norms": [ + 61537.2265625, + 138238256.0, + 103294888.0, + 119079736.0, + 57875032.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.672164852896458e-08, + 2.937747545228575e-10, + 2.90239082767485e-10, + 2.8853816558260803e-10, + 2.880042870856414e-10 + ], + "bp_grad_norms_F": [ + 1.0855384971364401e-05, + 2.3642215296604263e-08, + 1.78662986627387e-08, + 1.745818423160017e-08, + 1.7085612924461202e-08 + ], + "gamma_dfa": 0.04945674288319424, + "acc_eval": 0.10546875, + "loss_eval": 15.014139175415039, + "epoch": 48 + }, + { + "hidden_norms": [ + 62318.859375, + 143781376.0, + 107295080.0, + 123266280.0, + 60009076.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.63586393506921e-08, + 2.853322023099736e-10, + 2.819139366394552e-10, + 2.8051430622788587e-10, + 2.796505249591519e-10 + ], + "bp_grad_norms_F": [ + 1.0763029422378168e-05, + 2.2983703829027036e-08, + 1.7385014317028435e-08, + 1.699019236411914e-08, + 1.662707127536578e-08 + ], + "gamma_dfa": 0.04949341545579955, + "acc_eval": 0.10546875, + "loss_eval": 15.234472274780273, + "epoch": 49 + }, + { + "hidden_norms": [ + 63084.12109375, + 148953776.0, + 111167488.0, + 127493184.0, + 62116584.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.690788888543466e-08, + 2.77830092265674e-10, + 2.7401189650611e-10, + 2.7265251167918336e-10, + 2.71903860538103e-10 + ], + "bp_grad_norms_F": [ + 1.0762613783299457e-05, + 2.2435919788676983e-08, + 1.6915544520657022e-08, + 1.65265419127536e-08, + 1.6172732486552377e-08 + ], + "gamma_dfa": 0.04998577304650098, + "acc_eval": 0.10546875, + "loss_eval": 15.356475830078125, + "epoch": 50 + }, + { + "hidden_norms": [ + 63822.42578125, + 153887120.0, + 114903200.0, + 131868160.0, + 64092768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.741512402821172e-08, + 2.695783041239963e-10, + 2.676055765871155e-10, + 2.6572444244976623e-10, + 2.649161723322635e-10 + ], + "bp_grad_norms_F": [ + 1.07648411358241e-05, + 2.1865258048592295e-08, + 1.6514658085498013e-08, + 1.6137914116143293e-08, + 1.5790037721785666e-08 + ], + "gamma_dfa": 0.050343112263362855, + "acc_eval": 0.10546875, + "loss_eval": 15.516284942626953, + "epoch": 51 + }, + { + "hidden_norms": [ + 64467.453125, + 158904000.0, + 118881072.0, + 136114000.0, + 66111872.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.664627415555515e-08, + 2.624416239882521e-10, + 2.6058996627220665e-10, + 2.5911758849694877e-10, + 2.584663871818549e-10 + ], + "bp_grad_norms_F": [ + 1.0719203601183835e-05, + 2.1336076017064443e-08, + 1.6169177996516737e-08, + 1.5802571695644474e-08, + 1.546756678294514e-08 + ], + "gamma_dfa": 0.04984566644998267, + "acc_eval": 0.10546875, + "loss_eval": 15.6607084274292, + "epoch": 52 + }, + { + "hidden_norms": [ + 65120.73828125, + 163883856.0, + 122702472.0, + 140198928.0, + 68242560.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.641593041147644e-08, + 2.5804472447710225e-10, + 2.5353724675269973e-10, + 2.5259389024867573e-10, + 2.520264275052142e-10 + ], + "bp_grad_norms_F": [ + 1.0724111234594602e-05, + 2.0917026333222566e-08, + 1.5751618676063117e-08, + 1.5394757468811804e-08, + 1.5069018033386783e-08 + ], + "gamma_dfa": 0.05030635162256658, + "acc_eval": 0.10546875, + "loss_eval": 15.901081085205078, + "epoch": 53 + }, + { + "hidden_norms": [ + 65754.40625, + 168991232.0, + 126758528.0, + 144376592.0, + 70329568.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.677351104324771e-08, + 2.5239485501593606e-10, + 2.4832783052097795e-10, + 2.4752053184862177e-10, + 2.4696938938362223e-10 + ], + "bp_grad_norms_F": [ + 1.0669472430890892e-05, + 2.0359754770993277e-08, + 1.542808725218947e-08, + 1.5080953374990713e-08, + 1.4761029731857889e-08 + ], + "gamma_dfa": 0.05062760764849372, + "acc_eval": 0.10546875, + "loss_eval": 16.04940414428711, + "epoch": 54 + }, + { + "hidden_norms": [ + 66360.1953125, + 173885088.0, + 130550672.0, + 148377456.0, + 72298680.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.759133862668023e-08, + 2.4686536148621485e-10, + 2.4284077526637304e-10, + 2.4196153414202115e-10, + 2.414988486965086e-10 + ], + "bp_grad_norms_F": [ + 1.0671456038835458e-05, + 1.9936877038162493e-08, + 1.5118750695819472e-08, + 1.4775524803667395e-08, + 1.4458762187530283e-08 + ], + "gamma_dfa": 0.050650376273551956, + "acc_eval": 0.10546875, + "loss_eval": 16.173294067382812, + "epoch": 55 + }, + { + "hidden_norms": [ + 66955.3671875, + 179032416.0, + 134152312.0, + 152335472.0, + 74150016.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.732155265533947e-08, + 2.4187768454808634e-10, + 2.378792995916257e-10, + 2.3684243455335263e-10, + 2.3630350454162397e-10 + ], + "bp_grad_norms_F": [ + 1.0680658306227997e-05, + 1.9686593688561516e-08, + 1.484478495683561e-08, + 1.4507179457723396e-08, + 1.4196978703751029e-08 + ], + "gamma_dfa": 0.05082969422801398, + "acc_eval": 0.10546875, + "loss_eval": 16.27086639404297, + "epoch": 56 + }, + { + "hidden_norms": [ + 67549.515625, + 183555840.0, + 137880064.0, + 156240624.0, + 75989536.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.660003913973924e-08, + 2.357370687544602e-10, + 2.33779245961685e-10, + 2.3301963136823645e-10, + 2.3250262826124413e-10 + ], + "bp_grad_norms_F": [ + 1.0663774446584284e-05, + 1.9352745184164633e-08, + 1.4566153616613065e-08, + 1.423444206949398e-08, + 1.3932280218398319e-08 + ], + "gamma_dfa": 0.05084921311936341, + "acc_eval": 0.10546875, + "loss_eval": 16.451187133789062, + "epoch": 57 + }, + { + "hidden_norms": [ + 68104.8046875, + 188812128.0, + 141342304.0, + 160268688.0, + 77916768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.660642691893372e-08, + 2.327093101550659e-10, + 2.2930106424734475e-10, + 2.2855875525529257e-10, + 2.2804760857475515e-10 + ], + "bp_grad_norms_F": [ + 1.0613769518386107e-05, + 1.899090662504932e-08, + 1.4301366313418384e-08, + 1.3975586021786057e-08, + 1.3677930787991954e-08 + ], + "gamma_dfa": 0.05096889057313092, + "acc_eval": 0.10546875, + "loss_eval": 16.63678741455078, + "epoch": 58 + }, + { + "hidden_norms": [ + 68657.515625, + 193258416.0, + 144614160.0, + 164019216.0, + 79742168.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.68742304760417e-08, + 2.289267664323802e-10, + 2.2474513916570515e-10, + 2.2393865928282963e-10, + 2.2451285275337796e-10 + ], + "bp_grad_norms_F": [ + 1.0620946341077797e-05, + 1.866202836708908e-08, + 1.4068830544999855e-08, + 1.3749051674949442e-08, + 1.3455515812665908e-08 + ], + "gamma_dfa": 0.05113464401802048, + "acc_eval": 0.10546875, + "loss_eval": 16.70541763305664, + "epoch": 59 + }, + { + "hidden_norms": [ + 69158.5, + 197991056.0, + 148074896.0, + 168001296.0, + 81613432.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.685481134307338e-08, + 2.244555652453073e-10, + 2.21766327523909e-10, + 2.2105835217889336e-10, + 2.2056727277952604e-10 + ], + "bp_grad_norms_F": [ + 1.0557047062320635e-05, + 1.836115792741566e-08, + 1.3819986932617212e-08, + 1.35067770301589e-08, + 1.3220035732786073e-08 + ], + "gamma_dfa": 0.05133810767438263, + "acc_eval": 0.10546875, + "loss_eval": 16.83820915222168, + "epoch": 60 + }, + { + "hidden_norms": [ + 69652.15625, + 202764272.0, + 151440416.0, + 171388720.0, + 83290960.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.682473406906865e-08, + 2.209017690990578e-10, + 2.178418834208884e-10, + 2.1715784725984122e-10, + 2.166662266267494e-10 + ], + "bp_grad_norms_F": [ + 1.0563057912804652e-05, + 1.8060584139334424e-08, + 1.3589187553009197e-08, + 1.3282591027063972e-08, + 1.300101715173696e-08 + ], + "gamma_dfa": 0.051503602182492614, + "acc_eval": 0.10546875, + "loss_eval": 16.996952056884766, + "epoch": 61 + }, + { + "hidden_norms": [ + 70119.3046875, + 207371568.0, + 154513392.0, + 174693904.0, + 84899272.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.754268776556273e-08, + 2.177768798627966e-10, + 2.1394505611560533e-10, + 2.1310755937697934e-10, + 2.1278181994155432e-10 + ], + "bp_grad_norms_F": [ + 1.0583677067188546e-05, + 1.7867773038915402e-08, + 1.3404712007059061e-08, + 1.3099571205543725e-08, + 1.281919193019121e-08 + ], + "gamma_dfa": 0.05178222866379656, + "acc_eval": 0.10546875, + "loss_eval": 17.03223419189453, + "epoch": 62 + }, + { + "hidden_norms": [ + 70571.765625, + 211695824.0, + 157515872.0, + 178129360.0, + 86545024.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.717323396467691e-08, + 2.1452814524813846e-10, + 2.1192504695566328e-10, + 2.1126832228102188e-10, + 2.1079131495849168e-10 + ], + "bp_grad_norms_F": [ + 1.0588292752800044e-05, + 1.7631437643217396e-08, + 1.3229322526342457e-08, + 1.2929083581525447e-08, + 1.2654436609693676e-08 + ], + "gamma_dfa": 0.0517645905201789, + "acc_eval": 0.10546875, + "loss_eval": 17.17680549621582, + "epoch": 63 + }, + { + "hidden_norms": [ + 71016.2734375, + 216131392.0, + 160371248.0, + 181552016.0, + 88083200.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.714041399571215e-08, + 2.1204836497812352e-10, + 2.0845919435075189e-10, + 2.0772163156212997e-10, + 2.0731850958188858e-10 + ], + "bp_grad_norms_F": [ + 1.0558523172221612e-05, + 1.7396088125565257e-08, + 1.3074124005640897e-08, + 1.2776619762178143e-08, + 1.2503839741384581e-08 + ], + "gamma_dfa": 0.05190763485734351, + "acc_eval": 0.10546875, + "loss_eval": 17.230438232421875, + "epoch": 64 + }, + { + "hidden_norms": [ + 71423.875, + 220276432.0, + 163188992.0, + 184901952.0, + 89669880.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.695663922253516e-08, + 2.089625000811779e-10, + 2.0665336109004784e-10, + 2.060027565198297e-10, + 2.0553812818402406e-10 + ], + "bp_grad_norms_F": [ + 1.054474341799505e-05, + 1.720214015676902e-08, + 1.2905923441053346e-08, + 1.2612286326429967e-08, + 1.2343328137376375e-08 + ], + "gamma_dfa": 0.0516790475230664, + "acc_eval": 0.10546875, + "loss_eval": 17.364524841308594, + "epoch": 65 + }, + { + "hidden_norms": [ + 71819.7265625, + 224240896.0, + 165905760.0, + 188025680.0, + 91055744.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.707031184940206e-08, + 2.0619655982656582e-10, + 2.0404426759323968e-10, + 2.0340489015335805e-10, + 2.0294699254463922e-10 + ], + "bp_grad_norms_F": [ + 1.0510210813663434e-05, + 1.6987915074651028e-08, + 1.2752495948120668e-08, + 1.2462213483388496e-08, + 1.2196251120144552e-08 + ], + "gamma_dfa": 0.05187035645940341, + "acc_eval": 0.10546875, + "loss_eval": 17.464691162109375, + "epoch": 66 + }, + { + "hidden_norms": [ + 72184.1796875, + 228069632.0, + 168371744.0, + 190844528.0, + 92434920.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.708528298484453e-08, + 2.0398974176494278e-10, + 2.0165806524641283e-10, + 2.0102944309208226e-10, + 2.0057676353157916e-10 + ], + "bp_grad_norms_F": [ + 1.0452381502545904e-05, + 1.678668404281325e-08, + 1.2599208787378302e-08, + 1.2311685892996138e-08, + 1.2049306441497265e-08 + ], + "gamma_dfa": 0.052035300293937325, + "acc_eval": 0.10546875, + "loss_eval": 17.54598045349121, + "epoch": 67 + }, + { + "hidden_norms": [ + 72520.546875, + 231382032.0, + 170794656.0, + 193581264.0, + 93730880.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.673346485466027e-08, + 2.0163908043269174e-10, + 1.9945969875756475e-10, + 1.988337966496445e-10, + 1.983077452250015e-10 + ], + "bp_grad_norms_F": [ + 1.041769064613618e-05, + 1.6600257168875032e-08, + 1.2470060539726546e-08, + 1.218627776466974e-08, + 1.1927684617774048e-08 + ], + "gamma_dfa": 0.052122256805887446, + "acc_eval": 0.10546875, + "loss_eval": 17.622678756713867, + "epoch": 68 + }, + { + "hidden_norms": [ + 72848.296875, + 234345168.0, + 172920208.0, + 196159376.0, + 94861664.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.68633378559025e-08, + 1.9926535421710412e-10, + 1.9748097601635095e-10, + 1.9686471897095714e-10, + 1.9632170888961298e-10 + ], + "bp_grad_norms_F": [ + 1.0410145478090271e-05, + 1.6476832342959824e-08, + 1.2349259392863132e-08, + 1.2067844501473246e-08, + 1.1810766586961563e-08 + ], + "gamma_dfa": 0.05221144680399448, + "acc_eval": 0.10546875, + "loss_eval": 17.67215347290039, + "epoch": 69 + }, + { + "hidden_norms": [ + 73156.28125, + 237693904.0, + 175292576.0, + 198663152.0, + 96070024.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.698025766307182e-08, + 1.9732028511132427e-10, + 1.9561376130017294e-10, + 1.950042072262903e-10, + 1.9452565946931344e-10 + ], + "bp_grad_norms_F": [ + 1.0408021807961632e-05, + 1.6299335214853272e-08, + 1.224471191108023e-08, + 1.1966841739763368e-08, + 1.1711744463127616e-08 + ], + "gamma_dfa": 0.05207514451467432, + "acc_eval": 0.10546875, + "loss_eval": 17.708881378173828, + "epoch": 70 + }, + { + "hidden_norms": [ + 73450.0390625, + 240668752.0, + 177333776.0, + 200832576.0, + 97232808.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.750691904424457e-08, + 1.9538150264342136e-10, + 1.937518478989375e-10, + 1.9322175803804242e-10, + 1.9261021944050327e-10 + ], + "bp_grad_norms_F": [ + 1.0387684596935287e-05, + 1.614511546677022e-08, + 1.2127667758932148e-08, + 1.1853135362116518e-08, + 1.1600380211973516e-08 + ], + "gamma_dfa": 0.052143561391858384, + "acc_eval": 0.10546875, + "loss_eval": 17.803735733032227, + "epoch": 71 + }, + { + "hidden_norms": [ + 73722.7890625, + 243140912.0, + 179223280.0, + 203119056.0, + 98179728.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.777691107297869e-08, + 1.936056454043822e-10, + 1.921051789866013e-10, + 1.9142704088537243e-10, + 1.908224411817372e-10 + ], + "bp_grad_norms_F": [ + 1.0383127118984703e-05, + 1.6032700500545616e-08, + 1.2034083063383605e-08, + 1.1761529528087067e-08, + 1.1511005482134351e-08 + ], + "gamma_dfa": 0.0522310700325761, + "acc_eval": 0.10546875, + "loss_eval": 17.871017456054688, + "epoch": 72 + }, + { + "hidden_norms": [ + 73977.796875, + 245601744.0, + 181134272.0, + 205298592.0, + 99248704.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.645526605732812e-08, + 1.9214441149273398e-10, + 1.908457003541031e-10, + 1.8958104530675257e-10, + 1.891580642121582e-10 + ], + "bp_grad_norms_F": [ + 1.0368045877839904e-05, + 1.593527443333187e-08, + 1.1956020173897741e-08, + 1.1683961353980976e-08, + 1.1433988866826894e-08 + ], + "gamma_dfa": 0.05229719865019433, + "acc_eval": 0.10546875, + "loss_eval": 17.842838287353516, + "epoch": 73 + }, + { + "hidden_norms": [ + 74210.2890625, + 248047296.0, + 183004848.0, + 207310784.0, + 100283200.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.702664189286224e-08, + 1.9067503131964259e-10, + 1.8910681354178394e-10, + 1.886194395117613e-10, + 1.8805811075051082e-10 + ], + "bp_grad_norms_F": [ + 1.0340887456550263e-05, + 1.5766524086302525e-08, + 1.1852850256843794e-08, + 1.1584752712678892e-08, + 1.1337309757664116e-08 + ], + "gamma_dfa": 0.05227879187441431, + "acc_eval": 0.10546875, + "loss_eval": 17.977331161499023, + "epoch": 74 + }, + { + "hidden_norms": [ + 74442.2578125, + 250302768.0, + 184669344.0, + 209343920.0, + 101168016.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.73824319569394e-08, + 1.8929384448806985e-10, + 1.8772923493504123e-10, + 1.8724671813075133e-10, + 1.8670247292629227e-10 + ], + "bp_grad_norms_F": [ + 1.0353242942073848e-05, + 1.5672505071506748e-08, + 1.1772779195950989e-08, + 1.1506068098299238e-08, + 1.1260493870679511e-08 + ], + "gamma_dfa": 0.05237349838716909, + "acc_eval": 0.10546875, + "loss_eval": 18.03546905517578, + "epoch": 75 + }, + { + "hidden_norms": [ + 74647.3203125, + 252406032.0, + 186061376.0, + 211037200.0, + 101960680.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.6925361131307e-08, + 1.881417382998407e-10, + 1.867033888602876e-10, + 1.8579758565007154e-10, + 1.8538144630486642e-10 + ], + "bp_grad_norms_F": [ + 1.0341693268856034e-05, + 1.5606824277369924e-08, + 1.1714643477489517e-08, + 1.1449987624700952e-08, + 1.1205665728653003e-08 + ], + "gamma_dfa": 0.05233656561176758, + "acc_eval": 0.10546875, + "loss_eval": 18.052072525024414, + "epoch": 76 + }, + { + "hidden_norms": [ + 74842.0859375, + 254511632.0, + 187492928.0, + 212704224.0, + 102757816.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.698394537987042e-08, + 1.8709332694211156e-10, + 1.8572142435058225e-10, + 1.8484298813792321e-10, + 1.8442962435027965e-10 + ], + "bp_grad_norms_F": [ + 1.0342246241634712e-05, + 1.552284167871676e-08, + 1.1652745435242196e-08, + 1.1389352572166445e-08, + 1.114572434346428e-08 + ], + "gamma_dfa": 0.05241188171203248, + "acc_eval": 0.10546875, + "loss_eval": 18.086322784423828, + "epoch": 77 + }, + { + "hidden_norms": [ + 75024.015625, + 256539408.0, + 188878192.0, + 214226816.0, + 103471288.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.701635323404844e-08, + 1.8604462415083844e-10, + 1.84622400700718e-10, + 1.8390608480522985e-10, + 1.834675189549273e-10 + ], + "bp_grad_norms_F": [ + 1.032539876177907e-05, + 1.5453247570462736e-08, + 1.1593147775101897e-08, + 1.133172844447472e-08, + 1.1090729223894868e-08 + ], + "gamma_dfa": 0.05239276264910586, + "acc_eval": 0.10546875, + "loss_eval": 18.168014526367188, + "epoch": 78 + }, + { + "hidden_norms": [ + 75180.9609375, + 258451104.0, + 190004976.0, + 215740128.0, + 104133768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.704767395784074e-08, + 1.8524454192814233e-10, + 1.8379993360628788e-10, + 1.8304618931708205e-10, + 1.8256345046818723e-10 + ], + "bp_grad_norms_F": [ + 1.0337872481613886e-05, + 1.5379262308101715e-08, + 1.1539456501452605e-08, + 1.127898041630715e-08, + 1.103767743870776e-08 + ], + "gamma_dfa": 0.052515600953483954, + "acc_eval": 0.10546875, + "loss_eval": 18.164344787597656, + "epoch": 79 + }, + { + "hidden_norms": [ + 75327.796875, + 260127200.0, + 191027072.0, + 216985472.0, + 104684240.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.744654422798703e-08, + 1.8438454929547987e-10, + 1.8290086112315862e-10, + 1.8214722785625526e-10, + 1.8167076176744956e-10 + ], + "bp_grad_norms_F": [ + 1.032766067510238e-05, + 1.5304989275932712e-08, + 1.14842633180956e-08, + 1.122501380734775e-08, + 1.098510349351045e-08 + ], + "gamma_dfa": 0.05257981286558788, + "acc_eval": 0.10546875, + "loss_eval": 18.223249435424805, + "epoch": 80 + }, + { + "hidden_norms": [ + 75454.5703125, + 261646176.0, + 192111600.0, + 218110816.0, + 105216432.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.775589321885491e-08, + 1.8362063258781092e-10, + 1.8213851260551195e-10, + 1.8139376112280559e-10, + 1.809180305567537e-10 + ], + "bp_grad_norms_F": [ + 1.032176169246668e-05, + 1.5236809147722852e-08, + 1.1438899605309416e-08, + 1.1181004566651609e-08, + 1.0941747952131209e-08 + ], + "gamma_dfa": 0.052668574411654845, + "acc_eval": 0.10546875, + "loss_eval": 18.2590389251709, + "epoch": 81 + }, + { + "hidden_norms": [ + 75578.140625, + 263041184.0, + 193033856.0, + 219211776.0, + 105729752.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.755376512681323e-08, + 1.830409435132907e-10, + 1.8150429770269483e-10, + 1.807565902511854e-10, + 1.8044568617092693e-10 + ], + "bp_grad_norms_F": [ + 1.0324319191568065e-05, + 1.5187332280675037e-08, + 1.1401711574876572e-08, + 1.1144490663639317e-08, + 1.0905955249995714e-08 + ], + "gamma_dfa": 0.05269488821795676, + "acc_eval": 0.10546875, + "loss_eval": 18.284685134887695, + "epoch": 82 + }, + { + "hidden_norms": [ + 75686.9765625, + 264364192.0, + 193939856.0, + 220289456.0, + 106222280.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.723260691567702e-08, + 1.8233220488994561e-10, + 1.808086180776769e-10, + 1.8018871117408963e-10, + 1.7971832355634376e-10 + ], + "bp_grad_norms_F": [ + 1.0300875146640465e-05, + 1.5149137055914252e-08, + 1.1367639274340036e-08, + 1.1110781628076438e-08, + 1.0873751676854226e-08 + ], + "gamma_dfa": 0.05262827526894398, + "acc_eval": 0.10546875, + "loss_eval": 18.32525634765625, + "epoch": 83 + }, + { + "hidden_norms": [ + 75782.5703125, + 265506368.0, + 194623696.0, + 221062096.0, + 106625800.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.738180667933193e-08, + 1.8182351457785018e-10, + 1.8023170456071824e-10, + 1.796851972768465e-10, + 1.7919579708980393e-10 + ], + "bp_grad_norms_F": [ + 1.0303671842848416e-05, + 1.510927916115179e-08, + 1.133329874392075e-08, + 1.107721647741755e-08, + 1.0840857100902213e-08 + ], + "gamma_dfa": 0.0526832842733711, + "acc_eval": 0.10546875, + "loss_eval": 18.358993530273438, + "epoch": 84 + }, + { + "hidden_norms": [ + 75869.921875, + 266527792.0, + 195260000.0, + 221772592.0, + 107003056.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.824529373896439e-08, + 1.8133940182796238e-10, + 1.7974224886252443e-10, + 1.7921185369029757e-10, + 1.7870449564583168e-10 + ], + "bp_grad_norms_F": [ + 1.0309514436812606e-05, + 1.506138680440472e-08, + 1.129713478320582e-08, + 1.1042018854823255e-08, + 1.080576872425354e-08 + ], + "gamma_dfa": 0.052798322300077416, + "acc_eval": 0.10546875, + "loss_eval": 18.391273498535156, + "epoch": 85 + }, + { + "hidden_norms": [ + 75944.28125, + 267298400.0, + 195821152.0, + 222463360.0, + 107333864.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.755981895092191e-08, + 1.8102987164869688e-10, + 1.793504234015586e-10, + 1.788625914045383e-10, + 1.7835513621555776e-10 + ], + "bp_grad_norms_F": [ + 1.0287751138093881e-05, + 1.502210977832874e-08, + 1.1278022071792293e-08, + 1.1023718826663753e-08, + 1.0788149040763528e-08 + ], + "gamma_dfa": 0.05272912958753295, + "acc_eval": 0.10546875, + "loss_eval": 18.391714096069336, + "epoch": 86 + }, + { + "hidden_norms": [ + 76007.421875, + 268045776.0, + 196358640.0, + 223064400.0, + 107612040.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.762406622508934e-08, + 1.807102384399073e-10, + 1.7898976745200912e-10, + 1.785393638487065e-10, + 1.7802226359719953e-10 + ], + "bp_grad_norms_F": [ + 1.0287554687238298e-05, + 1.4994483876762388e-08, + 1.1257166754319314e-08, + 1.1003281841226453e-08, + 1.0768073543943046e-08 + ], + "gamma_dfa": 0.052773734016227536, + "acc_eval": 0.10546875, + "loss_eval": 18.410842895507812, + "epoch": 87 + }, + { + "hidden_norms": [ + 76064.7109375, + 268696256.0, + 196819616.0, + 223570480.0, + 107852768.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758166814004653e-08, + 1.8037309146290426e-10, + 1.7866680357414566e-10, + 1.782173991715652e-10, + 1.7768413129726213e-10 + ], + "bp_grad_norms_F": [ + 1.0283758456353098e-05, + 1.4970940043212977e-08, + 1.1237919927964413e-08, + 1.0984368081778939e-08, + 1.0749558576605978e-08 + ], + "gamma_dfa": 0.05277359033061657, + "acc_eval": 0.10546875, + "loss_eval": 18.423473358154297, + "epoch": 88 + }, + { + "hidden_norms": [ + 76113.765625, + 269233728.0, + 197204896.0, + 224016384.0, + 108068584.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.767738535198077e-08, + 1.800838783649894e-10, + 1.7838196197939027e-10, + 1.7793383433328813e-10, + 1.7738220614571532e-10 + ], + "bp_grad_norms_F": [ + 1.0285043572366703e-05, + 1.4949996796076448e-08, + 1.1221012563567001e-08, + 1.096789947752086e-08, + 1.0733534949736168e-08 + ], + "gamma_dfa": 0.05277923475659918, + "acc_eval": 0.10546875, + "loss_eval": 18.44818878173828, + "epoch": 89 + }, + { + "hidden_norms": [ + 76154.09375, + 269669792.0, + 197538960.0, + 224391824.0, + 108235960.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.767518266949992e-08, + 1.7989677802976445e-10, + 1.7819240527572333e-10, + 1.777451658080409e-10, + 1.771848640030882e-10 + ], + "bp_grad_norms_F": [ + 1.029091072268784e-05, + 1.4940461312562547e-08, + 1.1209391637123645e-08, + 1.0956426876873593e-08, + 1.0722061460910481e-08 + ], + "gamma_dfa": 0.05281960548018105, + "acc_eval": 0.10546875, + "loss_eval": 18.45142364501953, + "epoch": 90 + }, + { + "hidden_norms": [ + 76187.59375, + 270051616.0, + 197844384.0, + 224727824.0, + 108387672.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.763404224509941e-08, + 1.7972098809160286e-10, + 1.780089131653284e-10, + 1.7756210390906801e-10, + 1.7699951226912702e-10 + ], + "bp_grad_norms_F": [ + 1.0288421435689088e-05, + 1.4926607505572065e-08, + 1.1199507987669222e-08, + 1.0946849648973966e-08, + 1.0712753351072024e-08 + ], + "gamma_dfa": 0.05281454947544262, + "acc_eval": 0.10546875, + "loss_eval": 18.456693649291992, + "epoch": 91 + }, + { + "hidden_norms": [ + 76216.3125, + 270347840.0, + 198067872.0, + 225002016.0, + 108500144.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.769242754169682e-08, + 1.795031345785958e-10, + 1.7781580374798267e-10, + 1.773555469153365e-10, + 1.7679230301936855e-10 + ], + "bp_grad_norms_F": [ + 1.0288722478435375e-05, + 1.4910959578173788e-08, + 1.1187878179441668e-08, + 1.0935604422002143e-08, + 1.070183497375865e-08 + ], + "gamma_dfa": 0.052812248992267996, + "acc_eval": 0.10546875, + "loss_eval": 18.479557037353516, + "epoch": 92 + }, + { + "hidden_norms": [ + 76238.2890625, + 270583392.0, + 198231920.0, + 225197232.0, + 108588960.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.765692172119088e-08, + 1.794125820131498e-10, + 1.7771174809499968e-10, + 1.7726634049530787e-10, + 1.7670596930141613e-10 + ], + "bp_grad_norms_F": [ + 1.0287496479577385e-05, + 1.490491285949247e-08, + 1.1181702674889493e-08, + 1.0929432470163647e-08, + 1.0695790031434171e-08 + ], + "gamma_dfa": 0.052826936458586715, + "acc_eval": 0.10546875, + "loss_eval": 18.482463836669922, + "epoch": 93 + }, + { + "hidden_norms": [ + 76254.984375, + 270769600.0, + 198360864.0, + 225341792.0, + 108654560.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.761775660559579e-08, + 1.7933368678946238e-10, + 1.776363084404764e-10, + 1.7719105349645048e-10, + 1.766297247352e-10 + ], + "bp_grad_norms_F": [ + 1.0286962606187444e-05, + 1.4897207911701571e-08, + 1.1177347936097703e-08, + 1.0925224280811108e-08, + 1.0691623586467358e-08 + ], + "gamma_dfa": 0.052814016249612905, + "acc_eval": 0.10546875, + "loss_eval": 18.48452377319336, + "epoch": 94 + }, + { + "hidden_norms": [ + 76267.0, + 270906656.0, + 198453952.0, + 225448800.0, + 108703144.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.761757186448449e-08, + 1.792699738656367e-10, + 1.7757639803051006e-10, + 1.771305185860328e-10, + 1.7656787143494057e-10 + ], + "bp_grad_norms_F": [ + 1.0286720680596773e-05, + 1.4893439370666783e-08, + 1.1173768577066312e-08, + 1.0921708870625935e-08, + 1.0688168572414725e-08 + ], + "gamma_dfa": 0.05281054192164447, + "acc_eval": 0.10546875, + "loss_eval": 18.48675537109375, + "epoch": 95 + }, + { + "hidden_norms": [ + 76274.53125, + 270996800.0, + 198521872.0, + 225534016.0, + 108737184.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.757600511444252e-08, + 1.7921109041196814e-10, + 1.7751719538772193e-10, + 1.7707224575502778e-10, + 1.7651151373865304e-10 + ], + "bp_grad_norms_F": [ + 1.0285029929946177e-05, + 1.4889327104583572e-08, + 1.1170673275273657e-08, + 1.09186730767874e-08, + 1.0685286433442798e-08 + ], + "gamma_dfa": 0.052804862934863195, + "acc_eval": 0.10546875, + "loss_eval": 18.492807388305664, + "epoch": 96 + }, + { + "hidden_norms": [ + 76278.6171875, + 271041184.0, + 198554096.0, + 225570960.0, + 108751040.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758564717936679e-08, + 1.791868459166679e-10, + 1.7749526848298558e-10, + 1.770504159948061e-10, + 1.7648858763319453e-10 + ], + "bp_grad_norms_F": [ + 1.028558563120896e-05, + 1.4887539201424715e-08, + 1.1169264624300013e-08, + 1.091728041302531e-08, + 1.068388577607493e-08 + ], + "gamma_dfa": 0.052804886450758204, + "acc_eval": 0.10546875, + "loss_eval": 18.49222183227539, + "epoch": 97 + }, + { + "hidden_norms": [ + 76282.2109375, + 271081440.0, + 198586512.0, + 225606800.0, + 108767848.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758451741641693e-08, + 1.7916516881211209e-10, + 1.7747517344623986e-10, + 1.7702975196876025e-10, + 1.764676044180291e-10 + ], + "bp_grad_norms_F": [ + 1.028525730362162e-05, + 1.488619361111887e-08, + 1.1168157953989066e-08, + 1.0916189729925918e-08, + 1.0682827955577068e-08 + ], + "gamma_dfa": 0.05280597397359088, + "acc_eval": 0.10546875, + "loss_eval": 18.493602752685547, + "epoch": 98 + }, + { + "hidden_norms": [ + 76284.046875, + 271101920.0, + 198601280.0, + 225624992.0, + 108775912.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758536296227248e-08, + 1.7915657846145905e-10, + 1.7746643043992094e-10, + 1.7702135590713652e-10, + 1.7645920835640538e-10 + ], + "bp_grad_norms_F": [ + 1.028511906042695e-05, + 1.488560208429135e-08, + 1.1167605507012013e-08, + 1.0915637282948865e-08, + 1.0682285278562631e-08 + ], + "gamma_dfa": 0.05280651607608888, + "acc_eval": 0.10546875, + "loss_eval": 18.494029998779297, + "epoch": 99 + }, + { + "hidden_norms": [ + 76284.0703125, + 271101952.0, + 198601472.0, + 225625280.0, + 108776088.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.758680536402608e-08, + 1.7915803562917887e-10, + 1.7746806801888226e-10, + 1.7702275756370511e-10, + 1.7646061001297397e-10 + ], + "bp_grad_norms_F": [ + 1.0285211828886531e-05, + 1.488571665930749e-08, + 1.1167688107605045e-08, + 1.0915716330828218e-08, + 1.0682358109193046e-08 + ], + "gamma_dfa": 0.052806626496021636, + "acc_eval": 0.10546875, + "loss_eval": 18.493879318237305, + "epoch": 100 + } + ] +}
\ No newline at end of file |
