diff options
Diffstat (limited to 'results/snapshot_vit_v1/snapshot_vit_s123.json')
| -rw-r--r-- | results/snapshot_vit_v1/snapshot_vit_s123.json | 4594 |
1 files changed, 4594 insertions, 0 deletions
diff --git a/results/snapshot_vit_v1/snapshot_vit_s123.json b/results/snapshot_vit_v1/snapshot_vit_s123.json new file mode 100644 index 0000000..93853cf --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_vit_s123.json @@ -0,0 +1,4594 @@ +{ + "config": { + "output_dir": "results/snapshot_vit_v1", + "epochs": 60, + "lr": 0.001, + "wd": 0.05, + "seed": 123, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.3210873007774353, + 3.3568029403686523, + 4.891699314117432, + 6.200707912445068, + 7.5911865234375 + ], + "hidden_norms_avg": [ + 5.7549052238464355, + 6.750590801239014, + 7.9020819664001465, + 8.925304412841797, + 10.076716423034668 + ], + "bp_grad_per_sample_l2_med": [ + 0.004074312746524811, + 0.0011155740357935429, + 0.0009667170234024525, + 0.0008621186716482043, + 0.0008127145702019334 + ], + "bp_grad_F": [ + 0.20160320401191711, + 0.039521340280771255, + 0.033098917454481125, + 0.029271923005580902, + 0.027136052027344704 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.125, + "loss_eval": 2.422111988067627, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.4782717227935791, + 11.874238014221191, + 20.313709259033203, + 26.86528778076172, + 32.42327880859375 + ], + "hidden_norms_avg": [ + 3.8830745220184326, + 11.266603469848633, + 17.881502151489258, + 23.234352111816406, + 28.51181411743164 + ], + "bp_grad_per_sample_l2_med": [ + 0.002827065996825695, + 0.00024586476502008736, + 0.00014567613834515214, + 0.00013882767234463245, + 0.0001400413311785087 + ], + "bp_grad_F": [ + 0.12621107697486877, + 0.009982436895370483, + 0.00507162231951952, + 0.004677945747971535, + 0.004658848978579044 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4697265625, + "loss_eval": 1.4472862482070923, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.6104467511177063, + 13.787332534790039, + 22.073436737060547, + 28.480369567871094, + 33.141117095947266 + ], + "hidden_norms_avg": [ + 3.951775074005127, + 12.005932807922363, + 18.336896896362305, + 23.67597198486328, + 27.899608612060547 + ], + "bp_grad_per_sample_l2_med": [ + 0.002604336943477392, + 0.00026667251950129867, + 0.00014805165119469166, + 0.00013079405471216887, + 0.00012911780504509807 + ], + "bp_grad_F": [ + 0.12487494200468063, + 0.010650832206010818, + 0.005604646634310484, + 0.004644650500267744, + 0.00448915408924222 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5146484375, + "loss_eval": 1.291869878768921, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.7104504108428955, + 13.74225902557373, + 21.90972328186035, + 28.958967208862305, + 33.262393951416016 + ], + "hidden_norms_avg": [ + 3.9180142879486084, + 13.097892761230469, + 19.570770263671875, + 24.899248123168945, + 28.65104866027832 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020766372326761484, + 0.00025831969105638564, + 0.00014769421250093728, + 0.00012920337030664086, + 0.00012324318231549114 + ], + "bp_grad_F": [ + 0.09676238149404526, + 0.010603155009448528, + 0.005832126829773188, + 0.00465927692130208, + 0.004435759503394365 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.529296875, + "loss_eval": 1.2694497108459473, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.801612377166748, + 12.882991790771484, + 20.474157333374023, + 27.37413215637207, + 32.06389617919922 + ], + "hidden_norms_avg": [ + 3.8871910572052, + 13.333250999450684, + 19.042104721069336, + 24.029348373413086, + 27.96086311340332 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020045258570462465, + 0.000285606540273875, + 0.00016217664233408868, + 0.00013080642384011298, + 0.00011968115722993389 + ], + "bp_grad_F": [ + 0.09496191889047623, + 0.011928788386285305, + 0.006509022321552038, + 0.005044482182711363, + 0.004537967965006828 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.58203125, + "loss_eval": 1.119094967842102, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.8653663396835327, + 12.994612693786621, + 20.49618148803711, + 26.709278106689453, + 30.303852081298828 + ], + "hidden_norms_avg": [ + 4.018242835998535, + 13.520885467529297, + 19.090721130371094, + 23.6751651763916, + 26.93212890625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018953323597088456, + 0.000296358106425032, + 0.00017310198745690286, + 0.0001364975469186902, + 0.00012098452862119302 + ], + "bp_grad_F": [ + 0.09499228745698929, + 0.012825642712414265, + 0.007407570723444223, + 0.005570532754063606, + 0.004951393231749535 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.595703125, + "loss_eval": 1.0847156047821045, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.9313029646873474, + 13.966381072998047, + 21.648372650146484, + 28.33364486694336, + 32.91484069824219 + ], + "hidden_norms_avg": [ + 4.053382396697998, + 15.042261123657227, + 20.74883270263672, + 25.032489776611328, + 28.55679702758789 + ], + "bp_grad_per_sample_l2_med": [ + 0.001841629622504115, + 0.0002753600711002946, + 0.0001624371943762526, + 0.0001305017649428919, + 0.00011278261081315577 + ], + "bp_grad_F": [ + 0.09068351984024048, + 0.0128449946641922, + 0.007257991470396519, + 0.005361978895962238, + 0.004660472739487886 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6103515625, + "loss_eval": 1.095273494720459, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 0.9818395972251892, + 13.022477149963379, + 20.385391235351562, + 27.03214454650879, + 31.324769973754883 + ], + "hidden_norms_avg": [ + 4.1024041175842285, + 14.697205543518066, + 19.634239196777344, + 23.90021324157715, + 27.306678771972656 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015902157174423337, + 0.00027956697158515453, + 0.0001692597143119201, + 0.0001353132538497448, + 0.00011523282591952011 + ], + "bp_grad_F": [ + 0.07967441529035568, + 0.012528380379080772, + 0.007520876359194517, + 0.00570708978921175, + 0.004875381011515856 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.62890625, + "loss_eval": 1.0069011449813843, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 1.0194361209869385, + 13.912450790405273, + 20.85824203491211, + 27.968477249145508, + 32.243431091308594 + ], + "hidden_norms_avg": [ + 4.178755283355713, + 14.875143051147461, + 20.261545181274414, + 24.636741638183594, + 27.893512725830078 + ], + "bp_grad_per_sample_l2_med": [ + 0.001506888889707625, + 0.00028421770548447967, + 0.0001727779454085976, + 0.00013076694449409842, + 0.00010860477777896449 + ], + "bp_grad_F": [ + 0.07398127764463425, + 0.013124965131282806, + 0.007798053789883852, + 0.005717460531741381, + 0.004830002784729004 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.638671875, + "loss_eval": 0.9834396839141846, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 1.077261209487915, + 12.524529457092285, + 19.766538619995117, + 25.7626895904541, + 30.03727149963379 + ], + "hidden_norms_avg": [ + 4.1816864013671875, + 14.304539680480957, + 19.208524703979492, + 23.25862693786621, + 26.313356399536133 + ], + "bp_grad_per_sample_l2_med": [ + 0.0014360174536705017, + 0.0003003668098244816, + 0.0001815372525015846, + 0.0001390709658153355, + 0.00011320491466904059 + ], + "bp_grad_F": [ + 0.0756259635090828, + 0.014865156263113022, + 0.008982912637293339, + 0.006551471073180437, + 0.005398898851126432 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6494140625, + "loss_eval": 0.971701979637146, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 1.1200045347213745, + 12.160452842712402, + 19.172168731689453, + 25.067665100097656, + 28.764787673950195 + ], + "hidden_norms_avg": [ + 4.289422035217285, + 15.51036262512207, + 20.407268524169922, + 24.061931610107422, + 26.493688583374023 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012870824430137873, + 0.00027074789977632463, + 0.0001742457679938525, + 0.0001348328951280564, + 0.000104573555290699 + ], + "bp_grad_F": [ + 0.07437644153833389, + 0.015084434300661087, + 0.009522279724478722, + 0.0069595095701515675, + 0.0055610560812056065 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6767578125, + "loss_eval": 0.8734689354896545, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 1.1509246826171875, + 12.219743728637695, + 19.352998733520508, + 25.70184326171875, + 29.580278396606445 + ], + "hidden_norms_avg": [ + 4.315939426422119, + 15.6610689163208, + 20.42215347290039, + 24.016841888427734, + 26.62118911743164 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013146374840289354, + 0.0002733681467361748, + 0.0001865291123976931, + 0.00013389455853030086, + 0.00010298956476617604 + ], + "bp_grad_F": [ + 0.07836466282606125, + 0.015104672871530056, + 0.009902945719659328, + 0.0069915857166051865, + 0.005596037954092026 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6767578125, + "loss_eval": 0.917751669883728, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 1.2017452716827393, + 12.72107219696045, + 18.952699661254883, + 25.067615509033203, + 29.466550827026367 + ], + "hidden_norms_avg": [ + 4.358119487762451, + 15.672205924987793, + 20.140914916992188, + 24.013885498046875, + 26.668514251708984 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011630960507318377, + 0.00025659528910182416, + 0.0001693729282123968, + 0.0001237613905686885, + 9.384296572534367e-05 + ], + "bp_grad_F": [ + 0.07334695011377335, + 0.015075902454555035, + 0.009827414527535439, + 0.007068648934364319, + 0.005549146793782711 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6982421875, + "loss_eval": 0.8279671669006348, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 1.234994649887085, + 12.283885955810547, + 18.62163543701172, + 24.3900203704834, + 28.36040496826172 + ], + "hidden_norms_avg": [ + 4.369320869445801, + 15.747625350952148, + 19.76953887939453, + 23.351999282836914, + 25.69841194152832 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011812442680820823, + 0.0002851892786566168, + 0.0001940266229212284, + 0.00013827465591020882, + 0.00010182376718148589 + ], + "bp_grad_F": [ + 0.07158326357603073, + 0.01604902744293213, + 0.010893523693084717, + 0.007844515144824982, + 0.005985426716506481 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.689453125, + "loss_eval": 0.8679210543632507, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 1.2675292491912842, + 11.706314086914062, + 18.347841262817383, + 24.01951789855957, + 28.1114501953125 + ], + "hidden_norms_avg": [ + 4.390969753265381, + 15.140497207641602, + 19.62596893310547, + 23.22857666015625, + 25.681791305541992 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010449079563841224, + 0.0002611770760267973, + 0.00017687672516331077, + 0.00012088462244719267, + 8.996625547297299e-05 + ], + "bp_grad_F": [ + 0.06979352980852127, + 0.016320781782269478, + 0.01088168565183878, + 0.007916715927422047, + 0.006064872723072767 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6884765625, + "loss_eval": 0.8092349767684937, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 1.2957582473754883, + 11.933137893676758, + 18.238237380981445, + 23.88395118713379, + 27.868513107299805 + ], + "hidden_norms_avg": [ + 4.4383697509765625, + 15.46267318725586, + 19.841346740722656, + 23.529712677001953, + 25.852684020996094 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009947444777935743, + 0.00024384066637139767, + 0.00016608397709205747, + 0.0001234996016137302, + 9.023427992360666e-05 + ], + "bp_grad_F": [ + 0.07019422203302383, + 0.016806265339255333, + 0.011433122679591179, + 0.008135766722261906, + 0.006158903241157532 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.712890625, + "loss_eval": 0.7795700430870056, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 1.3391923904418945, + 11.329567909240723, + 17.184999465942383, + 22.353059768676758, + 26.889299392700195 + ], + "hidden_norms_avg": [ + 4.53090238571167, + 15.341407775878906, + 19.109649658203125, + 22.223899841308594, + 24.45347023010254 + ], + "bp_grad_per_sample_l2_med": [ + 0.001086357282474637, + 0.00030167572549544275, + 0.0002114812668878585, + 0.00015480270667467266, + 0.00010993685282301158 + ], + "bp_grad_F": [ + 0.06569939106702805, + 0.017201317474246025, + 0.012068319134414196, + 0.008909368887543678, + 0.006427914369851351 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7314453125, + "loss_eval": 0.7724976539611816, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 1.3643215894699097, + 10.724340438842773, + 16.144981384277344, + 21.656490325927734, + 25.777481079101562 + ], + "hidden_norms_avg": [ + 4.520992279052734, + 15.036820411682129, + 18.98927879333496, + 22.688859939575195, + 24.71843910217285 + ], + "bp_grad_per_sample_l2_med": [ + 0.000967099389526993, + 0.0002715744194574654, + 0.00019328886992298067, + 0.00013628297892864794, + 9.314809722127393e-05 + ], + "bp_grad_F": [ + 0.06768078356981277, + 0.01841692440211773, + 0.012980606406927109, + 0.009295133873820305, + 0.006698420271277428 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.73828125, + "loss_eval": 0.7337102890014648, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 1.3963993787765503, + 11.463358879089355, + 16.49429702758789, + 21.585325241088867, + 25.636695861816406 + ], + "hidden_norms_avg": [ + 4.539251327514648, + 14.975208282470703, + 18.360631942749023, + 21.586400985717773, + 23.561830520629883 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008780099451541901, + 0.00024953793035820127, + 0.00017615300021134317, + 0.00012566034274641424, + 8.528940088581294e-05 + ], + "bp_grad_F": [ + 0.07198558002710342, + 0.019673649221658707, + 0.013869633898139, + 0.009656366892158985, + 0.006824122741818428 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7451171875, + "loss_eval": 0.7211208343505859, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 1.421103835105896, + 9.9105806350708, + 15.361790657043457, + 20.334768295288086, + 24.506919860839844 + ], + "hidden_norms_avg": [ + 4.622361660003662, + 14.7937650680542, + 18.042116165161133, + 21.208105087280273, + 23.21940040588379 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007793674594722688, + 0.0002331113355467096, + 0.00016331924416590482, + 0.00011330798588460311, + 7.215427467599511e-05 + ], + "bp_grad_F": [ + 0.07613872736692429, + 0.022306306287646294, + 0.015858706086874008, + 0.011275039985775948, + 0.007263499312102795 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7392578125, + "loss_eval": 0.7346716523170471, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 1.4554439783096313, + 10.118419647216797, + 15.106456756591797, + 20.052860260009766, + 24.34604263305664 + ], + "hidden_norms_avg": [ + 4.584441661834717, + 14.634279251098633, + 17.785133361816406, + 21.110010147094727, + 22.89650535583496 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007524031680077314, + 0.0002260785986436531, + 0.00016854463319759816, + 0.00011997718684142455, + 7.738151180092245e-05 + ], + "bp_grad_F": [ + 0.07370379567146301, + 0.021284889429807663, + 0.015382407233119011, + 0.010745048522949219, + 0.007394883316010237 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.74609375, + "loss_eval": 0.7024286389350891, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 1.4652466773986816, + 10.145299911499023, + 15.15330982208252, + 20.131061553955078, + 23.987186431884766 + ], + "hidden_norms_avg": [ + 4.602361679077148, + 14.532269477844238, + 17.825733184814453, + 21.43619728088379, + 23.12371253967285 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008222013129852712, + 0.0002455596113577485, + 0.00017989490879699588, + 0.00012026322656311095, + 8.26524556032382e-05 + ], + "bp_grad_F": [ + 0.0741497054696083, + 0.020758304744958878, + 0.01482379250228405, + 0.010753357782959938, + 0.007582026533782482 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7412109375, + "loss_eval": 0.7016957402229309, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 1.480756402015686, + 10.028592109680176, + 14.573174476623535, + 19.24639320373535, + 23.3629150390625 + ], + "hidden_norms_avg": [ + 4.621757984161377, + 14.29589557647705, + 17.4040470123291, + 20.71320343017578, + 22.405963897705078 + ], + "bp_grad_per_sample_l2_med": [ + 0.000667835003696382, + 0.00020642780873458833, + 0.0001538341457489878, + 0.00010652844503056258, + 6.964046770008281e-05 + ], + "bp_grad_F": [ + 0.07375485450029373, + 0.021967202425003052, + 0.016106218099594116, + 0.011507184244692326, + 0.007651185616850853 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7607421875, + "loss_eval": 0.6544591188430786, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 1.5069013833999634, + 9.897040367126465, + 14.096169471740723, + 18.488874435424805, + 22.214311599731445 + ], + "hidden_norms_avg": [ + 4.621402263641357, + 13.978808403015137, + 16.55535888671875, + 19.729736328125, + 21.272388458251953 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007426440715789795, + 0.0002414636837784201, + 0.00018161055049858987, + 0.00012697202328126878, + 8.096778037725016e-05 + ], + "bp_grad_F": [ + 0.07682260870933533, + 0.02333010919392109, + 0.017287475988268852, + 0.012499523349106312, + 0.008510846644639969 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7568359375, + "loss_eval": 0.6971542835235596, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 1.5169755220413208, + 9.5064058303833, + 13.812594413757324, + 17.95937156677246, + 21.51923370361328 + ], + "hidden_norms_avg": [ + 4.612667083740234, + 13.86723804473877, + 16.418981552124023, + 19.12198257446289, + 20.565521240234375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007257908000610769, + 0.00024720808141864836, + 0.0001871327986009419, + 0.00013439780741464347, + 8.671147952554747e-05 + ], + "bp_grad_F": [ + 0.07474599778652191, + 0.024257108569145203, + 0.01782340556383133, + 0.01281843613833189, + 0.008487668819725513 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.763671875, + "loss_eval": 0.6618016958236694, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 1.5133440494537354, + 9.023777961730957, + 13.088467597961426, + 17.324251174926758, + 21.083759307861328 + ], + "hidden_norms_avg": [ + 4.670994281768799, + 13.658943176269531, + 16.629199981689453, + 19.75893783569336, + 21.12710952758789 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005614451365545392, + 0.0001914121676236391, + 0.00014186649059411138, + 0.00010088241106132045, + 6.150588887976483e-05 + ], + "bp_grad_F": [ + 0.08172759413719177, + 0.027048049494624138, + 0.019993988797068596, + 0.014050732366740704, + 0.009047404862940311 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7626953125, + "loss_eval": 0.6708824634552002, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 1.5329865217208862, + 8.596381187438965, + 12.645307540893555, + 16.668807983398438, + 20.51462745666504 + ], + "hidden_norms_avg": [ + 4.642580986022949, + 13.140735626220703, + 15.32632064819336, + 17.985010147094727, + 19.472858428955078 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005455430946312845, + 0.00019156686903443187, + 0.00014253854169510305, + 0.00010098751954501495, + 6.338314415188506e-05 + ], + "bp_grad_F": [ + 0.08767001330852509, + 0.029545463621616364, + 0.021587952971458435, + 0.014973495155572891, + 0.009515349753201008 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.767578125, + "loss_eval": 0.6813780069351196, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 1.554770588874817, + 8.98424243927002, + 12.76674747467041, + 16.438858032226562, + 19.893146514892578 + ], + "hidden_norms_avg": [ + 4.635522365570068, + 13.039203643798828, + 15.419903755187988, + 18.176319122314453, + 19.39232635498047 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005697832675650716, + 0.0001985357521334663, + 0.0001536469644634053, + 0.00010455933079356328, + 6.821998249506578e-05 + ], + "bp_grad_F": [ + 0.07977671921253204, + 0.02706393413245678, + 0.020037846639752388, + 0.014591805636882782, + 0.009512925520539284 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.628034770488739, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 1.5515426397323608, + 8.19682788848877, + 11.861184120178223, + 15.59919548034668, + 18.893400192260742 + ], + "hidden_norms_avg": [ + 4.5841450691223145, + 12.511472702026367, + 14.583609580993652, + 16.949586868286133, + 18.082292556762695 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005373116582632065, + 0.0001997901708818972, + 0.0001489907590439543, + 0.00010373342229286209, + 6.318451050901785e-05 + ], + "bp_grad_F": [ + 0.09340352565050125, + 0.03397079557180405, + 0.025108041241765022, + 0.017669958993792534, + 0.010975479148328304 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.767578125, + "loss_eval": 0.7042175531387329, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 1.5542187690734863, + 8.489326477050781, + 11.786734580993652, + 15.331045150756836, + 18.48196792602539 + ], + "hidden_norms_avg": [ + 4.615735054016113, + 12.620647430419922, + 14.822388648986816, + 17.454334259033203, + 18.677461624145508 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005812083836644888, + 0.00021461205324158072, + 0.00015997944865375757, + 0.00011693408305291086, + 7.380295573966578e-05 + ], + "bp_grad_F": [ + 0.09380948543548584, + 0.03345760330557823, + 0.025129586458206177, + 0.01789030432701111, + 0.011130682192742825 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7666015625, + "loss_eval": 0.6850110292434692, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 1.5533884763717651, + 8.01724910736084, + 11.423017501831055, + 15.046612739562988, + 18.549089431762695 + ], + "hidden_norms_avg": [ + 4.590519428253174, + 12.431540489196777, + 14.243208885192871, + 16.609176635742188, + 18.00058937072754 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004959268844686449, + 0.00020078590023331344, + 0.00015426705067511648, + 0.00010096926416736096, + 5.95865749346558e-05 + ], + "bp_grad_F": [ + 0.09663982689380646, + 0.036162860691547394, + 0.02716146595776081, + 0.01926880143582821, + 0.011334826238453388 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.6707749366760254, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 1.5530469417572021, + 7.959159851074219, + 11.2805757522583, + 14.567391395568848, + 17.63263511657715 + ], + "hidden_norms_avg": [ + 4.583434581756592, + 11.983453750610352, + 13.4386625289917, + 15.498583793640137, + 16.631824493408203 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005142099689692259, + 0.00020230942755006254, + 0.00015552931290585548, + 0.00011007695866283029, + 6.233472959138453e-05 + ], + "bp_grad_F": [ + 0.09787525236606598, + 0.037690743803977966, + 0.028980012983083725, + 0.02064511366188526, + 0.012224731035530567 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.6748013496398926, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 1.5515272617340088, + 7.847743988037109, + 10.868992805480957, + 14.282126426696777, + 17.300424575805664 + ], + "hidden_norms_avg": [ + 4.579150199890137, + 11.951078414916992, + 13.621748924255371, + 15.971713066101074, + 17.04889488220215 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004585929855238646, + 0.00017806614050641656, + 0.0001380510366288945, + 9.63187703746371e-05, + 5.829996371176094e-05 + ], + "bp_grad_F": [ + 0.10181005299091339, + 0.038575656712055206, + 0.02964734099805355, + 0.020979750901460648, + 0.01240287534892559 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78125, + "loss_eval": 0.648021936416626, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 1.5606788396835327, + 7.502675533294678, + 10.430459022521973, + 13.642136573791504, + 16.445953369140625 + ], + "hidden_norms_avg": [ + 4.601283550262451, + 11.615697860717773, + 13.472222328186035, + 15.831238746643066, + 16.856765747070312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004074577009305358, + 0.00017814920283854008, + 0.00013730341743212193, + 9.565176151227206e-05, + 5.229458474786952e-05 + ], + "bp_grad_F": [ + 0.11506060510873795, + 0.04695325344800949, + 0.03571247681975365, + 0.025198202580213547, + 0.013851121068000793 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.755859375, + "loss_eval": 0.7299192547798157, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 1.5404834747314453, + 7.528626441955566, + 10.384718894958496, + 13.326257705688477, + 16.41958999633789 + ], + "hidden_norms_avg": [ + 4.533090591430664, + 11.6575345993042, + 13.231060028076172, + 15.337231636047363, + 16.463298797607422 + ], + "bp_grad_per_sample_l2_med": [ + 0.00042279696208424866, + 0.00016955600585788488, + 0.00012915951083414257, + 8.976108074421063e-05, + 4.930083014187403e-05 + ], + "bp_grad_F": [ + 0.11639728397130966, + 0.047109171748161316, + 0.03660130873322487, + 0.02588750049471855, + 0.013930009678006172 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.7065586447715759, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 1.539638638496399, + 7.26485013961792, + 9.96584701538086, + 13.003418922424316, + 16.14008140563965 + ], + "hidden_norms_avg": [ + 4.537028789520264, + 11.146146774291992, + 12.836923599243164, + 14.992585182189941, + 16.076574325561523 + ], + "bp_grad_per_sample_l2_med": [ + 0.00039646061486564577, + 0.00017108044994529337, + 0.00013601842510979623, + 9.225023677572608e-05, + 4.893271398032084e-05 + ], + "bp_grad_F": [ + 0.11648086458444595, + 0.04862738400697708, + 0.0374443456530571, + 0.026762915775179863, + 0.014388044364750385 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7939453125, + "loss_eval": 0.6772804260253906, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 1.5278778076171875, + 7.107171058654785, + 9.836174011230469, + 12.691095352172852, + 15.726043701171875 + ], + "hidden_norms_avg": [ + 4.5205254554748535, + 10.983088493347168, + 12.684239387512207, + 14.876561164855957, + 15.817031860351562 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003774319775402546, + 0.00015706375415902585, + 0.0001264828024432063, + 8.857168722897768e-05, + 4.440043630893342e-05 + ], + "bp_grad_F": [ + 0.12492093443870544, + 0.053397826850414276, + 0.040937285870313644, + 0.029012493789196014, + 0.015446576289832592 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7724609375, + "loss_eval": 0.707297146320343, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 1.51571524143219, + 7.153889179229736, + 9.856640815734863, + 12.511648178100586, + 15.47674560546875 + ], + "hidden_norms_avg": [ + 4.51829719543457, + 10.948126792907715, + 12.496319770812988, + 14.353506088256836, + 15.267280578613281 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003654273459687829, + 0.00015038737910799682, + 0.00011584001913433895, + 8.340556814800948e-05, + 4.3377422116464004e-05 + ], + "bp_grad_F": [ + 0.13914552330970764, + 0.0589178130030632, + 0.04522731155157089, + 0.0323280394077301, + 0.016300896182656288 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7626953125, + "loss_eval": 0.729290246963501, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 1.5081822872161865, + 6.952159404754639, + 9.558011054992676, + 12.107258796691895, + 15.05250358581543 + ], + "hidden_norms_avg": [ + 4.481203556060791, + 10.740157127380371, + 12.00869083404541, + 13.831336975097656, + 14.76778507232666 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003083393967244774, + 0.00012594371219165623, + 0.00010108885180670768, + 7.270355854416266e-05, + 3.639453643700108e-05 + ], + "bp_grad_F": [ + 0.14465992152690887, + 0.061646901071071625, + 0.047660429030656815, + 0.03381076827645302, + 0.01706051267683506 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7685546875, + "loss_eval": 0.7395438551902771, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 1.5159180164337158, + 6.878056526184082, + 9.382442474365234, + 11.969950675964355, + 15.129233360290527 + ], + "hidden_norms_avg": [ + 4.494526386260986, + 10.639691352844238, + 12.291059494018555, + 14.28632640838623, + 15.170000076293945 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028951463173143566, + 0.00012502263416536152, + 0.00010040518827736378, + 7.046512473607436e-05, + 3.719307642313652e-05 + ], + "bp_grad_F": [ + 0.1406005620956421, + 0.06109313294291496, + 0.047722309827804565, + 0.033977217972278595, + 0.01711316779255867 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7802734375, + "loss_eval": 0.7057114839553833, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 1.5058479309082031, + 6.699619770050049, + 9.136896133422852, + 11.609856605529785, + 14.701480865478516 + ], + "hidden_norms_avg": [ + 4.482093811035156, + 10.446189880371094, + 12.056195259094238, + 13.87569522857666, + 14.783234596252441 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002856751380022615, + 0.00013275284436531365, + 0.00010139105870621279, + 6.966136425035074e-05, + 3.293903864687309e-05 + ], + "bp_grad_F": [ + 0.1529398262500763, + 0.06890096515417099, + 0.052683208137750626, + 0.03734185919165611, + 0.01789216138422489 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.7478293180465698, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 1.490049123764038, + 6.627772331237793, + 9.019189834594727, + 11.385313987731934, + 14.173355102539062 + ], + "hidden_norms_avg": [ + 4.458098411560059, + 10.279450416564941, + 11.593936920166016, + 13.30923080444336, + 14.155406951904297 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021343027765396982, + 9.837630932452157e-05, + 8.006956340977922e-05, + 5.6768003560137004e-05, + 2.7385456633055583e-05 + ], + "bp_grad_F": [ + 0.15772707760334015, + 0.07120667397975922, + 0.05564703419804573, + 0.03953033685684204, + 0.018776116892695427 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7724609375, + "loss_eval": 0.7677009105682373, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 1.4904595613479614, + 6.347933769226074, + 8.674281120300293, + 11.007567405700684, + 14.106690406799316 + ], + "hidden_norms_avg": [ + 4.430132865905762, + 10.265702247619629, + 11.588266372680664, + 13.410375595092773, + 14.36179256439209 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002224426862085238, + 0.00010000570182455704, + 7.794459816068411e-05, + 5.595289985649288e-05, + 2.7256841349299066e-05 + ], + "bp_grad_F": [ + 0.16928334534168243, + 0.07747916132211685, + 0.06056727096438408, + 0.04274875670671463, + 0.019731448963284492 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.771484375, + "loss_eval": 0.7774850726127625, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 1.4839239120483398, + 6.341518878936768, + 8.600671768188477, + 10.991724014282227, + 14.061833381652832 + ], + "hidden_norms_avg": [ + 4.403061866760254, + 10.020040512084961, + 11.371668815612793, + 13.18271255493164, + 14.007345199584961 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002152575325453654, + 0.00010309015488019213, + 7.964189717313275e-05, + 5.283725113258697e-05, + 2.479495196894277e-05 + ], + "bp_grad_F": [ + 0.17190901935100555, + 0.080362468957901, + 0.06201368197798729, + 0.042563296854496, + 0.019763268530368805 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.7503129243850708, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 1.479953408241272, + 6.386821269989014, + 8.521474838256836, + 10.847907066345215, + 13.541037559509277 + ], + "hidden_norms_avg": [ + 4.399942874908447, + 9.979388236999512, + 11.251038551330566, + 12.998858451843262, + 13.76570987701416 + ], + "bp_grad_per_sample_l2_med": [ + 0.000195752116269432, + 9.365259029436857e-05, + 7.282401929842308e-05, + 5.209222945268266e-05, + 2.3047552531352267e-05 + ], + "bp_grad_F": [ + 0.16316288709640503, + 0.07674747705459595, + 0.06052006781101227, + 0.04277755320072174, + 0.020131859928369522 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7978515625, + "loss_eval": 0.732360303401947, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 1.4770045280456543, + 6.249807834625244, + 8.36440658569336, + 10.429434776306152, + 13.045490264892578 + ], + "hidden_norms_avg": [ + 4.391754627227783, + 9.821492195129395, + 10.789708137512207, + 12.3140869140625, + 13.067754745483398 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002329840644961223, + 0.00011798225023085251, + 9.261347440769896e-05, + 6.294570630416274e-05, + 2.9543562050093897e-05 + ], + "bp_grad_F": [ + 0.1812749058008194, + 0.08621949702501297, + 0.067754827439785, + 0.04831995815038681, + 0.021977350115776062 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.7784227132797241, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 1.467228651046753, + 6.0983357429504395, + 8.231528282165527, + 10.333056449890137, + 13.266757011413574 + ], + "hidden_norms_avg": [ + 4.390368461608887, + 9.647501945495605, + 10.692501068115234, + 12.274677276611328, + 13.044783592224121 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001511751615907997, + 7.784536137478426e-05, + 6.136627780506387e-05, + 4.35807196481619e-05, + 2.014869824051857e-05 + ], + "bp_grad_F": [ + 0.18805110454559326, + 0.09124159067869186, + 0.07224944978952408, + 0.050726212561130524, + 0.02254536561667919 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.814141571521759, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 1.4649879932403564, + 6.082813739776611, + 8.131811141967773, + 10.158056259155273, + 13.049956321716309 + ], + "hidden_norms_avg": [ + 4.377193927764893, + 9.599099159240723, + 10.660999298095703, + 12.21728801727295, + 12.965741157531738 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001712174853309989, + 8.400671504205093e-05, + 6.461612792918459e-05, + 4.6120971092022955e-05, + 2.0111323465243913e-05 + ], + "bp_grad_F": [ + 0.19550266861915588, + 0.09418290108442307, + 0.07462290674448013, + 0.053083814680576324, + 0.02292729914188385 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.7999259233474731, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 1.4617111682891846, + 6.058816432952881, + 8.100686073303223, + 10.085453987121582, + 12.920005798339844 + ], + "hidden_norms_avg": [ + 4.367196559906006, + 9.56169605255127, + 10.609153747558594, + 12.135587692260742, + 12.871316909790039 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015642307698726654, + 7.727487536612898e-05, + 5.90925665164832e-05, + 4.136386633035727e-05, + 1.6983105524559505e-05 + ], + "bp_grad_F": [ + 0.202835351228714, + 0.09727983921766281, + 0.07683655619621277, + 0.05471916124224663, + 0.02326873689889908 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.783203125, + "loss_eval": 0.8152254223823547, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 1.4593255519866943, + 6.017489433288574, + 7.96034049987793, + 9.983046531677246, + 12.839889526367188 + ], + "hidden_norms_avg": [ + 4.349035739898682, + 9.508291244506836, + 10.475739479064941, + 12.025425910949707, + 12.764323234558105 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013039771874900907, + 6.479993317043409e-05, + 5.060105831944384e-05, + 3.637294139480218e-05, + 1.4738084246346261e-05 + ], + "bp_grad_F": [ + 0.2170599102973938, + 0.10417382419109344, + 0.08229079097509384, + 0.05735529586672783, + 0.024290865287184715 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7841796875, + "loss_eval": 0.8357614278793335, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 1.4566220045089722, + 5.9422221183776855, + 7.888944149017334, + 9.933752059936523, + 12.817610740661621 + ], + "hidden_norms_avg": [ + 4.346043109893799, + 9.43443489074707, + 10.415618896484375, + 11.964469909667969, + 12.66396713256836 + ], + "bp_grad_per_sample_l2_med": [ + 0.00011193535465281457, + 5.694849824067205e-05, + 4.533635365078226e-05, + 3.3492226066300645e-05, + 1.4018894034961704e-05 + ], + "bp_grad_F": [ + 0.21774698793888092, + 0.1065358892083168, + 0.08431421220302582, + 0.05883141607046127, + 0.024615641683340073 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.8349668979644775, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 1.4569600820541382, + 5.859008312225342, + 7.792572498321533, + 9.738831520080566, + 12.622002601623535 + ], + "hidden_norms_avg": [ + 4.331563472747803, + 9.398598670959473, + 10.273933410644531, + 11.764141082763672, + 12.436033248901367 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012003595475107431, + 5.908689126954414e-05, + 4.746428385260515e-05, + 3.251975431339815e-05, + 1.3768915778200608e-05 + ], + "bp_grad_F": [ + 0.2144007831811905, + 0.10626016557216644, + 0.08404342085123062, + 0.05926896259188652, + 0.024889416992664337 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7861328125, + "loss_eval": 0.840790331363678, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 1.4559087753295898, + 5.8081440925598145, + 7.735576629638672, + 9.665096282958984, + 12.462581634521484 + ], + "hidden_norms_avg": [ + 4.331978797912598, + 9.35647964477539, + 10.206826210021973, + 11.663065910339355, + 12.307528495788574 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010101464431500062, + 5.143512680660933e-05, + 4.1592236811993644e-05, + 3.0060553399380296e-05, + 1.2701412742899265e-05 + ], + "bp_grad_F": [ + 0.22189198434352875, + 0.11008423566818237, + 0.08644267171621323, + 0.0603644996881485, + 0.025003522634506226 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8574135303497314, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 1.4537159204483032, + 5.80010461807251, + 7.719310760498047, + 9.681657791137695, + 12.724189758300781 + ], + "hidden_norms_avg": [ + 4.318180084228516, + 9.302933692932129, + 10.182857513427734, + 11.675416946411133, + 12.381869316101074 + ], + "bp_grad_per_sample_l2_med": [ + 9.399914415553212e-05, + 4.920759965898469e-05, + 3.82029902539216e-05, + 2.4410484911641106e-05, + 9.912354471453e-06 + ], + "bp_grad_F": [ + 0.2312120646238327, + 0.11490234732627869, + 0.09031722694635391, + 0.06280362606048584, + 0.02546737529337406 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8825892210006714, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 1.4533940553665161, + 5.765341758728027, + 7.664762496948242, + 9.541180610656738, + 12.46136474609375 + ], + "hidden_norms_avg": [ + 4.321633815765381, + 9.284127235412598, + 10.135884284973145, + 11.603636741638184, + 12.27259635925293 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010168847802560776, + 5.239037636783905e-05, + 4.169415478827432e-05, + 2.8813867174903862e-05, + 1.1632122550508939e-05 + ], + "bp_grad_F": [ + 0.23138603568077087, + 0.11581514030694962, + 0.09145721793174744, + 0.06368965655565262, + 0.025816213339567184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8627672791481018, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 1.4520151615142822, + 5.752710342407227, + 7.6372294425964355, + 9.493330001831055, + 12.49281120300293 + ], + "hidden_norms_avg": [ + 4.314420223236084, + 9.275971412658691, + 10.131872177124023, + 11.594268798828125, + 12.271230697631836 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010349372314522043, + 5.0890805141534656e-05, + 4.167861698078923e-05, + 2.9301188988029025e-05, + 1.1288396308373194e-05 + ], + "bp_grad_F": [ + 0.23472057282924652, + 0.11708012968301773, + 0.09245092421770096, + 0.06478185206651688, + 0.025885937735438347 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.8611111640930176, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 1.4508332014083862, + 5.741517066955566, + 7.59091329574585, + 9.493820190429688, + 12.553393363952637 + ], + "hidden_norms_avg": [ + 4.315334320068359, + 9.272273063659668, + 10.107754707336426, + 11.5936279296875, + 12.266173362731934 + ], + "bp_grad_per_sample_l2_med": [ + 9.209421114064753e-05, + 4.9557409511180595e-05, + 3.8665639294777066e-05, + 2.703870450204704e-05, + 1.0333649697713554e-05 + ], + "bp_grad_F": [ + 0.23745231330394745, + 0.11897031217813492, + 0.09419847279787064, + 0.06559450179338455, + 0.02597379870712757 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.8737660646438599, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 1.4514665603637695, + 5.724127292633057, + 7.567911624908447, + 9.464110374450684, + 12.53247356414795 + ], + "hidden_norms_avg": [ + 4.312892436981201, + 9.258728981018066, + 10.092171669006348, + 11.559837341308594, + 12.241935729980469 + ], + "bp_grad_per_sample_l2_med": [ + 8.842872193781659e-05, + 4.636628364096396e-05, + 3.5660887078847736e-05, + 2.4343042241525836e-05, + 9.563225830788724e-06 + ], + "bp_grad_F": [ + 0.23917540907859802, + 0.12006859481334686, + 0.09492167085409164, + 0.06607519090175629, + 0.02614584006369114 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7939453125, + "loss_eval": 0.8743407130241394, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 1.4513946771621704, + 5.7332282066345215, + 7.562880992889404, + 9.466405868530273, + 12.53167724609375 + ], + "hidden_norms_avg": [ + 4.3138651847839355, + 9.26041316986084, + 10.077324867248535, + 11.538521766662598, + 12.218836784362793 + ], + "bp_grad_per_sample_l2_med": [ + 9.282731480197981e-05, + 4.6137181925587356e-05, + 3.7237725337035954e-05, + 2.553310514485929e-05, + 9.964967830455862e-06 + ], + "bp_grad_F": [ + 0.24150457978248596, + 0.12129233777523041, + 0.09592130035161972, + 0.06674522906541824, + 0.026258554309606552 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8750766515731812, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 1.4510550498962402, + 5.730595111846924, + 7.558650493621826, + 9.460441589355469, + 12.49626636505127 + ], + "hidden_norms_avg": [ + 4.311552047729492, + 9.2510347366333, + 10.070302963256836, + 11.530484199523926, + 12.212501525878906 + ], + "bp_grad_per_sample_l2_med": [ + 8.91910312930122e-05, + 4.6800774725852534e-05, + 3.584511432563886e-05, + 2.5313198420917615e-05, + 9.680608854978345e-06 + ], + "bp_grad_F": [ + 0.24175073206424713, + 0.12143565714359283, + 0.09590216726064682, + 0.06680992990732193, + 0.026268428191542625 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.787109375, + "loss_eval": 0.8746636509895325, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 1.450972557067871, + 5.727794647216797, + 7.5582756996154785, + 9.462045669555664, + 12.50033187866211 + ], + "hidden_norms_avg": [ + 4.311238765716553, + 9.248146057128906, + 10.065601348876953, + 11.523144721984863, + 12.206249237060547 + ], + "bp_grad_per_sample_l2_med": [ + 8.883981354301795e-05, + 4.730010550701991e-05, + 3.57187855115626e-05, + 2.4922017473727465e-05, + 9.98118775896728e-06 + ], + "bp_grad_F": [ + 0.24178682267665863, + 0.12154776602983475, + 0.09598654508590698, + 0.06685590744018555, + 0.026261666789650917 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.787109375, + "loss_eval": 0.8750864863395691, + "epoch": 60 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.3210873007774353, + 3.3568029403686523, + 4.891699314117432, + 6.200707912445068, + 7.5911865234375 + ], + "hidden_norms_avg": [ + 5.7549052238464355, + 6.750590801239014, + 7.9020819664001465, + 8.925304412841797, + 10.076716423034668 + ], + "bp_grad_per_sample_l2_med": [ + 0.004074312746524811, + 0.0011155740357935429, + 0.0009667170234024525, + 0.0008621186716482043, + 0.0008127145702019334 + ], + "bp_grad_F": [ + 0.20160320401191711, + 0.039521340280771255, + 0.033098917454481125, + 0.029271923005580902, + 0.027136052027344704 + ], + "gamma_dfa": 0.0011031709145754576, + "gamma_dfa_per_layer": [ + -0.004096934571862221, + -0.003170878393575549, + 0.003171987598761916, + 0.008508509024977684 + ], + "acc_eval": 0.125, + "loss_eval": 2.422111988067627, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.7445409297943115, + 3393.872314453125, + 8096.7275390625, + 11786.4453125, + 15317.9609375 + ], + "hidden_norms_avg": [ + 46.059967041015625, + 2908.78857421875, + 9192.9140625, + 12480.814453125, + 15843.904296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007700070273131132, + 5.177932962396881e-07, + 4.354141651674581e-07, + 4.0796010125632165e-07, + 4.096184795798763e-07 + ], + "bp_grad_F": [ + 0.14847944676876068, + 7.175570499384776e-05, + 1.7355905583826825e-05, + 1.4375820683198981e-05, + 1.4468741937889718e-05 + ], + "gamma_dfa": 0.00903075491078198, + "gamma_dfa_per_layer": [ + 0.014700280502438545, + 0.007455145940184593, + 0.009132559411227703, + 0.004835033789277077 + ], + "acc_eval": 0.2158203125, + "loss_eval": 2.072723388671875, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 3.5329439640045166, + 17943.025390625, + 46227.09765625, + 60098.9921875, + 105510.8828125 + ], + "hidden_norms_avg": [ + 95.54289245605469, + 14775.4267578125, + 44856.01953125, + 59234.35546875, + 87862.078125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00029628784977830946, + 1.0676165373979529e-07, + 7.34040170868866e-08, + 6.658416396021494e-08, + 6.750254044618487e-08 + ], + "bp_grad_F": [ + 0.12055971473455429, + 8.933278149925172e-05, + 3.910079612978734e-06, + 3.3086737403209554e-06, + 3.354543650857522e-06 + ], + "gamma_dfa": 0.007886230800068006, + "gamma_dfa_per_layer": [ + 0.016902755945920944, + 0.003473796183243394, + 0.009775697253644466, + 0.0013926738174632192 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.0924925804138184, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 5.165565013885498, + 33863.33203125, + 93132.8515625, + 145828.34375, + 276496.0 + ], + "hidden_norms_avg": [ + 142.7160186767578, + 36882.9296875, + 93356.96875, + 138199.0625, + 216913.359375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00022745825117453933, + 4.267175768291054e-08, + 3.181965624321492e-08, + 2.8314032007870082e-08, + 2.8843814448009653e-08 + ], + "bp_grad_F": [ + 0.06954267621040344, + 0.00012680335203185678, + 2.0300262804084923e-06, + 1.8529049157223199e-06, + 1.8672349142434541e-06 + ], + "gamma_dfa": 0.00556139531545341, + "gamma_dfa_per_layer": [ + 0.01000538095831871, + 0.0014471756294369698, + 0.011906315572559834, + -0.001113290898501873 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.0521552562713623, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 6.674264907836914, + 43835.6796875, + 150229.609375, + 253133.515625, + 481876.5 + ], + "hidden_norms_avg": [ + 186.87832641601562, + 74412.015625, + 150159.890625, + 253252.734375, + 439077.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003350951592437923, + 2.7693221937852286e-08, + 1.989219278186738e-08, + 1.704596108709211e-08, + 1.7547710839949104e-08 + ], + "bp_grad_F": [ + 0.058595605194568634, + 0.0002476655936334282, + 1.0984595064655878e-06, + 1.0368654557169066e-06, + 1.0405622106191004e-06 + ], + "gamma_dfa": 0.002481349220033735, + "gamma_dfa_per_layer": [ + 3.730843309313059e-05, + 0.0014904557028785348, + 0.011494583450257778, + -0.0030969507060945034 + ], + "acc_eval": 0.232421875, + "loss_eval": 2.058844566345215, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 8.061405181884766, + 102865.78125, + 229004.390625, + 413580.59375, + 706253.625 + ], + "hidden_norms_avg": [ + 228.99224853515625, + 131342.546875, + 229257.390625, + 410435.25, + 727001.6875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00029934433405287564, + 1.670629679040303e-08, + 1.3200744497510186e-08, + 1.1068386207568892e-08, + 1.1248447506773118e-08 + ], + "bp_grad_F": [ + 0.49810686707496643, + 0.0004038630868308246, + 1.391591922583757e-06, + 6.11680206930032e-07, + 5.242948759587307e-07 + ], + "gamma_dfa": 0.0009187236428260803, + "gamma_dfa_per_layer": [ + -0.003027769736945629, + 0.002294017933309078, + 0.00904145184904337, + -0.004632805474102497 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.091141700744629, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 9.400635719299316, + 164205.859375, + 302756.3125, + 584338.25, + 1250749.125 + ], + "hidden_norms_avg": [ + 270.8563232421875, + 190832.34375, + 307117.59375, + 620500.3125, + 1149191.375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00034470504033379257, + 1.3897826889319731e-08, + 8.662226491651381e-09, + 6.850678690994982e-09, + 7.0105756755367565e-09 + ], + "bp_grad_F": [ + 0.08854538202285767, + 0.0002125167811755091, + 3.9876397295302013e-07, + 2.9177280680414697e-07, + 2.903063318626664e-07 + ], + "gamma_dfa": 0.0008902656263671815, + "gamma_dfa_per_layer": [ + -0.004116768017411232, + 0.004187953192740679, + 0.007109872996807098, + -0.003619995666667819 + ], + "acc_eval": 0.208984375, + "loss_eval": 2.09378981590271, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 10.676177978515625, + 216327.671875, + 429372.28125, + 910110.1875, + 1955787.375 + ], + "hidden_norms_avg": [ + 311.3556823730469, + 279124.65625, + 434169.5, + 917506.125, + 1714750.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002802011731546372, + 8.183582700382885e-09, + 5.617039278149605e-09, + 4.765932093420133e-09, + 4.884364024348997e-09 + ], + "bp_grad_F": [ + 0.2021757811307907, + 0.00017153903900180012, + 2.627296851187566e-07, + 1.9583571031489555e-07, + 1.9719628596703842e-07 + ], + "gamma_dfa": 0.00245969754178077, + "gamma_dfa_per_layer": [ + 0.0030665153171867132, + 0.0039703575894236565, + 0.005591260269284248, + -0.0027893430087715387 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0816030502319336, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 11.970849990844727, + 282019.0, + 553729.25, + 1250316.5, + 2676136.75 + ], + "hidden_norms_avg": [ + 350.0874938964844, + 367917.96875, + 563719.125, + 1231394.75, + 2379567.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015754146443214267, + 7.837374305097455e-09, + 4.1749870227647534e-09, + 3.572480755664742e-09, + 3.6429026462059255e-09 + ], + "bp_grad_F": [ + 0.06816119700670242, + 0.0002165154874091968, + 1.8739321205885062e-07, + 1.4396131575722393e-07, + 1.449055417879208e-07 + ], + "gamma_dfa": 0.0018902571755461395, + "gamma_dfa_per_layer": [ + 0.0010774387046694756, + 0.004019944928586483, + 0.004736708011478186, + -0.0022730629425495863 + ], + "acc_eval": 0.2236328125, + "loss_eval": 2.069587469100952, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 13.234355926513672, + 498576.65625, + 747356.3125, + 1569417.0, + 3492356.0 + ], + "hidden_norms_avg": [ + 390.34356689453125, + 517596.5, + 755798.625, + 1559863.25, + 3087860.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012954612611792982, + 6.955718223622398e-09, + 3.3238092278509157e-09, + 2.7362234700234467e-09, + 2.7891511322764018e-09 + ], + "bp_grad_F": [ + 0.03943011909723282, + 0.00019621588580776006, + 1.9796995331944345e-07, + 1.1484767270530938e-07, + 1.1313876058238748e-07 + ], + "gamma_dfa": 0.002013051969697699, + "gamma_dfa_per_layer": [ + 0.0007974229520186782, + 0.0045172227546572685, + 0.004162413999438286, + -0.0014248518273234367 + ], + "acc_eval": 0.21484375, + "loss_eval": 2.0846829414367676, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 14.412362098693848, + 653898.875, + 962527.9375, + 1974772.75, + 4235229.0 + ], + "hidden_norms_avg": [ + 426.1747741699219, + 660897.75, + 954217.625, + 1992937.5, + 3912584.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001297950657317415, + 8.463428180505161e-09, + 2.735849546908753e-09, + 2.2942541200166033e-09, + 2.329255233135541e-09 + ], + "bp_grad_F": [ + 0.07335253059864044, + 0.0002778704511001706, + 2.1924184068211616e-07, + 1.5885484572208952e-07, + 9.551467172741468e-08 + ], + "gamma_dfa": 0.001994484744500369, + "gamma_dfa_per_layer": [ + 0.0028600264340639114, + 0.0031631651800125837, + 0.0033731083385646343, + -0.0014183609746396542 + ], + "acc_eval": 0.2373046875, + "loss_eval": 2.0768301486968994, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 15.627301216125488, + 805321.625, + 1191654.25, + 2375967.75, + 5068243.5 + ], + "hidden_norms_avg": [ + 464.92144775390625, + 870169.75, + 1209570.75, + 2342305.5, + 4797491.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014358766202349216, + 6.655038742309216e-09, + 2.213497385383789e-09, + 1.8578552030135143e-09, + 1.8845198734851465e-09 + ], + "bp_grad_F": [ + 0.22341646254062653, + 0.0010545816039666533, + 3.022053363110899e-07, + 8.581165644727662e-08, + 7.942276880612553e-08 + ], + "gamma_dfa": 0.0012935771082993597, + "gamma_dfa_per_layer": [ + -0.00014482985716313124, + 0.0035164642613381147, + 0.002910400740802288, + -0.0011077267117798328 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.076242446899414, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 16.751590728759766, + 758638.375, + 1437438.0, + 2779040.25, + 5662257.0 + ], + "hidden_norms_avg": [ + 501.60235595703125, + 1119163.625, + 1513203.375, + 2677392.25, + 5339190.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020390149438753724, + 5.5311413227343564e-09, + 1.8890189412701375e-09, + 1.6241474831701908e-09, + 1.6578916017806478e-09 + ], + "bp_grad_F": [ + 1.734735369682312, + 0.000374374445527792, + 1.2862761877840967e-07, + 1.1062630989044919e-07, + 6.887377423936414e-08 + ], + "gamma_dfa": 0.0020944410644005984, + "gamma_dfa_per_layer": [ + 0.0036250988487154245, + 0.0027163547929376364, + 0.0028407545760273933, + -0.0008044439600780606 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.083003520965576, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 17.76032066345215, + 1093088.5, + 1739864.0, + 3080344.5, + 6632118.5 + ], + "hidden_norms_avg": [ + 539.1420288085938, + 1433551.75, + 1843404.125, + 3096921.75, + 6237853.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014031230239197612, + 4.252878937904825e-09, + 1.704668295410272e-09, + 1.518661418842271e-09, + 1.5263605934734414e-09 + ], + "bp_grad_F": [ + 0.05247655138373375, + 0.00048432740732096136, + 1.395327586806161e-07, + 8.375257465331742e-08, + 5.970760241780226e-08 + ], + "gamma_dfa": 0.0018704376125242561, + "gamma_dfa_per_layer": [ + 0.0021162822376936674, + 0.003257386852055788, + 0.002796958899125457, + -0.0006888775387778878 + ], + "acc_eval": 0.2177734375, + "loss_eval": 2.1021971702575684, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 18.760025024414062, + 2223954.75, + 2460609.0, + 3718541.25, + 7618764.0 + ], + "hidden_norms_avg": [ + 577.8324584960938, + 1908819.625, + 2348359.5, + 3542983.0, + 6779725.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010403544729342684, + 2.662567277766925e-09, + 1.6195218499603925e-09, + 1.422262307926303e-09, + 1.433551610752204e-09 + ], + "bp_grad_F": [ + 0.08673901855945587, + 0.0001567020226502791, + 8.41187173250546e-08, + 5.8843131256480774e-08, + 5.371895994699116e-08 + ], + "gamma_dfa": 0.003976444830186665, + "gamma_dfa_per_layer": [ + 0.010876781307160854, + 0.0029237696435302496, + 0.0026041539385914803, + -0.000498925568535924 + ], + "acc_eval": 0.2177734375, + "loss_eval": 2.138009548187256, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 19.738407135009766, + 2339586.0, + 2696652.5, + 4235438.5, + 7955372.0 + ], + "hidden_norms_avg": [ + 619.4888916015625, + 2243613.75, + 2801893.5, + 4018190.75, + 7143025.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014718857710249722, + 2.6654392026870255e-09, + 1.4668186665289795e-09, + 1.3113429231381701e-09, + 1.3212382299343517e-09 + ], + "bp_grad_F": [ + 0.1564428061246872, + 0.00024187436792999506, + 2.621962664761668e-07, + 5.580703898999673e-08, + 5.442945649747344e-08 + ], + "gamma_dfa": 0.0019682426573126577, + "gamma_dfa_per_layer": [ + 0.003052386222407222, + 0.0027148486115038395, + 0.0025699653197079897, + -0.00046422952436842024 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.145447254180908, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 20.727081298828125, + 2753822.5, + 3114285.75, + 4713040.0, + 8652256.0 + ], + "hidden_norms_avg": [ + 660.8045654296875, + 2684893.0, + 3331407.5, + 4614215.5, + 7864381.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013858993770554662, + 2.7730009399817845e-09, + 1.344458322449782e-09, + 1.2393497339502346e-09, + 1.2431760065823028e-09 + ], + "bp_grad_F": [ + 0.1324291080236435, + 0.00022225745487958193, + 9.285694346772289e-08, + 4.7669061586930184e-08, + 4.746264181676452e-08 + ], + "gamma_dfa": 0.001855946145951748, + "gamma_dfa_per_layer": [ + 0.004218719433993101, + 0.001718730665743351, + 0.0019668969325721264, + -0.0004805624485015869 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.101409673690796, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 21.603151321411133, + 3877476.75, + 4156743.75, + 5474745.5, + 10299149.0 + ], + "hidden_norms_avg": [ + 698.7645263671875, + 3523264.5, + 4085091.75, + 5354783.0, + 9094561.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000199332891497761, + 1.9098649328697093e-09, + 1.2144363292776461e-09, + 1.1166952917918138e-09, + 1.1315383074972374e-09 + ], + "bp_grad_F": [ + 0.15142236649990082, + 4.2183397454209626e-05, + 7.309424887580462e-08, + 5.2962114693855256e-08, + 4.2337880756804225e-08 + ], + "gamma_dfa": 0.0013709207050851546, + "gamma_dfa_per_layer": [ + 0.0023175266105681658, + 0.0016730788629502058, + 0.0018372924532741308, + -0.0003442151064518839 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.1280713081359863, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 22.48230743408203, + 3581296.5, + 4024996.25, + 6183271.0, + 11393130.0 + ], + "hidden_norms_avg": [ + 735.2485961914062, + 4017679.75, + 4751523.5, + 6215236.0, + 10366257.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018803548300638795, + 1.895784862426808e-09, + 1.1237420993737146e-09, + 1.0378963244406236e-09, + 1.0573794062551656e-09 + ], + "bp_grad_F": [ + 0.12878409028053284, + 4.194497887510806e-05, + 4.941083631138099e-08, + 3.9714532107382183e-08, + 3.994472663748638e-08 + ], + "gamma_dfa": 0.0012161588310846128, + "gamma_dfa_per_layer": [ + 0.0021385664585977793, + 0.0015012789517641068, + 0.0016565187834203243, + -0.0004317288694437593 + ], + "acc_eval": 0.2158203125, + "loss_eval": 2.1137895584106445, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 23.29258155822754, + 4616424.5, + 5061994.0, + 6831782.5, + 12437102.0 + ], + "hidden_norms_avg": [ + 768.5599975585938, + 4586839.5, + 5567332.5, + 6953557.0, + 11342041.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021542877948377281, + 1.9688994878919175e-09, + 1.0831572305747272e-09, + 9.59386015075836e-10, + 9.76972058808201e-10 + ], + "bp_grad_F": [ + 0.09346769750118256, + 4.979455843567848e-05, + 4.6927411290198506e-08, + 3.8312244043936516e-08, + 3.882623289541698e-08 + ], + "gamma_dfa": 0.0011904535058420151, + "gamma_dfa_per_layer": [ + 0.0024171490222215652, + 0.0012326111318543553, + 0.0015420420095324516, + -0.0004299881402403116 + ], + "acc_eval": 0.2333984375, + "loss_eval": 2.0970499515533447, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 24.054462432861328, + 5806660.5, + 6270370.0, + 7861086.0, + 14600824.0 + ], + "hidden_norms_avg": [ + 801.1851806640625, + 5855518.5, + 6747570.0, + 8137969.0, + 13373154.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012799039541278034, + 1.5442244150065676e-09, + 9.774002718287989e-10, + 8.729071909741037e-10, + 8.921305361120346e-10 + ], + "bp_grad_F": [ + 0.9552626609802246, + 1.163827892014524e-05, + 2.461903250150499e-07, + 3.4675800009154045e-08, + 3.4831803219503854e-08 + ], + "gamma_dfa": 0.0018355100764892995, + "gamma_dfa_per_layer": [ + 0.004604285582900047, + 0.00167210737708956, + 0.001404301729053259, + -0.0003386543830856681 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.11769700050354, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 24.826902389526367, + 6414338.0, + 6989573.0, + 8609765.0, + 15368301.0 + ], + "hidden_norms_avg": [ + 830.1490478515625, + 6946265.5, + 7916239.0, + 9224772.0, + 14431417.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015248128329403698, + 1.4729809594271615e-09, + 9.462167716023373e-10, + 8.629364445233989e-10, + 8.805687845558907e-10 + ], + "bp_grad_F": [ + 0.1705506592988968, + 0.00016797611897345632, + 4.810285503253908e-08, + 3.399246040203252e-08, + 3.436711182303043e-08 + ], + "gamma_dfa": 0.0015317398574552499, + "gamma_dfa_per_layer": [ + 0.004021936096251011, + 0.0012830595951527357, + 0.0012305387062951922, + -0.00040857496787793934 + ], + "acc_eval": 0.2236328125, + "loss_eval": 2.102954864501953, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 25.52900505065918, + 8152435.5, + 8736555.0, + 9881049.0, + 16997340.0 + ], + "hidden_norms_avg": [ + 858.3137817382812, + 7544203.0, + 8860779.0, + 10224814.0, + 15607154.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001363755582133308, + 1.2969386675720784e-09, + 9.174655479782245e-10, + 8.421383035361885e-10, + 8.538599827190296e-10 + ], + "bp_grad_F": [ + 0.07549053430557251, + 2.9420058126561344e-05, + 5.8904493727141016e-08, + 3.187446395713778e-08, + 3.1860317051268794e-08 + ], + "gamma_dfa": 0.0023631651129107922, + "gamma_dfa_per_layer": [ + 0.007739294320344925, + 0.0009300304809585214, + 0.001171439653262496, + -0.00038810400292277336 + ], + "acc_eval": 0.2080078125, + "loss_eval": 2.1162400245666504, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 26.122589111328125, + 9255466.0, + 9964734.0, + 11054792.0, + 18565818.0 + ], + "hidden_norms_avg": [ + 884.7098388671875, + 8814330.0, + 10177720.0, + 11552646.0, + 17489728.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014142012514639646, + 1.3653665975610352e-09, + 8.580440802319345e-10, + 7.922714151398225e-10, + 8.032630116616701e-10 + ], + "bp_grad_F": [ + 0.11926258355379105, + 1.2633940968953539e-05, + 3.893048727832138e-08, + 3.075604126934195e-08, + 3.043995278062539e-08 + ], + "gamma_dfa": 0.0013515961618395522, + "gamma_dfa_per_layer": [ + 0.0038036422338336706, + 0.0009011125075630844, + 0.0010650388430804014, + -0.0003634089371189475 + ], + "acc_eval": 0.201171875, + "loss_eval": 2.134256362915039, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 26.71797752380371, + 8691604.0, + 9652268.0, + 11413482.0, + 19342164.0 + ], + "hidden_norms_avg": [ + 908.3400268554688, + 9418884.0, + 11132975.0, + 12548590.0, + 18516546.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016020517796278, + 1.5232745065318909e-09, + 8.103306359252826e-10, + 7.392123024807518e-10, + 7.529800671868259e-10 + ], + "bp_grad_F": [ + 0.08055854588747025, + 1.5452902516699396e-05, + 3.9288735820264264e-08, + 3.091117406484045e-08, + 2.9865013573271426e-08 + ], + "gamma_dfa": 0.0012649961790884845, + "gamma_dfa_per_layer": [ + 0.0036856848746538162, + 0.0008738536853343248, + 0.0009324033162556589, + -0.00043195715988986194 + ], + "acc_eval": 0.216796875, + "loss_eval": 2.1074087619781494, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 27.27407455444336, + 9931691.0, + 10836582.0, + 12350148.0, + 20677670.0 + ], + "hidden_norms_avg": [ + 931.8362426757812, + 10575293.0, + 12476721.0, + 13979366.0, + 20145220.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002644142950884998, + 1.4137412351900025e-09, + 7.711813965194381e-10, + 7.245293809354791e-10, + 7.329452600401964e-10 + ], + "bp_grad_F": [ + 0.08752908557653427, + 3.3139032893814147e-05, + 4.584432744536571e-08, + 2.996421955003825e-08, + 2.8689356668110122e-08 + ], + "gamma_dfa": 0.0013240749976830557, + "gamma_dfa_per_layer": [ + 0.003940493334084749, + 0.0008323215297423303, + 0.0009093738626688719, + -0.0003858887357637286 + ], + "acc_eval": 0.2080078125, + "loss_eval": 2.1011557579040527, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 27.817367553710938, + 12253263.0, + 13105294.0, + 14345712.0, + 22455440.0 + ], + "hidden_norms_avg": [ + 953.0517578125, + 12373978.0, + 14141729.0, + 15597335.0, + 22309104.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014759604528080672, + 1.123480086739903e-09, + 7.102037291595309e-10, + 6.690955567378865e-10, + 6.791667228611686e-10 + ], + "bp_grad_F": [ + 0.05615593492984772, + 0.00010146480053663254, + 3.714368190799178e-08, + 2.748037175592799e-08, + 2.6385574614096186e-08 + ], + "gamma_dfa": 0.0012311612081248313, + "gamma_dfa_per_layer": [ + 0.003369898535311222, + 0.0009893677197396755, + 0.0009041082230396569, + -0.0003387296455912292 + ], + "acc_eval": 0.234375, + "loss_eval": 2.105236291885376, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 28.32236099243164, + 13643201.0, + 14611628.0, + 15764247.0, + 24160378.0 + ], + "hidden_norms_avg": [ + 973.9281616210938, + 13221320.0, + 15394035.0, + 16890642.0, + 23678466.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016657183005008847, + 9.720990679085162e-10, + 6.881580305595492e-10, + 6.496979620962406e-10, + 6.5528305004392e-10 + ], + "bp_grad_F": [ + 0.21266740560531616, + 1.0097430276800878e-05, + 5.8009760550703504e-08, + 2.5056060337647068e-08, + 2.5318335872270836e-08 + ], + "gamma_dfa": 0.0010233484499622136, + "gamma_dfa_per_layer": [ + 0.0030805980786681175, + 0.0005203179316595197, + 0.000822446309030056, + -0.00032996851950883865 + ], + "acc_eval": 0.212890625, + "loss_eval": 2.137085437774658, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 28.79292106628418, + 13177481.0, + 14299000.0, + 15555998.0, + 23304192.0 + ], + "hidden_norms_avg": [ + 992.415771484375, + 14624837.0, + 16826644.0, + 18325902.0, + 25292966.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020211696391925216, + 1.1425522750130312e-09, + 6.55300591567709e-10, + 6.094423854463571e-10, + 6.189129764244683e-10 + ], + "bp_grad_F": [ + 0.17359277606010437, + 1.2817296010325663e-05, + 7.396955936656013e-08, + 2.5667416636565576e-08, + 2.485118777428852e-08 + ], + "gamma_dfa": 0.0013693289074581116, + "gamma_dfa_per_layer": [ + 0.004313473589718342, + 0.0007373306434601545, + 0.000740988994948566, + -0.00031447759829461575 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.095831871032715, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 29.206546783447266, + 13026473.0, + 14086985.0, + 16207103.0, + 25752542.0 + ], + "hidden_norms_avg": [ + 1012.0676879882812, + 14977745.0, + 17788350.0, + 19459138.0, + 26297900.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002467916056048125, + 1.5415436704913077e-09, + 6.588643519656046e-10, + 6.053296752739357e-10, + 6.112412798131572e-10 + ], + "bp_grad_F": [ + 0.042935822159051895, + 9.192503966914956e-06, + 3.478140442325639e-08, + 2.366191687031005e-08, + 2.384759412166204e-08 + ], + "gamma_dfa": 0.0008732089045224711, + "gamma_dfa_per_layer": [ + 0.002771018771454692, + 0.00032788922544568777, + 0.0007068651611916721, + -0.0003129375400021672 + ], + "acc_eval": 0.2294921875, + "loss_eval": 2.0877132415771484, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 29.655010223388672, + 18104814.0, + 18959442.0, + 20352136.0, + 30115644.0 + ], + "hidden_norms_avg": [ + 1030.1336669921875, + 17704192.0, + 19945910.0, + 21540694.0, + 29199112.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00019920141494367272, + 8.472024748407136e-10, + 5.961620086480934e-10, + 5.578593698096768e-10, + 5.602495689593923e-10 + ], + "bp_grad_F": [ + 0.05658308416604996, + 2.5135868781944737e-05, + 4.3493169954444966e-08, + 2.1390142990185268e-08, + 2.1341643119399123e-08 + ], + "gamma_dfa": 0.0010463381186127663, + "gamma_dfa_per_layer": [ + 0.0027386434376239777, + 0.0009209397248923779, + 0.0007645037840120494, + -0.0002387344720773399 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.1298673152923584, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 30.063920974731445, + 20103628.0, + 20986630.0, + 22120356.0, + 31195618.0 + ], + "hidden_norms_avg": [ + 1046.1927490234375, + 18906620.0, + 21404482.0, + 23038508.0, + 30526688.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002040969266090542, + 9.528980937645315e-10, + 5.700001026731627e-10, + 5.158900528989818e-10, + 5.214851328538828e-10 + ], + "bp_grad_F": [ + 0.0816737711429596, + 5.908617822569795e-05, + 3.4592272157851767e-08, + 2.022995992945198e-08, + 2.0381063947638722e-08 + ], + "gamma_dfa": 0.001085347576008644, + "gamma_dfa_per_layer": [ + 0.0035934830084443092, + 0.0002959886915050447, + 0.0007062341319397092, + -0.0002543155278544873 + ], + "acc_eval": 0.2041015625, + "loss_eval": 2.116055965423584, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 30.392677307128906, + 21290946.0, + 22100456.0, + 23440498.0, + 32839040.0 + ], + "hidden_norms_avg": [ + 1062.797119140625, + 20072588.0, + 22866046.0, + 24608556.0, + 32259930.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00022883246128913015, + 1.3679187782500435e-09, + 5.444520945196984e-10, + 5.043216955158414e-10, + 5.114720313947885e-10 + ], + "bp_grad_F": [ + 0.2192479968070984, + 0.0001256070681847632, + 1.2757884348957305e-07, + 2.0006645229386777e-08, + 1.9971306386423748e-08 + ], + "gamma_dfa": 0.0019978012933279388, + "gamma_dfa_per_layer": [ + 0.0072806887328624725, + 0.0002412673202343285, + 0.000707695260643959, + -0.00023844614042900503 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.1034791469573975, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 30.711090087890625, + 22272344.0, + 23036462.0, + 24462584.0, + 35130192.0 + ], + "hidden_norms_avg": [ + 1082.3468017578125, + 20945452.0, + 23993758.0, + 25838460.0, + 33448582.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005148049676790833, + 2.304462176638822e-09, + 5.340937136999457e-10, + 4.950916898671665e-10, + 5.010572512453848e-10 + ], + "bp_grad_F": [ + 0.15110087394714355, + 3.209088754374534e-05, + 1.0334197497741116e-07, + 2.0131187383753968e-08, + 1.9814510920923567e-08 + ], + "gamma_dfa": 0.003046433750569122, + "gamma_dfa_per_layer": [ + 0.011593285948038101, + 0.00019314857490826398, + 0.0006439671851694584, + -0.0002446667058393359 + ], + "acc_eval": 0.208984375, + "loss_eval": 2.112250328063965, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 31.0146427154541, + 29106790.0, + 29617952.0, + 31075512.0, + 42307980.0 + ], + "hidden_norms_avg": [ + 1102.4920654296875, + 22080922.0, + 25255976.0, + 27220448.0, + 35072796.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003266549902036786, + 3.0358568992028268e-09, + 4.893331295718895e-10, + 4.395950825575312e-10, + 4.4405815136094873e-10 + ], + "bp_grad_F": [ + 1.0139163732528687, + 1.6822159523144364e-05, + 1.2544650473955699e-07, + 1.6449900996917677e-08, + 1.5756539184508256e-08 + ], + "gamma_dfa": 0.004347974703705404, + "gamma_dfa_per_layer": [ + 0.016904333606362343, + -2.5271147023886442e-05, + 0.0006614690646529198, + -0.00014863270916976035 + ], + "acc_eval": 0.1806640625, + "loss_eval": 2.1869568824768066, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 31.282560348510742, + 30793450.0, + 31273076.0, + 33029836.0, + 44659544.0 + ], + "hidden_norms_avg": [ + 1120.8310546875, + 23223250.0, + 26597348.0, + 28740710.0, + 37219140.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004533866886049509, + 8.621259817154225e-10, + 4.717314872060285e-10, + 4.43607900413312e-10, + 4.492739236194865e-10 + ], + "bp_grad_F": [ + 0.8242164254188538, + 9.425415555597283e-06, + 6.696246401816097e-08, + 1.4385987512355314e-08, + 1.456661191667763e-08 + ], + "gamma_dfa": 0.004019053936644923, + "gamma_dfa_per_layer": [ + 0.015497363172471523, + 0.0001274545502383262, + 0.0006036070408299565, + -0.00015220901696011424 + ], + "acc_eval": 0.1396484375, + "loss_eval": 2.199540615081787, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 31.512802124023438, + 21969868.0, + 22884238.0, + 24682478.0, + 38405980.0 + ], + "hidden_norms_avg": [ + 1138.61962890625, + 23861642.0, + 27547416.0, + 29877192.0, + 38524416.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00065120670478791, + 1.8789774181016128e-09, + 5.075246334307337e-10, + 4.637440431665141e-10, + 4.687980004192127e-10 + ], + "bp_grad_F": [ + 0.22404567897319794, + 6.978048531891545e-06, + 5.974419536869391e-08, + 1.854446907145757e-08, + 1.8726453276940447e-08 + ], + "gamma_dfa": 0.0030916051182430238, + "gamma_dfa_per_layer": [ + 0.011011095717549324, + 0.0010498585179448128, + 0.0005736061139032245, + -0.00026813987642526627 + ], + "acc_eval": 0.20703125, + "loss_eval": 2.1297407150268555, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 31.728811264038086, + 29299954.0, + 29843046.0, + 31522240.0, + 44597740.0 + ], + "hidden_norms_avg": [ + 1154.2742919921875, + 26176784.0, + 29361794.0, + 31622036.0, + 40631524.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00057179294526577, + 8.620974489836897e-10, + 4.3859474385676833e-10, + 4.131678610352907e-10, + 4.158901834028228e-10 + ], + "bp_grad_F": [ + 0.1988120824098587, + 6.200312782311812e-06, + 7.633398269035752e-08, + 1.800971105581084e-08, + 1.6420651505200112e-08 + ], + "gamma_dfa": 0.0036353242212499026, + "gamma_dfa_per_layer": [ + 0.013258620165288448, + 0.0009053392568603158, + 0.0005595044931396842, + -0.00018216703028883785 + ], + "acc_eval": 0.193359375, + "loss_eval": 2.162503719329834, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 31.93093490600586, + 24153264.0, + 24958016.0, + 27164164.0, + 41821856.0 + ], + "hidden_norms_avg": [ + 1168.3504638671875, + 25251302.0, + 29331440.0, + 31888322.0, + 40732864.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007007869426161051, + 3.803806603031035e-09, + 4.6435830181046356e-10, + 4.2823591894780577e-10, + 4.335505288111108e-10 + ], + "bp_grad_F": [ + 0.23370306193828583, + 5.834654530190164e-06, + 4.249230300956697e-08, + 1.778762737103534e-08, + 1.7575523258983594e-08 + ], + "gamma_dfa": 0.003036663241800852, + "gamma_dfa_per_layer": [ + 0.010693107731640339, + 0.001166085829026997, + 0.0005278221797198057, + -0.00024036277318373322 + ], + "acc_eval": 0.2060546875, + "loss_eval": 2.145090103149414, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 32.11568069458008, + 30941254.0, + 31479742.0, + 33270594.0, + 46886708.0 + ], + "hidden_norms_avg": [ + 1180.89794921875, + 26732550.0, + 30676362.0, + 33269292.0, + 42382468.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006622264045290649, + 1.5328843749884413e-09, + 4.1302217201888425e-10, + 3.8878930630481534e-10, + 3.9369618676232676e-10 + ], + "bp_grad_F": [ + 0.7251601815223694, + 2.9320523026399314e-05, + 1.0578004605577007e-07, + 1.5190060764780355e-08, + 1.538120386612718e-08 + ], + "gamma_dfa": 0.0034242832334712148, + "gamma_dfa_per_layer": [ + 0.012806901708245277, + 0.0005313451401889324, + 0.0005365218385122716, + -0.00017763575306162238 + ], + "acc_eval": 0.1904296875, + "loss_eval": 2.1417269706726074, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 32.295955657958984, + 33935232.0, + 34368956.0, + 35934572.0, + 47697056.0 + ], + "hidden_norms_avg": [ + 1192.405517578125, + 27784236.0, + 31654758.0, + 34253712.0, + 43239588.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000609845039434731, + 1.1788049425476288e-09, + 4.4074988103659507e-10, + 3.883143528948807e-10, + 3.8990835560248627e-10 + ], + "bp_grad_F": [ + 0.3570167124271393, + 5.2556606533471495e-06, + 6.658066098452764e-08, + 1.6441132899558397e-08, + 1.5662063646004754e-08 + ], + "gamma_dfa": 0.0031971330136002507, + "gamma_dfa_per_layer": [ + 0.011760826222598553, + 0.000679977354593575, + 0.0005443703266791999, + -0.00019664184947032481 + ], + "acc_eval": 0.1962890625, + "loss_eval": 2.159468173980713, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 32.446258544921875, + 19652562.0, + 21036314.0, + 25921266.0, + 40927384.0 + ], + "hidden_norms_avg": [ + 1203.144287109375, + 31749304.0, + 34556376.0, + 36976868.0, + 47059032.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006137214368209243, + 8.001962981118993e-10, + 4.3686718131930036e-10, + 4.163595301864831e-10, + 4.1693556940280985e-10 + ], + "bp_grad_F": [ + 0.12317141890525818, + 1.0874373401748016e-05, + 3.419825134187704e-08, + 1.7081790204542813e-08, + 1.7078438219186864e-08 + ], + "gamma_dfa": 0.002385696723649744, + "gamma_dfa_per_layer": [ + 0.008561503142118454, + 0.000761325703933835, + 0.00044924806570634246, + -0.0002292900171596557 + ], + "acc_eval": 0.1943359375, + "loss_eval": 2.1486196517944336, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 32.65601348876953, + 18852588.0, + 20806824.0, + 26129350.0, + 41854136.0 + ], + "hidden_norms_avg": [ + 1211.216064453125, + 33512262.0, + 36150576.0, + 38488828.0, + 48876332.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041886867256835103, + 6.960994003435417e-10, + 3.895795075425923e-10, + 3.7316269518861134e-10, + 3.8092326515304364e-10 + ], + "bp_grad_F": [ + 0.14164908230304718, + 1.2379082363622729e-06, + 2.6289937338219715e-08, + 1.6158612226035984e-08, + 1.6345055087185756e-08 + ], + "gamma_dfa": 0.0026270662965544034, + "gamma_dfa_per_layer": [ + 0.009110232815146446, + 0.0011993220541626215, + 0.00041866287938319147, + -0.00021995256247464567 + ], + "acc_eval": 0.19140625, + "loss_eval": 2.1592655181884766, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 32.8077507019043, + 13604255.0, + 20737208.0, + 26201736.0, + 38498212.0 + ], + "hidden_norms_avg": [ + 1218.5357666015625, + 34337856.0, + 37186496.0, + 39492900.0, + 49837356.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00024631666019558907, + 7.821958081244418e-10, + 3.8121927836698433e-10, + 3.6691791271969976e-10, + 3.7013728193535655e-10 + ], + "bp_grad_F": [ + 0.16077305376529694, + 4.323472239775583e-06, + 3.772007772795405e-08, + 1.5986831414238623e-08, + 1.5948634413121e-08 + ], + "gamma_dfa": 0.002168099657865241, + "gamma_dfa_per_layer": [ + 0.007105600088834763, + 0.0013786349445581436, + 0.00041434637387283146, + -0.00022618277580477297 + ], + "acc_eval": 0.193359375, + "loss_eval": 2.1537227630615234, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 32.95870590209961, + 17278438.0, + 21010234.0, + 26451948.0, + 41976576.0 + ], + "hidden_norms_avg": [ + 1225.39501953125, + 36196112.0, + 38833272.0, + 41042520.0, + 51415488.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00017274360288865864, + 7.227461407133262e-10, + 3.619011756939017e-10, + 3.5793992769761473e-10, + 3.6092046018509905e-10 + ], + "bp_grad_F": [ + 0.9672663807868958, + 3.41643476531317e-06, + 5.25712664511957e-08, + 1.5481989024124232e-08, + 1.548605688128646e-08 + ], + "gamma_dfa": 0.001979457345441915, + "gamma_dfa_per_layer": [ + 0.006772718392312527, + 0.0009743775590322912, + 0.00037397228879854083, + -0.00020323885837569833 + ], + "acc_eval": 0.208984375, + "loss_eval": 2.1646997928619385, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 33.06986999511719, + 23368844.0, + 24521804.0, + 27230594.0, + 45358652.0 + ], + "hidden_norms_avg": [ + 1231.394287109375, + 38020996.0, + 40414464.0, + 42538228.0, + 53283596.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015840897685848176, + 6.067092384043349e-10, + 3.4933173020945674e-10, + 3.3962907486362326e-10, + 3.42745692938351e-10 + ], + "bp_grad_F": [ + 0.3695656955242157, + 2.3579739263368538e-06, + 5.5092176154403205e-08, + 1.777137192959799e-08, + 1.4559810246339566e-08 + ], + "gamma_dfa": 0.0020704490307252854, + "gamma_dfa_per_layer": [ + 0.007164421491324902, + 0.0009055124246515334, + 0.0003939281450584531, + -0.00018206593813374639 + ], + "acc_eval": 0.203125, + "loss_eval": 2.1666717529296875, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 33.164432525634766, + 29174184.0, + 30089798.0, + 32367896.0, + 48892740.0 + ], + "hidden_norms_avg": [ + 1237.1142578125, + 37470168.0, + 40219512.0, + 42356984.0, + 52772660.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00024464691523462534, + 5.441591066634999e-10, + 3.6414088411262924e-10, + 3.320065611323031e-10, + 3.387692348866267e-10 + ], + "bp_grad_F": [ + 0.20688536763191223, + 4.435638402355835e-06, + 8.288016317692382e-08, + 1.4215274291018432e-08, + 1.4331217101926086e-08 + ], + "gamma_dfa": 0.0017712319058773573, + "gamma_dfa_per_layer": [ + 0.006079941056668758, + 0.0008057263912633061, + 0.00038248312193900347, + -0.0001832229463616386 + ], + "acc_eval": 0.1806640625, + "loss_eval": 2.173765182495117, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 33.24842071533203, + 33830332.0, + 34499304.0, + 36673048.0, + 51963528.0 + ], + "hidden_norms_avg": [ + 1242.226318359375, + 38073352.0, + 40806512.0, + 42901500.0, + 53437180.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002524294250179082, + 5.388652302151797e-10, + 3.6845529405304944e-10, + 3.3760005901939394e-10, + 3.4174474361492457e-10 + ], + "bp_grad_F": [ + 0.12659014761447906, + 2.532647158659529e-06, + 5.97612910269163e-08, + 1.3431267653629675e-08, + 1.3499856343912597e-08 + ], + "gamma_dfa": 0.0021579467684205156, + "gamma_dfa_per_layer": [ + 0.007928929291665554, + 0.00047530903248116374, + 0.00039780279621481895, + -0.0001702540466794744 + ], + "acc_eval": 0.2099609375, + "loss_eval": 2.161896228790283, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 33.338741302490234, + 19795148.0, + 21916948.0, + 27189936.0, + 43588712.0 + ], + "hidden_norms_avg": [ + 1246.7552490234375, + 38983196.0, + 41658504.0, + 43769460.0, + 54177164.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002599447325337678, + 6.2289540192495e-10, + 3.6807956682594067e-10, + 3.4037242468976103e-10, + 3.472495624379235e-10 + ], + "bp_grad_F": [ + 0.11130323261022568, + 6.972830760787474e-06, + 5.447330764241087e-08, + 1.4756569299834155e-08, + 1.4917180379825368e-08 + ], + "gamma_dfa": 0.0021847522366442718, + "gamma_dfa_per_layer": [ + 0.007594278547912836, + 0.0009666476398706436, + 0.0003712670295499265, + -0.00019318427075631917 + ], + "acc_eval": 0.1904296875, + "loss_eval": 2.1626296043395996, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 33.42045974731445, + 24898126.0, + 26009376.0, + 28516464.0, + 47394980.0 + ], + "hidden_norms_avg": [ + 1250.1884765625, + 39632580.0, + 42285708.0, + 44390100.0, + 55233620.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001829452667152509, + 5.726033536213038e-10, + 3.5659752928296484e-10, + 3.292066619309253e-10, + 3.31846911061362e-10 + ], + "bp_grad_F": [ + 0.23442988097667694, + 3.2595114589639707e-06, + 1.0605135969399271e-07, + 1.4677630666426467e-08, + 1.445219677265186e-08 + ], + "gamma_dfa": 0.0021932553718215786, + "gamma_dfa_per_layer": [ + 0.007973091676831245, + 0.0006458763382397592, + 0.00032728860969655216, + -0.00017323513748124242 + ], + "acc_eval": 0.1923828125, + "loss_eval": 2.175835609436035, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 33.47613525390625, + 25550002.0, + 26776384.0, + 28507352.0, + 47268464.0 + ], + "hidden_norms_avg": [ + 1253.279541015625, + 39494300.0, + 42348356.0, + 44479368.0, + 55121100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00012893354869447649, + 5.787402224122218e-10, + 3.341840137949248e-10, + 3.2919431069977634e-10, + 3.3201591476128556e-10 + ], + "bp_grad_F": [ + 0.10876749455928802, + 4.772132342623081e-06, + 7.90316647680811e-08, + 1.4042406348835357e-08, + 1.4153799909877307e-08 + ], + "gamma_dfa": 0.001727514507365413, + "gamma_dfa_per_layer": [ + 0.0062596434727311134, + 0.0004772312822751701, + 0.000357049866579473, + -0.0001838665921241045 + ], + "acc_eval": 0.1904296875, + "loss_eval": 2.164583444595337, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 33.52043914794922, + 28050636.0, + 29099278.0, + 31227182.0, + 49045872.0 + ], + "hidden_norms_avg": [ + 1255.7454833984375, + 40231008.0, + 42960368.0, + 45079784.0, + 55989944.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015386792074423283, + 5.41802436249128e-10, + 3.373940293815991e-10, + 3.3321326253776817e-10, + 3.361276257329848e-10 + ], + "bp_grad_F": [ + 0.2656819522380829, + 2.482481932020164e-06, + 8.287289432473699e-08, + 1.3792345932017724e-08, + 1.3917338392843703e-08 + ], + "gamma_dfa": 0.001938080065883696, + "gamma_dfa_per_layer": [ + 0.006978346034884453, + 0.0005946386372670531, + 0.00036033656215295196, + -0.00018100097076967359 + ], + "acc_eval": 0.1962890625, + "loss_eval": 2.176473379135132, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 33.55419921875, + 25508434.0, + 26505134.0, + 29051658.0, + 47339916.0 + ], + "hidden_norms_avg": [ + 1257.7822265625, + 40388772.0, + 43162480.0, + 45217960.0, + 55966100.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018102869216818362, + 5.443374639924059e-10, + 3.9548594954474936e-10, + 3.679410942591943e-10, + 3.717116892065775e-10 + ], + "bp_grad_F": [ + 0.28429684042930603, + 3.3983885714405915e-06, + 8.993236377818903e-08, + 1.4510244561449781e-08, + 1.4562592021150067e-08 + ], + "gamma_dfa": 0.001642326584260445, + "gamma_dfa_per_layer": [ + 0.006192460190504789, + 0.00019942648941650987, + 0.00037004181649535894, + -0.0001926221593748778 + ], + "acc_eval": 0.2001953125, + "loss_eval": 2.1743006706237793, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 33.58127212524414, + 28540952.0, + 29607362.0, + 31472670.0, + 49191068.0 + ], + "hidden_norms_avg": [ + 1259.4189453125, + 40550800.0, + 43364984.0, + 45506960.0, + 56297104.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018638238543644547, + 5.299162220140374e-10, + 3.2437005859087265e-10, + 3.1624741714253446e-10, + 3.1920088794379353e-10 + ], + "bp_grad_F": [ + 0.21056434512138367, + 3.217361381757655e-06, + 5.1724125427199397e-08, + 1.390105897058902e-08, + 1.3961146017038573e-08 + ], + "gamma_dfa": 0.0018532263711676933, + "gamma_dfa_per_layer": [ + 0.006584585644304752, + 0.0006806463352404535, + 0.00032758695306256413, + -0.00017991344793699682 + ], + "acc_eval": 0.19921875, + "loss_eval": 2.167957067489624, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 33.60611343383789, + 27949698.0, + 28918304.0, + 31366946.0, + 48876736.0 + ], + "hidden_norms_avg": [ + 1260.694091796875, + 41001392.0, + 43744060.0, + 45853688.0, + 56636716.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021861983987037092, + 5.396287861003657e-10, + 3.377726154329963e-10, + 3.201852394330018e-10, + 3.237338452866112e-10 + ], + "bp_grad_F": [ + 0.12415990233421326, + 1.6796100226201816e-06, + 6.823196940786147e-08, + 1.384469427989643e-08, + 1.3965705036866893e-08 + ], + "gamma_dfa": 0.0017868579998321366, + "gamma_dfa_per_layer": [ + 0.006317156832665205, + 0.0006519090966321528, + 0.0003622731601353735, + -0.00018390709010418504 + ], + "acc_eval": 0.1953125, + "loss_eval": 2.178144931793213, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 33.620914459228516, + 27607036.0, + 28622492.0, + 31370470.0, + 48645068.0 + ], + "hidden_norms_avg": [ + 1261.64208984375, + 40948476.0, + 43773536.0, + 45888992.0, + 56623536.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002112231741193682, + 5.336073249928575e-10, + 3.533912051878474e-10, + 3.186636232666018e-10, + 3.226934830458106e-10 + ], + "bp_grad_F": [ + 0.1486925333738327, + 3.3336793876515003e-06, + 9.466339889740993e-08, + 1.4568017014937595e-08, + 1.4240884915750485e-08 + ], + "gamma_dfa": 0.0018792969822243322, + "gamma_dfa_per_layer": [ + 0.006730419583618641, + 0.000605170032940805, + 0.0003661802038550377, + -0.00018458189151715487 + ], + "acc_eval": 0.1982421875, + "loss_eval": 2.172356367111206, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 33.63143539428711, + 28410040.0, + 29532286.0, + 31697578.0, + 48914624.0 + ], + "hidden_norms_avg": [ + 1262.2918701171875, + 40698620.0, + 43622904.0, + 45764712.0, + 56531748.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002270409750053659, + 5.479600106994553e-10, + 3.2429942065093087e-10, + 3.150284755282229e-10, + 3.179212726411862e-10 + ], + "bp_grad_F": [ + 0.10118122398853302, + 2.5195840862579644e-06, + 8.798109263352671e-08, + 1.3570585544186997e-08, + 1.3736383586149259e-08 + ], + "gamma_dfa": 0.0017859039653558284, + "gamma_dfa_per_layer": [ + 0.006382801569998264, + 0.0005453285994008183, + 0.00039217708399519324, + -0.00017669139197096229 + ], + "acc_eval": 0.1943359375, + "loss_eval": 2.1648902893066406, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 33.63875961303711, + 31114778.0, + 32184654.0, + 34278688.0, + 50894352.0 + ], + "hidden_norms_avg": [ + 1262.7132568359375, + 40792528.0, + 43713536.0, + 45850224.0, + 56615416.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00019923689251299948, + 5.368823718931992e-10, + 3.306654117185559e-10, + 3.113070912164062e-10, + 3.1328556415743947e-10 + ], + "bp_grad_F": [ + 0.3573400378227234, + 1.249598790309392e-05, + 1.6106491784739774e-07, + 3.301076745287901e-08, + 1.3328084413899433e-08 + ], + "gamma_dfa": 0.0016940671957854647, + "gamma_dfa_per_layer": [ + 0.006114102900028229, + 0.0004918627091683447, + 0.00032346430816687644, + -0.00015316113422159106 + ], + "acc_eval": 0.201171875, + "loss_eval": 2.1634349822998047, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 33.642520904541016, + 31868976.0, + 32779660.0, + 35005740.0, + 51305220.0 + ], + "hidden_norms_avg": [ + 1262.9461669921875, + 41087592.0, + 43928832.0, + 46043268.0, + 56839576.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002181618328904733, + 5.162476557352136e-10, + 3.3206276617292474e-10, + 3.1130611977125966e-10, + 3.1441516057384433e-10 + ], + "bp_grad_F": [ + 0.12289460748434067, + 1.5301338862627745e-05, + 8.779379356838035e-08, + 1.4331889452989799e-08, + 1.318165843144925e-08 + ], + "gamma_dfa": 0.001529279034002684, + "gamma_dfa_per_layer": [ + 0.00539398193359375, + 0.0005496743833646178, + 0.00034435215638950467, + -0.00017089233733713627 + ], + "acc_eval": 0.2021484375, + "loss_eval": 2.164745807647705, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 33.6442756652832, + 31315430.0, + 32160978.0, + 34340796.0, + 51077484.0 + ], + "hidden_norms_avg": [ + 1263.062744140625, + 41015680.0, + 43882708.0, + 46002096.0, + 56770896.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021884885791223496, + 5.177114292820306e-10, + 3.350683897007656e-10, + 3.101042200803761e-10, + 3.12167347527037e-10 + ], + "bp_grad_F": [ + 0.11127890646457672, + 1.1515544429130387e-05, + 8.542571805492116e-08, + 1.319963871537766e-08, + 1.3264477516372608e-08 + ], + "gamma_dfa": 0.0016308917693095282, + "gamma_dfa_per_layer": [ + 0.005676542408764362, + 0.0006629846757277846, + 0.0003523063496686518, + -0.0001682663569226861 + ], + "acc_eval": 0.19921875, + "loss_eval": 2.1635866165161133, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 33.643985748291016, + 31097308.0, + 32052318.0, + 34155804.0, + 50803736.0 + ], + "hidden_norms_avg": [ + 1263.064208984375, + 40997444.0, + 43870400.0, + 45990872.0, + 56755540.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021703331731259823, + 5.1921633659191e-10, + 3.35882821556055e-10, + 3.102589296588576e-10, + 3.1300673164480486e-10 + ], + "bp_grad_F": [ + 0.1889268010854721, + 1.0328590178687591e-05, + 1.1096560825762936e-07, + 1.3215729843807367e-08, + 1.3306935997547953e-08 + ], + "gamma_dfa": 0.0016646812255203258, + "gamma_dfa_per_layer": [ + 0.005869406741112471, + 0.0006016636616550386, + 0.0003579354961402714, + -0.00017028099682647735 + ], + "acc_eval": 0.2021484375, + "loss_eval": 2.163691520690918, + "epoch": 60 + } + ] +}
\ No newline at end of file |
