{ "config": { "output_dir": "results/snapshot_vit_v1", "epochs": 60, "lr": 0.001, "wd": 0.05, "seed": 123, "depth": 4, "d_model": 128, "n_heads": 4 }, "depth": 4, "d_model": 128, "architecture": "ViTMini", "bp_log": [ { "hidden_norms_cls": [ 0.3210873007774353, 3.3568029403686523, 4.891699314117432, 6.200707912445068, 7.5911865234375 ], "hidden_norms_avg": [ 5.7549052238464355, 6.750590801239014, 7.9020819664001465, 8.925304412841797, 10.076716423034668 ], "bp_grad_per_sample_l2_med": [ 0.004074312746524811, 0.0011155740357935429, 0.0009667170234024525, 0.0008621186716482043, 0.0008127145702019334 ], "bp_grad_F": [ 0.20160320401191711, 0.039521340280771255, 0.033098917454481125, 0.029271923005580902, 0.027136052027344704 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.125, "loss_eval": 2.422111988067627, "epoch": 0 }, { "hidden_norms_cls": [ 0.4782717227935791, 11.874238014221191, 20.313709259033203, 26.86528778076172, 32.42327880859375 ], "hidden_norms_avg": [ 3.8830745220184326, 11.266603469848633, 17.881502151489258, 23.234352111816406, 28.51181411743164 ], "bp_grad_per_sample_l2_med": [ 0.002827065996825695, 0.00024586476502008736, 0.00014567613834515214, 0.00013882767234463245, 0.0001400413311785087 ], "bp_grad_F": [ 0.12621107697486877, 0.009982436895370483, 0.00507162231951952, 0.004677945747971535, 0.004658848978579044 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4697265625, "loss_eval": 1.4472862482070923, "epoch": 1 }, { "hidden_norms_cls": [ 0.6104467511177063, 13.787332534790039, 22.073436737060547, 28.480369567871094, 33.141117095947266 ], "hidden_norms_avg": [ 3.951775074005127, 12.005932807922363, 18.336896896362305, 23.67597198486328, 27.899608612060547 ], "bp_grad_per_sample_l2_med": [ 0.002604336943477392, 0.00026667251950129867, 0.00014805165119469166, 0.00013079405471216887, 0.00012911780504509807 ], "bp_grad_F": [ 0.12487494200468063, 0.010650832206010818, 0.005604646634310484, 0.004644650500267744, 0.00448915408924222 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5146484375, "loss_eval": 1.291869878768921, "epoch": 2 }, { "hidden_norms_cls": [ 0.7104504108428955, 13.74225902557373, 21.90972328186035, 28.958967208862305, 33.262393951416016 ], "hidden_norms_avg": [ 3.9180142879486084, 13.097892761230469, 19.570770263671875, 24.899248123168945, 28.65104866027832 ], "bp_grad_per_sample_l2_med": [ 0.0020766372326761484, 0.00025831969105638564, 0.00014769421250093728, 0.00012920337030664086, 0.00012324318231549114 ], "bp_grad_F": [ 0.09676238149404526, 0.010603155009448528, 0.005832126829773188, 0.00465927692130208, 0.004435759503394365 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.529296875, "loss_eval": 1.2694497108459473, "epoch": 3 }, { "hidden_norms_cls": [ 0.801612377166748, 12.882991790771484, 20.474157333374023, 27.37413215637207, 32.06389617919922 ], "hidden_norms_avg": [ 3.8871910572052, 13.333250999450684, 19.042104721069336, 24.029348373413086, 27.96086311340332 ], "bp_grad_per_sample_l2_med": [ 0.0020045258570462465, 0.000285606540273875, 0.00016217664233408868, 0.00013080642384011298, 0.00011968115722993389 ], "bp_grad_F": [ 0.09496191889047623, 0.011928788386285305, 0.006509022321552038, 0.005044482182711363, 0.004537967965006828 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.58203125, "loss_eval": 1.119094967842102, "epoch": 4 }, { "hidden_norms_cls": [ 0.8653663396835327, 12.994612693786621, 20.49618148803711, 26.709278106689453, 30.303852081298828 ], "hidden_norms_avg": [ 4.018242835998535, 13.520885467529297, 19.090721130371094, 23.6751651763916, 26.93212890625 ], "bp_grad_per_sample_l2_med": [ 0.0018953323597088456, 0.000296358106425032, 0.00017310198745690286, 0.0001364975469186902, 0.00012098452862119302 ], "bp_grad_F": [ 0.09499228745698929, 0.012825642712414265, 0.007407570723444223, 0.005570532754063606, 0.004951393231749535 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.595703125, "loss_eval": 1.0847156047821045, "epoch": 5 }, { "hidden_norms_cls": [ 0.9313029646873474, 13.966381072998047, 21.648372650146484, 28.33364486694336, 32.91484069824219 ], "hidden_norms_avg": [ 4.053382396697998, 15.042261123657227, 20.74883270263672, 25.032489776611328, 28.55679702758789 ], "bp_grad_per_sample_l2_med": [ 0.001841629622504115, 0.0002753600711002946, 0.0001624371943762526, 0.0001305017649428919, 0.00011278261081315577 ], "bp_grad_F": [ 0.09068351984024048, 0.0128449946641922, 0.007257991470396519, 0.005361978895962238, 0.004660472739487886 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6103515625, "loss_eval": 1.095273494720459, "epoch": 6 }, { "hidden_norms_cls": [ 0.9818395972251892, 13.022477149963379, 20.385391235351562, 27.03214454650879, 31.324769973754883 ], "hidden_norms_avg": [ 4.1024041175842285, 14.697205543518066, 19.634239196777344, 23.90021324157715, 27.306678771972656 ], "bp_grad_per_sample_l2_med": [ 0.0015902157174423337, 0.00027956697158515453, 0.0001692597143119201, 0.0001353132538497448, 0.00011523282591952011 ], "bp_grad_F": [ 0.07967441529035568, 0.012528380379080772, 0.007520876359194517, 0.00570708978921175, 0.004875381011515856 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.62890625, "loss_eval": 1.0069011449813843, "epoch": 7 }, { "hidden_norms_cls": [ 1.0194361209869385, 13.912450790405273, 20.85824203491211, 27.968477249145508, 32.243431091308594 ], "hidden_norms_avg": [ 4.178755283355713, 14.875143051147461, 20.261545181274414, 24.636741638183594, 27.893512725830078 ], "bp_grad_per_sample_l2_med": [ 0.001506888889707625, 0.00028421770548447967, 0.0001727779454085976, 0.00013076694449409842, 0.00010860477777896449 ], "bp_grad_F": [ 0.07398127764463425, 0.013124965131282806, 0.007798053789883852, 0.005717460531741381, 0.004830002784729004 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.638671875, "loss_eval": 0.9834396839141846, "epoch": 8 }, { "hidden_norms_cls": [ 1.077261209487915, 12.524529457092285, 19.766538619995117, 25.7626895904541, 30.03727149963379 ], "hidden_norms_avg": [ 4.1816864013671875, 14.304539680480957, 19.208524703979492, 23.25862693786621, 26.313356399536133 ], "bp_grad_per_sample_l2_med": [ 0.0014360174536705017, 0.0003003668098244816, 0.0001815372525015846, 0.0001390709658153355, 0.00011320491466904059 ], "bp_grad_F": [ 0.0756259635090828, 0.014865156263113022, 0.008982912637293339, 0.006551471073180437, 0.005398898851126432 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6494140625, "loss_eval": 0.971701979637146, "epoch": 9 }, { "hidden_norms_cls": [ 1.1200045347213745, 12.160452842712402, 19.172168731689453, 25.067665100097656, 28.764787673950195 ], "hidden_norms_avg": [ 4.289422035217285, 15.51036262512207, 20.407268524169922, 24.061931610107422, 26.493688583374023 ], "bp_grad_per_sample_l2_med": [ 0.0012870824430137873, 0.00027074789977632463, 0.0001742457679938525, 0.0001348328951280564, 0.000104573555290699 ], "bp_grad_F": [ 0.07437644153833389, 0.015084434300661087, 0.009522279724478722, 0.0069595095701515675, 0.0055610560812056065 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6767578125, "loss_eval": 0.8734689354896545, "epoch": 10 }, { "hidden_norms_cls": [ 1.1509246826171875, 12.219743728637695, 19.352998733520508, 25.70184326171875, 29.580278396606445 ], "hidden_norms_avg": [ 4.315939426422119, 15.6610689163208, 20.42215347290039, 24.016841888427734, 26.62118911743164 ], "bp_grad_per_sample_l2_med": [ 0.0013146374840289354, 0.0002733681467361748, 0.0001865291123976931, 0.00013389455853030086, 0.00010298956476617604 ], "bp_grad_F": [ 0.07836466282606125, 0.015104672871530056, 0.009902945719659328, 0.0069915857166051865, 0.005596037954092026 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6767578125, "loss_eval": 0.917751669883728, "epoch": 11 }, { "hidden_norms_cls": [ 1.2017452716827393, 12.72107219696045, 18.952699661254883, 25.067615509033203, 29.466550827026367 ], "hidden_norms_avg": [ 4.358119487762451, 15.672205924987793, 20.140914916992188, 24.013885498046875, 26.668514251708984 ], "bp_grad_per_sample_l2_med": [ 0.0011630960507318377, 0.00025659528910182416, 0.0001693729282123968, 0.0001237613905686885, 9.384296572534367e-05 ], "bp_grad_F": [ 0.07334695011377335, 0.015075902454555035, 0.009827414527535439, 0.007068648934364319, 0.005549146793782711 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6982421875, "loss_eval": 0.8279671669006348, "epoch": 12 }, { "hidden_norms_cls": [ 1.234994649887085, 12.283885955810547, 18.62163543701172, 24.3900203704834, 28.36040496826172 ], "hidden_norms_avg": [ 4.369320869445801, 15.747625350952148, 19.76953887939453, 23.351999282836914, 25.69841194152832 ], "bp_grad_per_sample_l2_med": [ 0.0011812442680820823, 0.0002851892786566168, 0.0001940266229212284, 0.00013827465591020882, 0.00010182376718148589 ], "bp_grad_F": [ 0.07158326357603073, 0.01604902744293213, 0.010893523693084717, 0.007844515144824982, 0.005985426716506481 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.689453125, "loss_eval": 0.8679210543632507, "epoch": 13 }, { "hidden_norms_cls": [ 1.2675292491912842, 11.706314086914062, 18.347841262817383, 24.01951789855957, 28.1114501953125 ], "hidden_norms_avg": [ 4.390969753265381, 15.140497207641602, 19.62596893310547, 23.22857666015625, 25.681791305541992 ], "bp_grad_per_sample_l2_med": [ 0.0010449079563841224, 0.0002611770760267973, 0.00017687672516331077, 0.00012088462244719267, 8.996625547297299e-05 ], "bp_grad_F": [ 0.06979352980852127, 0.016320781782269478, 0.01088168565183878, 0.007916715927422047, 0.006064872723072767 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6884765625, "loss_eval": 0.8092349767684937, "epoch": 14 }, { "hidden_norms_cls": [ 1.2957582473754883, 11.933137893676758, 18.238237380981445, 23.88395118713379, 27.868513107299805 ], "hidden_norms_avg": [ 4.4383697509765625, 15.46267318725586, 19.841346740722656, 23.529712677001953, 25.852684020996094 ], "bp_grad_per_sample_l2_med": [ 0.0009947444777935743, 0.00024384066637139767, 0.00016608397709205747, 0.0001234996016137302, 9.023427992360666e-05 ], "bp_grad_F": [ 0.07019422203302383, 0.016806265339255333, 0.011433122679591179, 0.008135766722261906, 0.006158903241157532 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.712890625, "loss_eval": 0.7795700430870056, "epoch": 15 }, { "hidden_norms_cls": [ 1.3391923904418945, 11.329567909240723, 17.184999465942383, 22.353059768676758, 26.889299392700195 ], "hidden_norms_avg": [ 4.53090238571167, 15.341407775878906, 19.109649658203125, 22.223899841308594, 24.45347023010254 ], "bp_grad_per_sample_l2_med": [ 0.001086357282474637, 0.00030167572549544275, 0.0002114812668878585, 0.00015480270667467266, 0.00010993685282301158 ], "bp_grad_F": [ 0.06569939106702805, 0.017201317474246025, 0.012068319134414196, 0.008909368887543678, 0.006427914369851351 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7314453125, "loss_eval": 0.7724976539611816, "epoch": 16 }, { "hidden_norms_cls": [ 1.3643215894699097, 10.724340438842773, 16.144981384277344, 21.656490325927734, 25.777481079101562 ], "hidden_norms_avg": [ 4.520992279052734, 15.036820411682129, 18.98927879333496, 22.688859939575195, 24.71843910217285 ], "bp_grad_per_sample_l2_med": [ 0.000967099389526993, 0.0002715744194574654, 0.00019328886992298067, 0.00013628297892864794, 9.314809722127393e-05 ], "bp_grad_F": [ 0.06768078356981277, 0.01841692440211773, 0.012980606406927109, 0.009295133873820305, 0.006698420271277428 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.73828125, "loss_eval": 0.7337102890014648, "epoch": 17 }, { "hidden_norms_cls": [ 1.3963993787765503, 11.463358879089355, 16.49429702758789, 21.585325241088867, 25.636695861816406 ], "hidden_norms_avg": [ 4.539251327514648, 14.975208282470703, 18.360631942749023, 21.586400985717773, 23.561830520629883 ], "bp_grad_per_sample_l2_med": [ 0.0008780099451541901, 0.00024953793035820127, 0.00017615300021134317, 0.00012566034274641424, 8.528940088581294e-05 ], "bp_grad_F": [ 0.07198558002710342, 0.019673649221658707, 0.013869633898139, 0.009656366892158985, 0.006824122741818428 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7451171875, "loss_eval": 0.7211208343505859, "epoch": 18 }, { "hidden_norms_cls": [ 1.421103835105896, 9.9105806350708, 15.361790657043457, 20.334768295288086, 24.506919860839844 ], "hidden_norms_avg": [ 4.622361660003662, 14.7937650680542, 18.042116165161133, 21.208105087280273, 23.21940040588379 ], "bp_grad_per_sample_l2_med": [ 0.0007793674594722688, 0.0002331113355467096, 0.00016331924416590482, 0.00011330798588460311, 7.215427467599511e-05 ], "bp_grad_F": [ 0.07613872736692429, 0.022306306287646294, 0.015858706086874008, 0.011275039985775948, 0.007263499312102795 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7392578125, "loss_eval": 0.7346716523170471, "epoch": 19 }, { "hidden_norms_cls": [ 1.4554439783096313, 10.118419647216797, 15.106456756591797, 20.052860260009766, 24.34604263305664 ], "hidden_norms_avg": [ 4.584441661834717, 14.634279251098633, 17.785133361816406, 21.110010147094727, 22.89650535583496 ], "bp_grad_per_sample_l2_med": [ 0.0007524031680077314, 0.0002260785986436531, 0.00016854463319759816, 0.00011997718684142455, 7.738151180092245e-05 ], "bp_grad_F": [ 0.07370379567146301, 0.021284889429807663, 0.015382407233119011, 0.010745048522949219, 0.007394883316010237 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.74609375, "loss_eval": 0.7024286389350891, "epoch": 20 }, { "hidden_norms_cls": [ 1.4652466773986816, 10.145299911499023, 15.15330982208252, 20.131061553955078, 23.987186431884766 ], "hidden_norms_avg": [ 4.602361679077148, 14.532269477844238, 17.825733184814453, 21.43619728088379, 23.12371253967285 ], "bp_grad_per_sample_l2_med": [ 0.0008222013129852712, 0.0002455596113577485, 0.00017989490879699588, 0.00012026322656311095, 8.26524556032382e-05 ], "bp_grad_F": [ 0.0741497054696083, 0.020758304744958878, 0.01482379250228405, 0.010753357782959938, 0.007582026533782482 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7412109375, "loss_eval": 0.7016957402229309, "epoch": 21 }, { "hidden_norms_cls": [ 1.480756402015686, 10.028592109680176, 14.573174476623535, 19.24639320373535, 23.3629150390625 ], "hidden_norms_avg": [ 4.621757984161377, 14.29589557647705, 17.4040470123291, 20.71320343017578, 22.405963897705078 ], "bp_grad_per_sample_l2_med": [ 0.000667835003696382, 0.00020642780873458833, 0.0001538341457489878, 0.00010652844503056258, 6.964046770008281e-05 ], "bp_grad_F": [ 0.07375485450029373, 0.021967202425003052, 0.016106218099594116, 0.011507184244692326, 0.007651185616850853 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7607421875, "loss_eval": 0.6544591188430786, "epoch": 22 }, { "hidden_norms_cls": [ 1.5069013833999634, 9.897040367126465, 14.096169471740723, 18.488874435424805, 22.214311599731445 ], "hidden_norms_avg": [ 4.621402263641357, 13.978808403015137, 16.55535888671875, 19.729736328125, 21.272388458251953 ], "bp_grad_per_sample_l2_med": [ 0.0007426440715789795, 0.0002414636837784201, 0.00018161055049858987, 0.00012697202328126878, 8.096778037725016e-05 ], "bp_grad_F": [ 0.07682260870933533, 0.02333010919392109, 0.017287475988268852, 0.012499523349106312, 0.008510846644639969 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7568359375, "loss_eval": 0.6971542835235596, "epoch": 23 }, { "hidden_norms_cls": [ 1.5169755220413208, 9.5064058303833, 13.812594413757324, 17.95937156677246, 21.51923370361328 ], "hidden_norms_avg": [ 4.612667083740234, 13.86723804473877, 16.418981552124023, 19.12198257446289, 20.565521240234375 ], "bp_grad_per_sample_l2_med": [ 0.0007257908000610769, 0.00024720808141864836, 0.0001871327986009419, 0.00013439780741464347, 8.671147952554747e-05 ], "bp_grad_F": [ 0.07474599778652191, 0.024257108569145203, 0.01782340556383133, 0.01281843613833189, 0.008487668819725513 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.763671875, "loss_eval": 0.6618016958236694, "epoch": 24 }, { "hidden_norms_cls": [ 1.5133440494537354, 9.023777961730957, 13.088467597961426, 17.324251174926758, 21.083759307861328 ], "hidden_norms_avg": [ 4.670994281768799, 13.658943176269531, 16.629199981689453, 19.75893783569336, 21.12710952758789 ], "bp_grad_per_sample_l2_med": [ 0.0005614451365545392, 0.0001914121676236391, 0.00014186649059411138, 0.00010088241106132045, 6.150588887976483e-05 ], "bp_grad_F": [ 0.08172759413719177, 0.027048049494624138, 0.019993988797068596, 0.014050732366740704, 0.009047404862940311 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7626953125, "loss_eval": 0.6708824634552002, "epoch": 25 }, { "hidden_norms_cls": [ 1.5329865217208862, 8.596381187438965, 12.645307540893555, 16.668807983398438, 20.51462745666504 ], "hidden_norms_avg": [ 4.642580986022949, 13.140735626220703, 15.32632064819336, 17.985010147094727, 19.472858428955078 ], "bp_grad_per_sample_l2_med": [ 0.0005455430946312845, 0.00019156686903443187, 0.00014253854169510305, 0.00010098751954501495, 6.338314415188506e-05 ], "bp_grad_F": [ 0.08767001330852509, 0.029545463621616364, 0.021587952971458435, 0.014973495155572891, 0.009515349753201008 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.767578125, "loss_eval": 0.6813780069351196, "epoch": 26 }, { "hidden_norms_cls": [ 1.554770588874817, 8.98424243927002, 12.76674747467041, 16.438858032226562, 19.893146514892578 ], "hidden_norms_avg": [ 4.635522365570068, 13.039203643798828, 15.419903755187988, 18.176319122314453, 19.39232635498047 ], "bp_grad_per_sample_l2_med": [ 0.0005697832675650716, 0.0001985357521334663, 0.0001536469644634053, 0.00010455933079356328, 6.821998249506578e-05 ], "bp_grad_F": [ 0.07977671921253204, 0.02706393413245678, 0.020037846639752388, 0.014591805636882782, 0.009512925520539284 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.794921875, "loss_eval": 0.628034770488739, "epoch": 27 }, { "hidden_norms_cls": [ 1.5515426397323608, 8.19682788848877, 11.861184120178223, 15.59919548034668, 18.893400192260742 ], "hidden_norms_avg": [ 4.5841450691223145, 12.511472702026367, 14.583609580993652, 16.949586868286133, 18.082292556762695 ], "bp_grad_per_sample_l2_med": [ 0.0005373116582632065, 0.0001997901708818972, 0.0001489907590439543, 0.00010373342229286209, 6.318451050901785e-05 ], "bp_grad_F": [ 0.09340352565050125, 0.03397079557180405, 0.025108041241765022, 0.017669958993792534, 0.010975479148328304 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.767578125, "loss_eval": 0.7042175531387329, "epoch": 28 }, { "hidden_norms_cls": [ 1.5542187690734863, 8.489326477050781, 11.786734580993652, 15.331045150756836, 18.48196792602539 ], "hidden_norms_avg": [ 4.615735054016113, 12.620647430419922, 14.822388648986816, 17.454334259033203, 18.677461624145508 ], "bp_grad_per_sample_l2_med": [ 0.0005812083836644888, 0.00021461205324158072, 0.00015997944865375757, 0.00011693408305291086, 7.380295573966578e-05 ], "bp_grad_F": [ 0.09380948543548584, 0.03345760330557823, 0.025129586458206177, 0.01789030432701111, 0.011130682192742825 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7666015625, "loss_eval": 0.6850110292434692, "epoch": 29 }, { "hidden_norms_cls": [ 1.5533884763717651, 8.01724910736084, 11.423017501831055, 15.046612739562988, 18.549089431762695 ], "hidden_norms_avg": [ 4.590519428253174, 12.431540489196777, 14.243208885192871, 16.609176635742188, 18.00058937072754 ], "bp_grad_per_sample_l2_med": [ 0.0004959268844686449, 0.00020078590023331344, 0.00015426705067511648, 0.00010096926416736096, 5.95865749346558e-05 ], "bp_grad_F": [ 0.09663982689380646, 0.036162860691547394, 0.02716146595776081, 0.01926880143582821, 0.011334826238453388 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7783203125, "loss_eval": 0.6707749366760254, "epoch": 30 }, { "hidden_norms_cls": [ 1.5530469417572021, 7.959159851074219, 11.2805757522583, 14.567391395568848, 17.63263511657715 ], "hidden_norms_avg": [ 4.583434581756592, 11.983453750610352, 13.4386625289917, 15.498583793640137, 16.631824493408203 ], "bp_grad_per_sample_l2_med": [ 0.0005142099689692259, 0.00020230942755006254, 0.00015552931290585548, 0.00011007695866283029, 6.233472959138453e-05 ], "bp_grad_F": [ 0.09787525236606598, 0.037690743803977966, 0.028980012983083725, 0.02064511366188526, 0.012224731035530567 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7763671875, "loss_eval": 0.6748013496398926, "epoch": 31 }, { "hidden_norms_cls": [ 1.5515272617340088, 7.847743988037109, 10.868992805480957, 14.282126426696777, 17.300424575805664 ], "hidden_norms_avg": [ 4.579150199890137, 11.951078414916992, 13.621748924255371, 15.971713066101074, 17.04889488220215 ], "bp_grad_per_sample_l2_med": [ 0.0004585929855238646, 0.00017806614050641656, 0.0001380510366288945, 9.63187703746371e-05, 5.829996371176094e-05 ], "bp_grad_F": [ 0.10181005299091339, 0.038575656712055206, 0.02964734099805355, 0.020979750901460648, 0.01240287534892559 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.78125, "loss_eval": 0.648021936416626, "epoch": 32 }, { "hidden_norms_cls": [ 1.5606788396835327, 7.502675533294678, 10.430459022521973, 13.642136573791504, 16.445953369140625 ], "hidden_norms_avg": [ 4.601283550262451, 11.615697860717773, 13.472222328186035, 15.831238746643066, 16.856765747070312 ], "bp_grad_per_sample_l2_med": [ 0.0004074577009305358, 0.00017814920283854008, 0.00013730341743212193, 9.565176151227206e-05, 5.229458474786952e-05 ], "bp_grad_F": [ 0.11506060510873795, 0.04695325344800949, 0.03571247681975365, 0.025198202580213547, 0.013851121068000793 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.755859375, "loss_eval": 0.7299192547798157, "epoch": 33 }, { "hidden_norms_cls": [ 1.5404834747314453, 7.528626441955566, 10.384718894958496, 13.326257705688477, 16.41958999633789 ], "hidden_norms_avg": [ 4.533090591430664, 11.6575345993042, 13.231060028076172, 15.337231636047363, 16.463298797607422 ], "bp_grad_per_sample_l2_med": [ 0.00042279696208424866, 0.00016955600585788488, 0.00012915951083414257, 8.976108074421063e-05, 4.930083014187403e-05 ], "bp_grad_F": [ 0.11639728397130966, 0.047109171748161316, 0.03660130873322487, 0.02588750049471855, 0.013930009678006172 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.7065586447715759, "epoch": 34 }, { "hidden_norms_cls": [ 1.539638638496399, 7.26485013961792, 9.96584701538086, 13.003418922424316, 16.14008140563965 ], "hidden_norms_avg": [ 4.537028789520264, 11.146146774291992, 12.836923599243164, 14.992585182189941, 16.076574325561523 ], "bp_grad_per_sample_l2_med": [ 0.00039646061486564577, 0.00017108044994529337, 0.00013601842510979623, 9.225023677572608e-05, 4.893271398032084e-05 ], "bp_grad_F": [ 0.11648086458444595, 0.04862738400697708, 0.0374443456530571, 0.026762915775179863, 0.014388044364750385 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7939453125, "loss_eval": 0.6772804260253906, "epoch": 35 }, { "hidden_norms_cls": [ 1.5278778076171875, 7.107171058654785, 9.836174011230469, 12.691095352172852, 15.726043701171875 ], "hidden_norms_avg": [ 4.5205254554748535, 10.983088493347168, 12.684239387512207, 14.876561164855957, 15.817031860351562 ], "bp_grad_per_sample_l2_med": [ 0.0003774319775402546, 0.00015706375415902585, 0.0001264828024432063, 8.857168722897768e-05, 4.440043630893342e-05 ], "bp_grad_F": [ 0.12492093443870544, 0.053397826850414276, 0.040937285870313644, 0.029012493789196014, 0.015446576289832592 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7724609375, "loss_eval": 0.707297146320343, "epoch": 36 }, { "hidden_norms_cls": [ 1.51571524143219, 7.153889179229736, 9.856640815734863, 12.511648178100586, 15.47674560546875 ], "hidden_norms_avg": [ 4.51829719543457, 10.948126792907715, 12.496319770812988, 14.353506088256836, 15.267280578613281 ], "bp_grad_per_sample_l2_med": [ 0.0003654273459687829, 0.00015038737910799682, 0.00011584001913433895, 8.340556814800948e-05, 4.3377422116464004e-05 ], "bp_grad_F": [ 0.13914552330970764, 0.0589178130030632, 0.04522731155157089, 0.0323280394077301, 0.016300896182656288 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7626953125, "loss_eval": 0.729290246963501, "epoch": 37 }, { "hidden_norms_cls": [ 1.5081822872161865, 6.952159404754639, 9.558011054992676, 12.107258796691895, 15.05250358581543 ], "hidden_norms_avg": [ 4.481203556060791, 10.740157127380371, 12.00869083404541, 13.831336975097656, 14.76778507232666 ], "bp_grad_per_sample_l2_med": [ 0.0003083393967244774, 0.00012594371219165623, 0.00010108885180670768, 7.270355854416266e-05, 3.639453643700108e-05 ], "bp_grad_F": [ 0.14465992152690887, 0.061646901071071625, 0.047660429030656815, 0.03381076827645302, 0.01706051267683506 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7685546875, "loss_eval": 0.7395438551902771, "epoch": 38 }, { "hidden_norms_cls": [ 1.5159180164337158, 6.878056526184082, 9.382442474365234, 11.969950675964355, 15.129233360290527 ], "hidden_norms_avg": [ 4.494526386260986, 10.639691352844238, 12.291059494018555, 14.28632640838623, 15.170000076293945 ], "bp_grad_per_sample_l2_med": [ 0.00028951463173143566, 0.00012502263416536152, 0.00010040518827736378, 7.046512473607436e-05, 3.719307642313652e-05 ], "bp_grad_F": [ 0.1406005620956421, 0.06109313294291496, 0.047722309827804565, 0.033977217972278595, 0.01711316779255867 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7802734375, "loss_eval": 0.7057114839553833, "epoch": 39 }, { "hidden_norms_cls": [ 1.5058479309082031, 6.699619770050049, 9.136896133422852, 11.609856605529785, 14.701480865478516 ], "hidden_norms_avg": [ 4.482093811035156, 10.446189880371094, 12.056195259094238, 13.87569522857666, 14.783234596252441 ], "bp_grad_per_sample_l2_med": [ 0.0002856751380022615, 0.00013275284436531365, 0.00010139105870621279, 6.966136425035074e-05, 3.293903864687309e-05 ], "bp_grad_F": [ 0.1529398262500763, 0.06890096515417099, 0.052683208137750626, 0.03734185919165611, 0.01789216138422489 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.7478293180465698, "epoch": 40 }, { "hidden_norms_cls": [ 1.490049123764038, 6.627772331237793, 9.019189834594727, 11.385313987731934, 14.173355102539062 ], "hidden_norms_avg": [ 4.458098411560059, 10.279450416564941, 11.593936920166016, 13.30923080444336, 14.155406951904297 ], "bp_grad_per_sample_l2_med": [ 0.00021343027765396982, 9.837630932452157e-05, 8.006956340977922e-05, 5.6768003560137004e-05, 2.7385456633055583e-05 ], "bp_grad_F": [ 0.15772707760334015, 0.07120667397975922, 0.05564703419804573, 0.03953033685684204, 0.018776116892695427 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7724609375, "loss_eval": 0.7677009105682373, "epoch": 41 }, { "hidden_norms_cls": [ 1.4904595613479614, 6.347933769226074, 8.674281120300293, 11.007567405700684, 14.106690406799316 ], "hidden_norms_avg": [ 4.430132865905762, 10.265702247619629, 11.588266372680664, 13.410375595092773, 14.36179256439209 ], "bp_grad_per_sample_l2_med": [ 0.0002224426862085238, 0.00010000570182455704, 7.794459816068411e-05, 5.595289985649288e-05, 2.7256841349299066e-05 ], "bp_grad_F": [ 0.16928334534168243, 0.07747916132211685, 0.06056727096438408, 0.04274875670671463, 0.019731448963284492 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.771484375, "loss_eval": 0.7774850726127625, "epoch": 42 }, { "hidden_norms_cls": [ 1.4839239120483398, 6.341518878936768, 8.600671768188477, 10.991724014282227, 14.061833381652832 ], "hidden_norms_avg": [ 4.403061866760254, 10.020040512084961, 11.371668815612793, 13.18271255493164, 14.007345199584961 ], "bp_grad_per_sample_l2_med": [ 0.0002152575325453654, 0.00010309015488019213, 7.964189717313275e-05, 5.283725113258697e-05, 2.479495196894277e-05 ], "bp_grad_F": [ 0.17190901935100555, 0.080362468957901, 0.06201368197798729, 0.042563296854496, 0.019763268530368805 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.791015625, "loss_eval": 0.7503129243850708, "epoch": 43 }, { "hidden_norms_cls": [ 1.479953408241272, 6.386821269989014, 8.521474838256836, 10.847907066345215, 13.541037559509277 ], "hidden_norms_avg": [ 4.399942874908447, 9.979388236999512, 11.251038551330566, 12.998858451843262, 13.76570987701416 ], "bp_grad_per_sample_l2_med": [ 0.000195752116269432, 9.365259029436857e-05, 7.282401929842308e-05, 5.209222945268266e-05, 2.3047552531352267e-05 ], "bp_grad_F": [ 0.16316288709640503, 0.07674747705459595, 0.06052006781101227, 0.04277755320072174, 0.020131859928369522 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7978515625, "loss_eval": 0.732360303401947, "epoch": 44 }, { "hidden_norms_cls": [ 1.4770045280456543, 6.249807834625244, 8.36440658569336, 10.429434776306152, 13.045490264892578 ], "hidden_norms_avg": [ 4.391754627227783, 9.821492195129395, 10.789708137512207, 12.3140869140625, 13.067754745483398 ], "bp_grad_per_sample_l2_med": [ 0.0002329840644961223, 0.00011798225023085251, 9.261347440769896e-05, 6.294570630416274e-05, 2.9543562050093897e-05 ], "bp_grad_F": [ 0.1812749058008194, 0.08621949702501297, 0.067754827439785, 0.04831995815038681, 0.021977350115776062 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.7784227132797241, "epoch": 45 }, { "hidden_norms_cls": [ 1.467228651046753, 6.0983357429504395, 8.231528282165527, 10.333056449890137, 13.266757011413574 ], "hidden_norms_avg": [ 4.390368461608887, 9.647501945495605, 10.692501068115234, 12.274677276611328, 13.044783592224121 ], "bp_grad_per_sample_l2_med": [ 0.0001511751615907997, 7.784536137478426e-05, 6.136627780506387e-05, 4.35807196481619e-05, 2.014869824051857e-05 ], "bp_grad_F": [ 0.18805110454559326, 0.09124159067869186, 0.07224944978952408, 0.050726212561130524, 0.02254536561667919 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.814141571521759, "epoch": 46 }, { "hidden_norms_cls": [ 1.4649879932403564, 6.082813739776611, 8.131811141967773, 10.158056259155273, 13.049956321716309 ], "hidden_norms_avg": [ 4.377193927764893, 9.599099159240723, 10.660999298095703, 12.21728801727295, 12.965741157531738 ], "bp_grad_per_sample_l2_med": [ 0.0001712174853309989, 8.400671504205093e-05, 6.461612792918459e-05, 4.6120971092022955e-05, 2.0111323465243913e-05 ], "bp_grad_F": [ 0.19550266861915588, 0.09418290108442307, 0.07462290674448013, 0.053083814680576324, 0.02292729914188385 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7890625, "loss_eval": 0.7999259233474731, "epoch": 47 }, { "hidden_norms_cls": [ 1.4617111682891846, 6.058816432952881, 8.100686073303223, 10.085453987121582, 12.920005798339844 ], "hidden_norms_avg": [ 4.367196559906006, 9.56169605255127, 10.609153747558594, 12.135587692260742, 12.871316909790039 ], "bp_grad_per_sample_l2_med": [ 0.00015642307698726654, 7.727487536612898e-05, 5.90925665164832e-05, 4.136386633035727e-05, 1.6983105524559505e-05 ], "bp_grad_F": [ 0.202835351228714, 0.09727983921766281, 0.07683655619621277, 0.05471916124224663, 0.02326873689889908 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.783203125, "loss_eval": 0.8152254223823547, "epoch": 48 }, { "hidden_norms_cls": [ 1.4593255519866943, 6.017489433288574, 7.96034049987793, 9.983046531677246, 12.839889526367188 ], "hidden_norms_avg": [ 4.349035739898682, 9.508291244506836, 10.475739479064941, 12.025425910949707, 12.764323234558105 ], "bp_grad_per_sample_l2_med": [ 0.00013039771874900907, 6.479993317043409e-05, 5.060105831944384e-05, 3.637294139480218e-05, 1.4738084246346261e-05 ], "bp_grad_F": [ 0.2170599102973938, 0.10417382419109344, 0.08229079097509384, 0.05735529586672783, 0.024290865287184715 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7841796875, "loss_eval": 0.8357614278793335, "epoch": 49 }, { "hidden_norms_cls": [ 1.4566220045089722, 5.9422221183776855, 7.888944149017334, 9.933752059936523, 12.817610740661621 ], "hidden_norms_avg": [ 4.346043109893799, 9.43443489074707, 10.415618896484375, 11.964469909667969, 12.66396713256836 ], "bp_grad_per_sample_l2_med": [ 0.00011193535465281457, 5.694849824067205e-05, 4.533635365078226e-05, 3.3492226066300645e-05, 1.4018894034961704e-05 ], "bp_grad_F": [ 0.21774698793888092, 0.1065358892083168, 0.08431421220302582, 0.05883141607046127, 0.024615641683340073 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.8349668979644775, "epoch": 50 }, { "hidden_norms_cls": [ 1.4569600820541382, 5.859008312225342, 7.792572498321533, 9.738831520080566, 12.622002601623535 ], "hidden_norms_avg": [ 4.331563472747803, 9.398598670959473, 10.273933410644531, 11.764141082763672, 12.436033248901367 ], "bp_grad_per_sample_l2_med": [ 0.00012003595475107431, 5.908689126954414e-05, 4.746428385260515e-05, 3.251975431339815e-05, 1.3768915778200608e-05 ], "bp_grad_F": [ 0.2144007831811905, 0.10626016557216644, 0.08404342085123062, 0.05926896259188652, 0.024889416992664337 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7861328125, "loss_eval": 0.840790331363678, "epoch": 51 }, { "hidden_norms_cls": [ 1.4559087753295898, 5.8081440925598145, 7.735576629638672, 9.665096282958984, 12.462581634521484 ], "hidden_norms_avg": [ 4.331978797912598, 9.35647964477539, 10.206826210021973, 11.663065910339355, 12.307528495788574 ], "bp_grad_per_sample_l2_med": [ 0.00010101464431500062, 5.143512680660933e-05, 4.1592236811993644e-05, 3.0060553399380296e-05, 1.2701412742899265e-05 ], "bp_grad_F": [ 0.22189198434352875, 0.11008423566818237, 0.08644267171621323, 0.0603644996881485, 0.025003522634506226 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7900390625, "loss_eval": 0.8574135303497314, "epoch": 52 }, { "hidden_norms_cls": [ 1.4537159204483032, 5.80010461807251, 7.719310760498047, 9.681657791137695, 12.724189758300781 ], "hidden_norms_avg": [ 4.318180084228516, 9.302933692932129, 10.182857513427734, 11.675416946411133, 12.381869316101074 ], "bp_grad_per_sample_l2_med": [ 9.399914415553212e-05, 4.920759965898469e-05, 3.82029902539216e-05, 2.4410484911641106e-05, 9.912354471453e-06 ], "bp_grad_F": [ 0.2312120646238327, 0.11490234732627869, 0.09031722694635391, 0.06280362606048584, 0.02546737529337406 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7900390625, "loss_eval": 0.8825892210006714, "epoch": 53 }, { "hidden_norms_cls": [ 1.4533940553665161, 5.765341758728027, 7.664762496948242, 9.541180610656738, 12.46136474609375 ], "hidden_norms_avg": [ 4.321633815765381, 9.284127235412598, 10.135884284973145, 11.603636741638184, 12.27259635925293 ], "bp_grad_per_sample_l2_med": [ 0.00010168847802560776, 5.239037636783905e-05, 4.169415478827432e-05, 2.8813867174903862e-05, 1.1632122550508939e-05 ], "bp_grad_F": [ 0.23138603568077087, 0.11581514030694962, 0.09145721793174744, 0.06368965655565262, 0.025816213339567184 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7900390625, "loss_eval": 0.8627672791481018, "epoch": 54 }, { "hidden_norms_cls": [ 1.4520151615142822, 5.752710342407227, 7.6372294425964355, 9.493330001831055, 12.49281120300293 ], "hidden_norms_avg": [ 4.314420223236084, 9.275971412658691, 10.131872177124023, 11.594268798828125, 12.271230697631836 ], "bp_grad_per_sample_l2_med": [ 0.00010349372314522043, 5.0890805141534656e-05, 4.167861698078923e-05, 2.9301188988029025e-05, 1.1288396308373194e-05 ], "bp_grad_F": [ 0.23472057282924652, 0.11708012968301773, 0.09245092421770096, 0.06478185206651688, 0.025885937735438347 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.791015625, "loss_eval": 0.8611111640930176, "epoch": 55 }, { "hidden_norms_cls": [ 1.4508332014083862, 5.741517066955566, 7.59091329574585, 9.493820190429688, 12.553393363952637 ], "hidden_norms_avg": [ 4.315334320068359, 9.272273063659668, 10.107754707336426, 11.5936279296875, 12.266173362731934 ], "bp_grad_per_sample_l2_med": [ 9.209421114064753e-05, 4.9557409511180595e-05, 3.8665639294777066e-05, 2.703870450204704e-05, 1.0333649697713554e-05 ], "bp_grad_F": [ 0.23745231330394745, 0.11897031217813492, 0.09419847279787064, 0.06559450179338455, 0.02597379870712757 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.794921875, "loss_eval": 0.8737660646438599, "epoch": 56 }, { "hidden_norms_cls": [ 1.4514665603637695, 5.724127292633057, 7.567911624908447, 9.464110374450684, 12.53247356414795 ], "hidden_norms_avg": [ 4.312892436981201, 9.258728981018066, 10.092171669006348, 11.559837341308594, 12.241935729980469 ], "bp_grad_per_sample_l2_med": [ 8.842872193781659e-05, 4.636628364096396e-05, 3.5660887078847736e-05, 2.4343042241525836e-05, 9.563225830788724e-06 ], "bp_grad_F": [ 0.23917540907859802, 0.12006859481334686, 0.09492167085409164, 0.06607519090175629, 0.02614584006369114 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7939453125, "loss_eval": 0.8743407130241394, "epoch": 57 }, { "hidden_norms_cls": [ 1.4513946771621704, 5.7332282066345215, 7.562880992889404, 9.466405868530273, 12.53167724609375 ], "hidden_norms_avg": [ 4.3138651847839355, 9.26041316986084, 10.077324867248535, 11.538521766662598, 12.218836784362793 ], "bp_grad_per_sample_l2_med": [ 9.282731480197981e-05, 4.6137181925587356e-05, 3.7237725337035954e-05, 2.553310514485929e-05, 9.964967830455862e-06 ], "bp_grad_F": [ 0.24150457978248596, 0.12129233777523041, 0.09592130035161972, 0.06674522906541824, 0.026258554309606552 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7890625, "loss_eval": 0.8750766515731812, "epoch": 58 }, { "hidden_norms_cls": [ 1.4510550498962402, 5.730595111846924, 7.558650493621826, 9.460441589355469, 12.49626636505127 ], "hidden_norms_avg": [ 4.311552047729492, 9.2510347366333, 10.070302963256836, 11.530484199523926, 12.212501525878906 ], "bp_grad_per_sample_l2_med": [ 8.91910312930122e-05, 4.6800774725852534e-05, 3.584511432563886e-05, 2.5313198420917615e-05, 9.680608854978345e-06 ], "bp_grad_F": [ 0.24175073206424713, 0.12143565714359283, 0.09590216726064682, 0.06680992990732193, 0.026268428191542625 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.787109375, "loss_eval": 0.8746636509895325, "epoch": 59 }, { "hidden_norms_cls": [ 1.450972557067871, 5.727794647216797, 7.5582756996154785, 9.462045669555664, 12.50033187866211 ], "hidden_norms_avg": [ 4.311238765716553, 9.248146057128906, 10.065601348876953, 11.523144721984863, 12.206249237060547 ], "bp_grad_per_sample_l2_med": [ 8.883981354301795e-05, 4.730010550701991e-05, 3.57187855115626e-05, 2.4922017473727465e-05, 9.98118775896728e-06 ], "bp_grad_F": [ 0.24178682267665863, 0.12154776602983475, 0.09598654508590698, 0.06685590744018555, 0.026261666789650917 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.787109375, "loss_eval": 0.8750864863395691, "epoch": 60 } ], "dfa_log": [ { "hidden_norms_cls": [ 0.3210873007774353, 3.3568029403686523, 4.891699314117432, 6.200707912445068, 7.5911865234375 ], "hidden_norms_avg": [ 5.7549052238464355, 6.750590801239014, 7.9020819664001465, 8.925304412841797, 10.076716423034668 ], "bp_grad_per_sample_l2_med": [ 0.004074312746524811, 0.0011155740357935429, 0.0009667170234024525, 0.0008621186716482043, 0.0008127145702019334 ], "bp_grad_F": [ 0.20160320401191711, 0.039521340280771255, 0.033098917454481125, 0.029271923005580902, 0.027136052027344704 ], "gamma_dfa": 0.0011031709145754576, "gamma_dfa_per_layer": [ -0.004096934571862221, -0.003170878393575549, 0.003171987598761916, 0.008508509024977684 ], "acc_eval": 0.125, "loss_eval": 2.422111988067627, "epoch": 0 }, { "hidden_norms_cls": [ 1.7445409297943115, 3393.872314453125, 8096.7275390625, 11786.4453125, 15317.9609375 ], "hidden_norms_avg": [ 46.059967041015625, 2908.78857421875, 9192.9140625, 12480.814453125, 15843.904296875 ], "bp_grad_per_sample_l2_med": [ 0.0007700070273131132, 5.177932962396881e-07, 4.354141651674581e-07, 4.0796010125632165e-07, 4.096184795798763e-07 ], "bp_grad_F": [ 0.14847944676876068, 7.175570499384776e-05, 1.7355905583826825e-05, 1.4375820683198981e-05, 1.4468741937889718e-05 ], "gamma_dfa": 0.00903075491078198, "gamma_dfa_per_layer": [ 0.014700280502438545, 0.007455145940184593, 0.009132559411227703, 0.004835033789277077 ], "acc_eval": 0.2158203125, "loss_eval": 2.072723388671875, "epoch": 1 }, { "hidden_norms_cls": [ 3.5329439640045166, 17943.025390625, 46227.09765625, 60098.9921875, 105510.8828125 ], "hidden_norms_avg": [ 95.54289245605469, 14775.4267578125, 44856.01953125, 59234.35546875, 87862.078125 ], "bp_grad_per_sample_l2_med": [ 0.00029628784977830946, 1.0676165373979529e-07, 7.34040170868866e-08, 6.658416396021494e-08, 6.750254044618487e-08 ], "bp_grad_F": [ 0.12055971473455429, 8.933278149925172e-05, 3.910079612978734e-06, 3.3086737403209554e-06, 3.354543650857522e-06 ], "gamma_dfa": 0.007886230800068006, "gamma_dfa_per_layer": [ 0.016902755945920944, 0.003473796183243394, 0.009775697253644466, 0.0013926738174632192 ], "acc_eval": 0.2197265625, "loss_eval": 2.0924925804138184, "epoch": 2 }, { "hidden_norms_cls": [ 5.165565013885498, 33863.33203125, 93132.8515625, 145828.34375, 276496.0 ], "hidden_norms_avg": [ 142.7160186767578, 36882.9296875, 93356.96875, 138199.0625, 216913.359375 ], "bp_grad_per_sample_l2_med": [ 0.00022745825117453933, 4.267175768291054e-08, 3.181965624321492e-08, 2.8314032007870082e-08, 2.8843814448009653e-08 ], "bp_grad_F": [ 0.06954267621040344, 0.00012680335203185678, 2.0300262804084923e-06, 1.8529049157223199e-06, 1.8672349142434541e-06 ], "gamma_dfa": 0.00556139531545341, "gamma_dfa_per_layer": [ 0.01000538095831871, 0.0014471756294369698, 0.011906315572559834, -0.001113290898501873 ], "acc_eval": 0.2412109375, "loss_eval": 2.0521552562713623, "epoch": 3 }, { "hidden_norms_cls": [ 6.674264907836914, 43835.6796875, 150229.609375, 253133.515625, 481876.5 ], "hidden_norms_avg": [ 186.87832641601562, 74412.015625, 150159.890625, 253252.734375, 439077.25 ], "bp_grad_per_sample_l2_med": [ 0.0003350951592437923, 2.7693221937852286e-08, 1.989219278186738e-08, 1.704596108709211e-08, 1.7547710839949104e-08 ], "bp_grad_F": [ 0.058595605194568634, 0.0002476655936334282, 1.0984595064655878e-06, 1.0368654557169066e-06, 1.0405622106191004e-06 ], "gamma_dfa": 0.002481349220033735, "gamma_dfa_per_layer": [ 3.730843309313059e-05, 0.0014904557028785348, 0.011494583450257778, -0.0030969507060945034 ], "acc_eval": 0.232421875, "loss_eval": 2.058844566345215, "epoch": 4 }, { "hidden_norms_cls": [ 8.061405181884766, 102865.78125, 229004.390625, 413580.59375, 706253.625 ], "hidden_norms_avg": [ 228.99224853515625, 131342.546875, 229257.390625, 410435.25, 727001.6875 ], "bp_grad_per_sample_l2_med": [ 0.00029934433405287564, 1.670629679040303e-08, 1.3200744497510186e-08, 1.1068386207568892e-08, 1.1248447506773118e-08 ], "bp_grad_F": [ 0.49810686707496643, 0.0004038630868308246, 1.391591922583757e-06, 6.11680206930032e-07, 5.242948759587307e-07 ], "gamma_dfa": 0.0009187236428260803, "gamma_dfa_per_layer": [ -0.003027769736945629, 0.002294017933309078, 0.00904145184904337, -0.004632805474102497 ], "acc_eval": 0.2197265625, "loss_eval": 2.091141700744629, "epoch": 5 }, { "hidden_norms_cls": [ 9.400635719299316, 164205.859375, 302756.3125, 584338.25, 1250749.125 ], "hidden_norms_avg": [ 270.8563232421875, 190832.34375, 307117.59375, 620500.3125, 1149191.375 ], "bp_grad_per_sample_l2_med": [ 0.00034470504033379257, 1.3897826889319731e-08, 8.662226491651381e-09, 6.850678690994982e-09, 7.0105756755367565e-09 ], "bp_grad_F": [ 0.08854538202285767, 0.0002125167811755091, 3.9876397295302013e-07, 2.9177280680414697e-07, 2.903063318626664e-07 ], "gamma_dfa": 0.0008902656263671815, "gamma_dfa_per_layer": [ -0.004116768017411232, 0.004187953192740679, 0.007109872996807098, -0.003619995666667819 ], "acc_eval": 0.208984375, "loss_eval": 2.09378981590271, "epoch": 6 }, { "hidden_norms_cls": [ 10.676177978515625, 216327.671875, 429372.28125, 910110.1875, 1955787.375 ], "hidden_norms_avg": [ 311.3556823730469, 279124.65625, 434169.5, 917506.125, 1714750.5 ], "bp_grad_per_sample_l2_med": [ 0.0002802011731546372, 8.183582700382885e-09, 5.617039278149605e-09, 4.765932093420133e-09, 4.884364024348997e-09 ], "bp_grad_F": [ 0.2021757811307907, 0.00017153903900180012, 2.627296851187566e-07, 1.9583571031489555e-07, 1.9719628596703842e-07 ], "gamma_dfa": 0.00245969754178077, "gamma_dfa_per_layer": [ 0.0030665153171867132, 0.0039703575894236565, 0.005591260269284248, -0.0027893430087715387 ], "acc_eval": 0.224609375, "loss_eval": 2.0816030502319336, "epoch": 7 }, { "hidden_norms_cls": [ 11.970849990844727, 282019.0, 553729.25, 1250316.5, 2676136.75 ], "hidden_norms_avg": [ 350.0874938964844, 367917.96875, 563719.125, 1231394.75, 2379567.75 ], "bp_grad_per_sample_l2_med": [ 0.00015754146443214267, 7.837374305097455e-09, 4.1749870227647534e-09, 3.572480755664742e-09, 3.6429026462059255e-09 ], "bp_grad_F": [ 0.06816119700670242, 0.0002165154874091968, 1.8739321205885062e-07, 1.4396131575722393e-07, 1.449055417879208e-07 ], "gamma_dfa": 0.0018902571755461395, "gamma_dfa_per_layer": [ 0.0010774387046694756, 0.004019944928586483, 0.004736708011478186, -0.0022730629425495863 ], "acc_eval": 0.2236328125, "loss_eval": 2.069587469100952, "epoch": 8 }, { "hidden_norms_cls": [ 13.234355926513672, 498576.65625, 747356.3125, 1569417.0, 3492356.0 ], "hidden_norms_avg": [ 390.34356689453125, 517596.5, 755798.625, 1559863.25, 3087860.75 ], "bp_grad_per_sample_l2_med": [ 0.00012954612611792982, 6.955718223622398e-09, 3.3238092278509157e-09, 2.7362234700234467e-09, 2.7891511322764018e-09 ], "bp_grad_F": [ 0.03943011909723282, 0.00019621588580776006, 1.9796995331944345e-07, 1.1484767270530938e-07, 1.1313876058238748e-07 ], "gamma_dfa": 0.002013051969697699, "gamma_dfa_per_layer": [ 0.0007974229520186782, 0.0045172227546572685, 0.004162413999438286, -0.0014248518273234367 ], "acc_eval": 0.21484375, "loss_eval": 2.0846829414367676, "epoch": 9 }, { "hidden_norms_cls": [ 14.412362098693848, 653898.875, 962527.9375, 1974772.75, 4235229.0 ], "hidden_norms_avg": [ 426.1747741699219, 660897.75, 954217.625, 1992937.5, 3912584.0 ], "bp_grad_per_sample_l2_med": [ 0.0001297950657317415, 8.463428180505161e-09, 2.735849546908753e-09, 2.2942541200166033e-09, 2.329255233135541e-09 ], "bp_grad_F": [ 0.07335253059864044, 0.0002778704511001706, 2.1924184068211616e-07, 1.5885484572208952e-07, 9.551467172741468e-08 ], "gamma_dfa": 0.001994484744500369, "gamma_dfa_per_layer": [ 0.0028600264340639114, 0.0031631651800125837, 0.0033731083385646343, -0.0014183609746396542 ], "acc_eval": 0.2373046875, "loss_eval": 2.0768301486968994, "epoch": 10 }, { "hidden_norms_cls": [ 15.627301216125488, 805321.625, 1191654.25, 2375967.75, 5068243.5 ], "hidden_norms_avg": [ 464.92144775390625, 870169.75, 1209570.75, 2342305.5, 4797491.0 ], "bp_grad_per_sample_l2_med": [ 0.00014358766202349216, 6.655038742309216e-09, 2.213497385383789e-09, 1.8578552030135143e-09, 1.8845198734851465e-09 ], "bp_grad_F": [ 0.22341646254062653, 0.0010545816039666533, 3.022053363110899e-07, 8.581165644727662e-08, 7.942276880612553e-08 ], "gamma_dfa": 0.0012935771082993597, "gamma_dfa_per_layer": [ -0.00014482985716313124, 0.0035164642613381147, 0.002910400740802288, -0.0011077267117798328 ], "acc_eval": 0.2138671875, "loss_eval": 2.076242446899414, "epoch": 11 }, { "hidden_norms_cls": [ 16.751590728759766, 758638.375, 1437438.0, 2779040.25, 5662257.0 ], "hidden_norms_avg": [ 501.60235595703125, 1119163.625, 1513203.375, 2677392.25, 5339190.0 ], "bp_grad_per_sample_l2_med": [ 0.00020390149438753724, 5.5311413227343564e-09, 1.8890189412701375e-09, 1.6241474831701908e-09, 1.6578916017806478e-09 ], "bp_grad_F": [ 1.734735369682312, 0.000374374445527792, 1.2862761877840967e-07, 1.1062630989044919e-07, 6.887377423936414e-08 ], "gamma_dfa": 0.0020944410644005984, "gamma_dfa_per_layer": [ 0.0036250988487154245, 0.0027163547929376364, 0.0028407545760273933, -0.0008044439600780606 ], "acc_eval": 0.23046875, "loss_eval": 2.083003520965576, "epoch": 12 }, { "hidden_norms_cls": [ 17.76032066345215, 1093088.5, 1739864.0, 3080344.5, 6632118.5 ], "hidden_norms_avg": [ 539.1420288085938, 1433551.75, 1843404.125, 3096921.75, 6237853.0 ], "bp_grad_per_sample_l2_med": [ 0.00014031230239197612, 4.252878937904825e-09, 1.704668295410272e-09, 1.518661418842271e-09, 1.5263605934734414e-09 ], "bp_grad_F": [ 0.05247655138373375, 0.00048432740732096136, 1.395327586806161e-07, 8.375257465331742e-08, 5.970760241780226e-08 ], "gamma_dfa": 0.0018704376125242561, "gamma_dfa_per_layer": [ 0.0021162822376936674, 0.003257386852055788, 0.002796958899125457, -0.0006888775387778878 ], "acc_eval": 0.2177734375, "loss_eval": 2.1021971702575684, "epoch": 13 }, { "hidden_norms_cls": [ 18.760025024414062, 2223954.75, 2460609.0, 3718541.25, 7618764.0 ], "hidden_norms_avg": [ 577.8324584960938, 1908819.625, 2348359.5, 3542983.0, 6779725.0 ], "bp_grad_per_sample_l2_med": [ 0.00010403544729342684, 2.662567277766925e-09, 1.6195218499603925e-09, 1.422262307926303e-09, 1.433551610752204e-09 ], "bp_grad_F": [ 0.08673901855945587, 0.0001567020226502791, 8.41187173250546e-08, 5.8843131256480774e-08, 5.371895994699116e-08 ], "gamma_dfa": 0.003976444830186665, "gamma_dfa_per_layer": [ 0.010876781307160854, 0.0029237696435302496, 0.0026041539385914803, -0.000498925568535924 ], "acc_eval": 0.2177734375, "loss_eval": 2.138009548187256, "epoch": 14 }, { "hidden_norms_cls": [ 19.738407135009766, 2339586.0, 2696652.5, 4235438.5, 7955372.0 ], "hidden_norms_avg": [ 619.4888916015625, 2243613.75, 2801893.5, 4018190.75, 7143025.0 ], "bp_grad_per_sample_l2_med": [ 0.00014718857710249722, 2.6654392026870255e-09, 1.4668186665289795e-09, 1.3113429231381701e-09, 1.3212382299343517e-09 ], "bp_grad_F": [ 0.1564428061246872, 0.00024187436792999506, 2.621962664761668e-07, 5.580703898999673e-08, 5.442945649747344e-08 ], "gamma_dfa": 0.0019682426573126577, "gamma_dfa_per_layer": [ 0.003052386222407222, 0.0027148486115038395, 0.0025699653197079897, -0.00046422952436842024 ], "acc_eval": 0.2265625, "loss_eval": 2.145447254180908, "epoch": 15 }, { "hidden_norms_cls": [ 20.727081298828125, 2753822.5, 3114285.75, 4713040.0, 8652256.0 ], "hidden_norms_avg": [ 660.8045654296875, 2684893.0, 3331407.5, 4614215.5, 7864381.5 ], "bp_grad_per_sample_l2_med": [ 0.00013858993770554662, 2.7730009399817845e-09, 1.344458322449782e-09, 1.2393497339502346e-09, 1.2431760065823028e-09 ], "bp_grad_F": [ 0.1324291080236435, 0.00022225745487958193, 9.285694346772289e-08, 4.7669061586930184e-08, 4.746264181676452e-08 ], "gamma_dfa": 0.001855946145951748, "gamma_dfa_per_layer": [ 0.004218719433993101, 0.001718730665743351, 0.0019668969325721264, -0.0004805624485015869 ], "acc_eval": 0.251953125, "loss_eval": 2.101409673690796, "epoch": 16 }, { "hidden_norms_cls": [ 21.603151321411133, 3877476.75, 4156743.75, 5474745.5, 10299149.0 ], "hidden_norms_avg": [ 698.7645263671875, 3523264.5, 4085091.75, 5354783.0, 9094561.0 ], "bp_grad_per_sample_l2_med": [ 0.000199332891497761, 1.9098649328697093e-09, 1.2144363292776461e-09, 1.1166952917918138e-09, 1.1315383074972374e-09 ], "bp_grad_F": [ 0.15142236649990082, 4.2183397454209626e-05, 7.309424887580462e-08, 5.2962114693855256e-08, 4.2337880756804225e-08 ], "gamma_dfa": 0.0013709207050851546, "gamma_dfa_per_layer": [ 0.0023175266105681658, 0.0016730788629502058, 0.0018372924532741308, -0.0003442151064518839 ], "acc_eval": 0.220703125, "loss_eval": 2.1280713081359863, "epoch": 17 }, { "hidden_norms_cls": [ 22.48230743408203, 3581296.5, 4024996.25, 6183271.0, 11393130.0 ], "hidden_norms_avg": [ 735.2485961914062, 4017679.75, 4751523.5, 6215236.0, 10366257.0 ], "bp_grad_per_sample_l2_med": [ 0.00018803548300638795, 1.895784862426808e-09, 1.1237420993737146e-09, 1.0378963244406236e-09, 1.0573794062551656e-09 ], "bp_grad_F": [ 0.12878409028053284, 4.194497887510806e-05, 4.941083631138099e-08, 3.9714532107382183e-08, 3.994472663748638e-08 ], "gamma_dfa": 0.0012161588310846128, "gamma_dfa_per_layer": [ 0.0021385664585977793, 0.0015012789517641068, 0.0016565187834203243, -0.0004317288694437593 ], "acc_eval": 0.2158203125, "loss_eval": 2.1137895584106445, "epoch": 18 }, { "hidden_norms_cls": [ 23.29258155822754, 4616424.5, 5061994.0, 6831782.5, 12437102.0 ], "hidden_norms_avg": [ 768.5599975585938, 4586839.5, 5567332.5, 6953557.0, 11342041.0 ], "bp_grad_per_sample_l2_med": [ 0.00021542877948377281, 1.9688994878919175e-09, 1.0831572305747272e-09, 9.59386015075836e-10, 9.76972058808201e-10 ], "bp_grad_F": [ 0.09346769750118256, 4.979455843567848e-05, 4.6927411290198506e-08, 3.8312244043936516e-08, 3.882623289541698e-08 ], "gamma_dfa": 0.0011904535058420151, "gamma_dfa_per_layer": [ 0.0024171490222215652, 0.0012326111318543553, 0.0015420420095324516, -0.0004299881402403116 ], "acc_eval": 0.2333984375, "loss_eval": 2.0970499515533447, "epoch": 19 }, { "hidden_norms_cls": [ 24.054462432861328, 5806660.5, 6270370.0, 7861086.0, 14600824.0 ], "hidden_norms_avg": [ 801.1851806640625, 5855518.5, 6747570.0, 8137969.0, 13373154.0 ], "bp_grad_per_sample_l2_med": [ 0.00012799039541278034, 1.5442244150065676e-09, 9.774002718287989e-10, 8.729071909741037e-10, 8.921305361120346e-10 ], "bp_grad_F": [ 0.9552626609802246, 1.163827892014524e-05, 2.461903250150499e-07, 3.4675800009154045e-08, 3.4831803219503854e-08 ], "gamma_dfa": 0.0018355100764892995, "gamma_dfa_per_layer": [ 0.004604285582900047, 0.00167210737708956, 0.001404301729053259, -0.0003386543830856681 ], "acc_eval": 0.2138671875, "loss_eval": 2.11769700050354, "epoch": 20 }, { "hidden_norms_cls": [ 24.826902389526367, 6414338.0, 6989573.0, 8609765.0, 15368301.0 ], "hidden_norms_avg": [ 830.1490478515625, 6946265.5, 7916239.0, 9224772.0, 14431417.0 ], "bp_grad_per_sample_l2_med": [ 0.00015248128329403698, 1.4729809594271615e-09, 9.462167716023373e-10, 8.629364445233989e-10, 8.805687845558907e-10 ], "bp_grad_F": [ 0.1705506592988968, 0.00016797611897345632, 4.810285503253908e-08, 3.399246040203252e-08, 3.436711182303043e-08 ], "gamma_dfa": 0.0015317398574552499, "gamma_dfa_per_layer": [ 0.004021936096251011, 0.0012830595951527357, 0.0012305387062951922, -0.00040857496787793934 ], "acc_eval": 0.2236328125, "loss_eval": 2.102954864501953, "epoch": 21 }, { "hidden_norms_cls": [ 25.52900505065918, 8152435.5, 8736555.0, 9881049.0, 16997340.0 ], "hidden_norms_avg": [ 858.3137817382812, 7544203.0, 8860779.0, 10224814.0, 15607154.0 ], "bp_grad_per_sample_l2_med": [ 0.0001363755582133308, 1.2969386675720784e-09, 9.174655479782245e-10, 8.421383035361885e-10, 8.538599827190296e-10 ], "bp_grad_F": [ 0.07549053430557251, 2.9420058126561344e-05, 5.8904493727141016e-08, 3.187446395713778e-08, 3.1860317051268794e-08 ], "gamma_dfa": 0.0023631651129107922, "gamma_dfa_per_layer": [ 0.007739294320344925, 0.0009300304809585214, 0.001171439653262496, -0.00038810400292277336 ], "acc_eval": 0.2080078125, "loss_eval": 2.1162400245666504, "epoch": 22 }, { "hidden_norms_cls": [ 26.122589111328125, 9255466.0, 9964734.0, 11054792.0, 18565818.0 ], "hidden_norms_avg": [ 884.7098388671875, 8814330.0, 10177720.0, 11552646.0, 17489728.0 ], "bp_grad_per_sample_l2_med": [ 0.00014142012514639646, 1.3653665975610352e-09, 8.580440802319345e-10, 7.922714151398225e-10, 8.032630116616701e-10 ], "bp_grad_F": [ 0.11926258355379105, 1.2633940968953539e-05, 3.893048727832138e-08, 3.075604126934195e-08, 3.043995278062539e-08 ], "gamma_dfa": 0.0013515961618395522, "gamma_dfa_per_layer": [ 0.0038036422338336706, 0.0009011125075630844, 0.0010650388430804014, -0.0003634089371189475 ], "acc_eval": 0.201171875, "loss_eval": 2.134256362915039, "epoch": 23 }, { "hidden_norms_cls": [ 26.71797752380371, 8691604.0, 9652268.0, 11413482.0, 19342164.0 ], "hidden_norms_avg": [ 908.3400268554688, 9418884.0, 11132975.0, 12548590.0, 18516546.0 ], "bp_grad_per_sample_l2_med": [ 0.00016020517796278, 1.5232745065318909e-09, 8.103306359252826e-10, 7.392123024807518e-10, 7.529800671868259e-10 ], "bp_grad_F": [ 0.08055854588747025, 1.5452902516699396e-05, 3.9288735820264264e-08, 3.091117406484045e-08, 2.9865013573271426e-08 ], "gamma_dfa": 0.0012649961790884845, "gamma_dfa_per_layer": [ 0.0036856848746538162, 0.0008738536853343248, 0.0009324033162556589, -0.00043195715988986194 ], "acc_eval": 0.216796875, "loss_eval": 2.1074087619781494, "epoch": 24 }, { "hidden_norms_cls": [ 27.27407455444336, 9931691.0, 10836582.0, 12350148.0, 20677670.0 ], "hidden_norms_avg": [ 931.8362426757812, 10575293.0, 12476721.0, 13979366.0, 20145220.0 ], "bp_grad_per_sample_l2_med": [ 0.0002644142950884998, 1.4137412351900025e-09, 7.711813965194381e-10, 7.245293809354791e-10, 7.329452600401964e-10 ], "bp_grad_F": [ 0.08752908557653427, 3.3139032893814147e-05, 4.584432744536571e-08, 2.996421955003825e-08, 2.8689356668110122e-08 ], "gamma_dfa": 0.0013240749976830557, "gamma_dfa_per_layer": [ 0.003940493334084749, 0.0008323215297423303, 0.0009093738626688719, -0.0003858887357637286 ], "acc_eval": 0.2080078125, "loss_eval": 2.1011557579040527, "epoch": 25 }, { "hidden_norms_cls": [ 27.817367553710938, 12253263.0, 13105294.0, 14345712.0, 22455440.0 ], "hidden_norms_avg": [ 953.0517578125, 12373978.0, 14141729.0, 15597335.0, 22309104.0 ], "bp_grad_per_sample_l2_med": [ 0.00014759604528080672, 1.123480086739903e-09, 7.102037291595309e-10, 6.690955567378865e-10, 6.791667228611686e-10 ], "bp_grad_F": [ 0.05615593492984772, 0.00010146480053663254, 3.714368190799178e-08, 2.748037175592799e-08, 2.6385574614096186e-08 ], "gamma_dfa": 0.0012311612081248313, "gamma_dfa_per_layer": [ 0.003369898535311222, 0.0009893677197396755, 0.0009041082230396569, -0.0003387296455912292 ], "acc_eval": 0.234375, "loss_eval": 2.105236291885376, "epoch": 26 }, { "hidden_norms_cls": [ 28.32236099243164, 13643201.0, 14611628.0, 15764247.0, 24160378.0 ], "hidden_norms_avg": [ 973.9281616210938, 13221320.0, 15394035.0, 16890642.0, 23678466.0 ], "bp_grad_per_sample_l2_med": [ 0.00016657183005008847, 9.720990679085162e-10, 6.881580305595492e-10, 6.496979620962406e-10, 6.5528305004392e-10 ], "bp_grad_F": [ 0.21266740560531616, 1.0097430276800878e-05, 5.8009760550703504e-08, 2.5056060337647068e-08, 2.5318335872270836e-08 ], "gamma_dfa": 0.0010233484499622136, "gamma_dfa_per_layer": [ 0.0030805980786681175, 0.0005203179316595197, 0.000822446309030056, -0.00032996851950883865 ], "acc_eval": 0.212890625, "loss_eval": 2.137085437774658, "epoch": 27 }, { "hidden_norms_cls": [ 28.79292106628418, 13177481.0, 14299000.0, 15555998.0, 23304192.0 ], "hidden_norms_avg": [ 992.415771484375, 14624837.0, 16826644.0, 18325902.0, 25292966.0 ], "bp_grad_per_sample_l2_med": [ 0.00020211696391925216, 1.1425522750130312e-09, 6.55300591567709e-10, 6.094423854463571e-10, 6.189129764244683e-10 ], "bp_grad_F": [ 0.17359277606010437, 1.2817296010325663e-05, 7.396955936656013e-08, 2.5667416636565576e-08, 2.485118777428852e-08 ], "gamma_dfa": 0.0013693289074581116, "gamma_dfa_per_layer": [ 0.004313473589718342, 0.0007373306434601545, 0.000740988994948566, -0.00031447759829461575 ], "acc_eval": 0.2255859375, "loss_eval": 2.095831871032715, "epoch": 28 }, { "hidden_norms_cls": [ 29.206546783447266, 13026473.0, 14086985.0, 16207103.0, 25752542.0 ], "hidden_norms_avg": [ 1012.0676879882812, 14977745.0, 17788350.0, 19459138.0, 26297900.0 ], "bp_grad_per_sample_l2_med": [ 0.0002467916056048125, 1.5415436704913077e-09, 6.588643519656046e-10, 6.053296752739357e-10, 6.112412798131572e-10 ], "bp_grad_F": [ 0.042935822159051895, 9.192503966914956e-06, 3.478140442325639e-08, 2.366191687031005e-08, 2.384759412166204e-08 ], "gamma_dfa": 0.0008732089045224711, "gamma_dfa_per_layer": [ 0.002771018771454692, 0.00032788922544568777, 0.0007068651611916721, -0.0003129375400021672 ], "acc_eval": 0.2294921875, "loss_eval": 2.0877132415771484, "epoch": 29 }, { "hidden_norms_cls": [ 29.655010223388672, 18104814.0, 18959442.0, 20352136.0, 30115644.0 ], "hidden_norms_avg": [ 1030.1336669921875, 17704192.0, 19945910.0, 21540694.0, 29199112.0 ], "bp_grad_per_sample_l2_med": [ 0.00019920141494367272, 8.472024748407136e-10, 5.961620086480934e-10, 5.578593698096768e-10, 5.602495689593923e-10 ], "bp_grad_F": [ 0.05658308416604996, 2.5135868781944737e-05, 4.3493169954444966e-08, 2.1390142990185268e-08, 2.1341643119399123e-08 ], "gamma_dfa": 0.0010463381186127663, "gamma_dfa_per_layer": [ 0.0027386434376239777, 0.0009209397248923779, 0.0007645037840120494, -0.0002387344720773399 ], "acc_eval": 0.2138671875, "loss_eval": 2.1298673152923584, "epoch": 30 }, { "hidden_norms_cls": [ 30.063920974731445, 20103628.0, 20986630.0, 22120356.0, 31195618.0 ], "hidden_norms_avg": [ 1046.1927490234375, 18906620.0, 21404482.0, 23038508.0, 30526688.0 ], "bp_grad_per_sample_l2_med": [ 0.0002040969266090542, 9.528980937645315e-10, 5.700001026731627e-10, 5.158900528989818e-10, 5.214851328538828e-10 ], "bp_grad_F": [ 0.0816737711429596, 5.908617822569795e-05, 3.4592272157851767e-08, 2.022995992945198e-08, 2.0381063947638722e-08 ], "gamma_dfa": 0.001085347576008644, "gamma_dfa_per_layer": [ 0.0035934830084443092, 0.0002959886915050447, 0.0007062341319397092, -0.0002543155278544873 ], "acc_eval": 0.2041015625, "loss_eval": 2.116055965423584, "epoch": 31 }, { "hidden_norms_cls": [ 30.392677307128906, 21290946.0, 22100456.0, 23440498.0, 32839040.0 ], "hidden_norms_avg": [ 1062.797119140625, 20072588.0, 22866046.0, 24608556.0, 32259930.0 ], "bp_grad_per_sample_l2_med": [ 0.00022883246128913015, 1.3679187782500435e-09, 5.444520945196984e-10, 5.043216955158414e-10, 5.114720313947885e-10 ], "bp_grad_F": [ 0.2192479968070984, 0.0001256070681847632, 1.2757884348957305e-07, 2.0006645229386777e-08, 1.9971306386423748e-08 ], "gamma_dfa": 0.0019978012933279388, "gamma_dfa_per_layer": [ 0.0072806887328624725, 0.0002412673202343285, 0.000707695260643959, -0.00023844614042900503 ], "acc_eval": 0.2197265625, "loss_eval": 2.1034791469573975, "epoch": 32 }, { "hidden_norms_cls": [ 30.711090087890625, 22272344.0, 23036462.0, 24462584.0, 35130192.0 ], "hidden_norms_avg": [ 1082.3468017578125, 20945452.0, 23993758.0, 25838460.0, 33448582.0 ], "bp_grad_per_sample_l2_med": [ 0.0005148049676790833, 2.304462176638822e-09, 5.340937136999457e-10, 4.950916898671665e-10, 5.010572512453848e-10 ], "bp_grad_F": [ 0.15110087394714355, 3.209088754374534e-05, 1.0334197497741116e-07, 2.0131187383753968e-08, 1.9814510920923567e-08 ], "gamma_dfa": 0.003046433750569122, "gamma_dfa_per_layer": [ 0.011593285948038101, 0.00019314857490826398, 0.0006439671851694584, -0.0002446667058393359 ], "acc_eval": 0.208984375, "loss_eval": 2.112250328063965, "epoch": 33 }, { "hidden_norms_cls": [ 31.0146427154541, 29106790.0, 29617952.0, 31075512.0, 42307980.0 ], "hidden_norms_avg": [ 1102.4920654296875, 22080922.0, 25255976.0, 27220448.0, 35072796.0 ], "bp_grad_per_sample_l2_med": [ 0.0003266549902036786, 3.0358568992028268e-09, 4.893331295718895e-10, 4.395950825575312e-10, 4.4405815136094873e-10 ], "bp_grad_F": [ 1.0139163732528687, 1.6822159523144364e-05, 1.2544650473955699e-07, 1.6449900996917677e-08, 1.5756539184508256e-08 ], "gamma_dfa": 0.004347974703705404, "gamma_dfa_per_layer": [ 0.016904333606362343, -2.5271147023886442e-05, 0.0006614690646529198, -0.00014863270916976035 ], "acc_eval": 0.1806640625, "loss_eval": 2.1869568824768066, "epoch": 34 }, { "hidden_norms_cls": [ 31.282560348510742, 30793450.0, 31273076.0, 33029836.0, 44659544.0 ], "hidden_norms_avg": [ 1120.8310546875, 23223250.0, 26597348.0, 28740710.0, 37219140.0 ], "bp_grad_per_sample_l2_med": [ 0.0004533866886049509, 8.621259817154225e-10, 4.717314872060285e-10, 4.43607900413312e-10, 4.492739236194865e-10 ], "bp_grad_F": [ 0.8242164254188538, 9.425415555597283e-06, 6.696246401816097e-08, 1.4385987512355314e-08, 1.456661191667763e-08 ], "gamma_dfa": 0.004019053936644923, "gamma_dfa_per_layer": [ 0.015497363172471523, 0.0001274545502383262, 0.0006036070408299565, -0.00015220901696011424 ], "acc_eval": 0.1396484375, "loss_eval": 2.199540615081787, "epoch": 35 }, { "hidden_norms_cls": [ 31.512802124023438, 21969868.0, 22884238.0, 24682478.0, 38405980.0 ], "hidden_norms_avg": [ 1138.61962890625, 23861642.0, 27547416.0, 29877192.0, 38524416.0 ], "bp_grad_per_sample_l2_med": [ 0.00065120670478791, 1.8789774181016128e-09, 5.075246334307337e-10, 4.637440431665141e-10, 4.687980004192127e-10 ], "bp_grad_F": [ 0.22404567897319794, 6.978048531891545e-06, 5.974419536869391e-08, 1.854446907145757e-08, 1.8726453276940447e-08 ], "gamma_dfa": 0.0030916051182430238, "gamma_dfa_per_layer": [ 0.011011095717549324, 0.0010498585179448128, 0.0005736061139032245, -0.00026813987642526627 ], "acc_eval": 0.20703125, "loss_eval": 2.1297407150268555, "epoch": 36 }, { "hidden_norms_cls": [ 31.728811264038086, 29299954.0, 29843046.0, 31522240.0, 44597740.0 ], "hidden_norms_avg": [ 1154.2742919921875, 26176784.0, 29361794.0, 31622036.0, 40631524.0 ], "bp_grad_per_sample_l2_med": [ 0.00057179294526577, 8.620974489836897e-10, 4.3859474385676833e-10, 4.131678610352907e-10, 4.158901834028228e-10 ], "bp_grad_F": [ 0.1988120824098587, 6.200312782311812e-06, 7.633398269035752e-08, 1.800971105581084e-08, 1.6420651505200112e-08 ], "gamma_dfa": 0.0036353242212499026, "gamma_dfa_per_layer": [ 0.013258620165288448, 0.0009053392568603158, 0.0005595044931396842, -0.00018216703028883785 ], "acc_eval": 0.193359375, "loss_eval": 2.162503719329834, "epoch": 37 }, { "hidden_norms_cls": [ 31.93093490600586, 24153264.0, 24958016.0, 27164164.0, 41821856.0 ], "hidden_norms_avg": [ 1168.3504638671875, 25251302.0, 29331440.0, 31888322.0, 40732864.0 ], "bp_grad_per_sample_l2_med": [ 0.0007007869426161051, 3.803806603031035e-09, 4.6435830181046356e-10, 4.2823591894780577e-10, 4.335505288111108e-10 ], "bp_grad_F": [ 0.23370306193828583, 5.834654530190164e-06, 4.249230300956697e-08, 1.778762737103534e-08, 1.7575523258983594e-08 ], "gamma_dfa": 0.003036663241800852, "gamma_dfa_per_layer": [ 0.010693107731640339, 0.001166085829026997, 0.0005278221797198057, -0.00024036277318373322 ], "acc_eval": 0.2060546875, "loss_eval": 2.145090103149414, "epoch": 38 }, { "hidden_norms_cls": [ 32.11568069458008, 30941254.0, 31479742.0, 33270594.0, 46886708.0 ], "hidden_norms_avg": [ 1180.89794921875, 26732550.0, 30676362.0, 33269292.0, 42382468.0 ], "bp_grad_per_sample_l2_med": [ 0.0006622264045290649, 1.5328843749884413e-09, 4.1302217201888425e-10, 3.8878930630481534e-10, 3.9369618676232676e-10 ], "bp_grad_F": [ 0.7251601815223694, 2.9320523026399314e-05, 1.0578004605577007e-07, 1.5190060764780355e-08, 1.538120386612718e-08 ], "gamma_dfa": 0.0034242832334712148, "gamma_dfa_per_layer": [ 0.012806901708245277, 0.0005313451401889324, 0.0005365218385122716, -0.00017763575306162238 ], "acc_eval": 0.1904296875, "loss_eval": 2.1417269706726074, "epoch": 39 }, { "hidden_norms_cls": [ 32.295955657958984, 33935232.0, 34368956.0, 35934572.0, 47697056.0 ], "hidden_norms_avg": [ 1192.405517578125, 27784236.0, 31654758.0, 34253712.0, 43239588.0 ], "bp_grad_per_sample_l2_med": [ 0.000609845039434731, 1.1788049425476288e-09, 4.4074988103659507e-10, 3.883143528948807e-10, 3.8990835560248627e-10 ], "bp_grad_F": [ 0.3570167124271393, 5.2556606533471495e-06, 6.658066098452764e-08, 1.6441132899558397e-08, 1.5662063646004754e-08 ], "gamma_dfa": 0.0031971330136002507, "gamma_dfa_per_layer": [ 0.011760826222598553, 0.000679977354593575, 0.0005443703266791999, -0.00019664184947032481 ], "acc_eval": 0.1962890625, "loss_eval": 2.159468173980713, "epoch": 40 }, { "hidden_norms_cls": [ 32.446258544921875, 19652562.0, 21036314.0, 25921266.0, 40927384.0 ], "hidden_norms_avg": [ 1203.144287109375, 31749304.0, 34556376.0, 36976868.0, 47059032.0 ], "bp_grad_per_sample_l2_med": [ 0.0006137214368209243, 8.001962981118993e-10, 4.3686718131930036e-10, 4.163595301864831e-10, 4.1693556940280985e-10 ], "bp_grad_F": [ 0.12317141890525818, 1.0874373401748016e-05, 3.419825134187704e-08, 1.7081790204542813e-08, 1.7078438219186864e-08 ], "gamma_dfa": 0.002385696723649744, "gamma_dfa_per_layer": [ 0.008561503142118454, 0.000761325703933835, 0.00044924806570634246, -0.0002292900171596557 ], "acc_eval": 0.1943359375, "loss_eval": 2.1486196517944336, "epoch": 41 }, { "hidden_norms_cls": [ 32.65601348876953, 18852588.0, 20806824.0, 26129350.0, 41854136.0 ], "hidden_norms_avg": [ 1211.216064453125, 33512262.0, 36150576.0, 38488828.0, 48876332.0 ], "bp_grad_per_sample_l2_med": [ 0.00041886867256835103, 6.960994003435417e-10, 3.895795075425923e-10, 3.7316269518861134e-10, 3.8092326515304364e-10 ], "bp_grad_F": [ 0.14164908230304718, 1.2379082363622729e-06, 2.6289937338219715e-08, 1.6158612226035984e-08, 1.6345055087185756e-08 ], "gamma_dfa": 0.0026270662965544034, "gamma_dfa_per_layer": [ 0.009110232815146446, 0.0011993220541626215, 0.00041866287938319147, -0.00021995256247464567 ], "acc_eval": 0.19140625, "loss_eval": 2.1592655181884766, "epoch": 42 }, { "hidden_norms_cls": [ 32.8077507019043, 13604255.0, 20737208.0, 26201736.0, 38498212.0 ], "hidden_norms_avg": [ 1218.5357666015625, 34337856.0, 37186496.0, 39492900.0, 49837356.0 ], "bp_grad_per_sample_l2_med": [ 0.00024631666019558907, 7.821958081244418e-10, 3.8121927836698433e-10, 3.6691791271969976e-10, 3.7013728193535655e-10 ], "bp_grad_F": [ 0.16077305376529694, 4.323472239775583e-06, 3.772007772795405e-08, 1.5986831414238623e-08, 1.5948634413121e-08 ], "gamma_dfa": 0.002168099657865241, "gamma_dfa_per_layer": [ 0.007105600088834763, 0.0013786349445581436, 0.00041434637387283146, -0.00022618277580477297 ], "acc_eval": 0.193359375, "loss_eval": 2.1537227630615234, "epoch": 43 }, { "hidden_norms_cls": [ 32.95870590209961, 17278438.0, 21010234.0, 26451948.0, 41976576.0 ], "hidden_norms_avg": [ 1225.39501953125, 36196112.0, 38833272.0, 41042520.0, 51415488.0 ], "bp_grad_per_sample_l2_med": [ 0.00017274360288865864, 7.227461407133262e-10, 3.619011756939017e-10, 3.5793992769761473e-10, 3.6092046018509905e-10 ], "bp_grad_F": [ 0.9672663807868958, 3.41643476531317e-06, 5.25712664511957e-08, 1.5481989024124232e-08, 1.548605688128646e-08 ], "gamma_dfa": 0.001979457345441915, "gamma_dfa_per_layer": [ 0.006772718392312527, 0.0009743775590322912, 0.00037397228879854083, -0.00020323885837569833 ], "acc_eval": 0.208984375, "loss_eval": 2.1646997928619385, "epoch": 44 }, { "hidden_norms_cls": [ 33.06986999511719, 23368844.0, 24521804.0, 27230594.0, 45358652.0 ], "hidden_norms_avg": [ 1231.394287109375, 38020996.0, 40414464.0, 42538228.0, 53283596.0 ], "bp_grad_per_sample_l2_med": [ 0.00015840897685848176, 6.067092384043349e-10, 3.4933173020945674e-10, 3.3962907486362326e-10, 3.42745692938351e-10 ], "bp_grad_F": [ 0.3695656955242157, 2.3579739263368538e-06, 5.5092176154403205e-08, 1.777137192959799e-08, 1.4559810246339566e-08 ], "gamma_dfa": 0.0020704490307252854, "gamma_dfa_per_layer": [ 0.007164421491324902, 0.0009055124246515334, 0.0003939281450584531, -0.00018206593813374639 ], "acc_eval": 0.203125, "loss_eval": 2.1666717529296875, "epoch": 45 }, { "hidden_norms_cls": [ 33.164432525634766, 29174184.0, 30089798.0, 32367896.0, 48892740.0 ], "hidden_norms_avg": [ 1237.1142578125, 37470168.0, 40219512.0, 42356984.0, 52772660.0 ], "bp_grad_per_sample_l2_med": [ 0.00024464691523462534, 5.441591066634999e-10, 3.6414088411262924e-10, 3.320065611323031e-10, 3.387692348866267e-10 ], "bp_grad_F": [ 0.20688536763191223, 4.435638402355835e-06, 8.288016317692382e-08, 1.4215274291018432e-08, 1.4331217101926086e-08 ], "gamma_dfa": 0.0017712319058773573, "gamma_dfa_per_layer": [ 0.006079941056668758, 0.0008057263912633061, 0.00038248312193900347, -0.0001832229463616386 ], "acc_eval": 0.1806640625, "loss_eval": 2.173765182495117, "epoch": 46 }, { "hidden_norms_cls": [ 33.24842071533203, 33830332.0, 34499304.0, 36673048.0, 51963528.0 ], "hidden_norms_avg": [ 1242.226318359375, 38073352.0, 40806512.0, 42901500.0, 53437180.0 ], "bp_grad_per_sample_l2_med": [ 0.0002524294250179082, 5.388652302151797e-10, 3.6845529405304944e-10, 3.3760005901939394e-10, 3.4174474361492457e-10 ], "bp_grad_F": [ 0.12659014761447906, 2.532647158659529e-06, 5.97612910269163e-08, 1.3431267653629675e-08, 1.3499856343912597e-08 ], "gamma_dfa": 0.0021579467684205156, "gamma_dfa_per_layer": [ 0.007928929291665554, 0.00047530903248116374, 0.00039780279621481895, -0.0001702540466794744 ], "acc_eval": 0.2099609375, "loss_eval": 2.161896228790283, "epoch": 47 }, { "hidden_norms_cls": [ 33.338741302490234, 19795148.0, 21916948.0, 27189936.0, 43588712.0 ], "hidden_norms_avg": [ 1246.7552490234375, 38983196.0, 41658504.0, 43769460.0, 54177164.0 ], "bp_grad_per_sample_l2_med": [ 0.0002599447325337678, 6.2289540192495e-10, 3.6807956682594067e-10, 3.4037242468976103e-10, 3.472495624379235e-10 ], "bp_grad_F": [ 0.11130323261022568, 6.972830760787474e-06, 5.447330764241087e-08, 1.4756569299834155e-08, 1.4917180379825368e-08 ], "gamma_dfa": 0.0021847522366442718, "gamma_dfa_per_layer": [ 0.007594278547912836, 0.0009666476398706436, 0.0003712670295499265, -0.00019318427075631917 ], "acc_eval": 0.1904296875, "loss_eval": 2.1626296043395996, "epoch": 48 }, { "hidden_norms_cls": [ 33.42045974731445, 24898126.0, 26009376.0, 28516464.0, 47394980.0 ], "hidden_norms_avg": [ 1250.1884765625, 39632580.0, 42285708.0, 44390100.0, 55233620.0 ], "bp_grad_per_sample_l2_med": [ 0.0001829452667152509, 5.726033536213038e-10, 3.5659752928296484e-10, 3.292066619309253e-10, 3.31846911061362e-10 ], "bp_grad_F": [ 0.23442988097667694, 3.2595114589639707e-06, 1.0605135969399271e-07, 1.4677630666426467e-08, 1.445219677265186e-08 ], "gamma_dfa": 0.0021932553718215786, "gamma_dfa_per_layer": [ 0.007973091676831245, 0.0006458763382397592, 0.00032728860969655216, -0.00017323513748124242 ], "acc_eval": 0.1923828125, "loss_eval": 2.175835609436035, "epoch": 49 }, { "hidden_norms_cls": [ 33.47613525390625, 25550002.0, 26776384.0, 28507352.0, 47268464.0 ], "hidden_norms_avg": [ 1253.279541015625, 39494300.0, 42348356.0, 44479368.0, 55121100.0 ], "bp_grad_per_sample_l2_med": [ 0.00012893354869447649, 5.787402224122218e-10, 3.341840137949248e-10, 3.2919431069977634e-10, 3.3201591476128556e-10 ], "bp_grad_F": [ 0.10876749455928802, 4.772132342623081e-06, 7.90316647680811e-08, 1.4042406348835357e-08, 1.4153799909877307e-08 ], "gamma_dfa": 0.001727514507365413, "gamma_dfa_per_layer": [ 0.0062596434727311134, 0.0004772312822751701, 0.000357049866579473, -0.0001838665921241045 ], "acc_eval": 0.1904296875, "loss_eval": 2.164583444595337, "epoch": 50 }, { "hidden_norms_cls": [ 33.52043914794922, 28050636.0, 29099278.0, 31227182.0, 49045872.0 ], "hidden_norms_avg": [ 1255.7454833984375, 40231008.0, 42960368.0, 45079784.0, 55989944.0 ], "bp_grad_per_sample_l2_med": [ 0.00015386792074423283, 5.41802436249128e-10, 3.373940293815991e-10, 3.3321326253776817e-10, 3.361276257329848e-10 ], "bp_grad_F": [ 0.2656819522380829, 2.482481932020164e-06, 8.287289432473699e-08, 1.3792345932017724e-08, 1.3917338392843703e-08 ], "gamma_dfa": 0.001938080065883696, "gamma_dfa_per_layer": [ 0.006978346034884453, 0.0005946386372670531, 0.00036033656215295196, -0.00018100097076967359 ], "acc_eval": 0.1962890625, "loss_eval": 2.176473379135132, "epoch": 51 }, { "hidden_norms_cls": [ 33.55419921875, 25508434.0, 26505134.0, 29051658.0, 47339916.0 ], "hidden_norms_avg": [ 1257.7822265625, 40388772.0, 43162480.0, 45217960.0, 55966100.0 ], "bp_grad_per_sample_l2_med": [ 0.00018102869216818362, 5.443374639924059e-10, 3.9548594954474936e-10, 3.679410942591943e-10, 3.717116892065775e-10 ], "bp_grad_F": [ 0.28429684042930603, 3.3983885714405915e-06, 8.993236377818903e-08, 1.4510244561449781e-08, 1.4562592021150067e-08 ], "gamma_dfa": 0.001642326584260445, "gamma_dfa_per_layer": [ 0.006192460190504789, 0.00019942648941650987, 0.00037004181649535894, -0.0001926221593748778 ], "acc_eval": 0.2001953125, "loss_eval": 2.1743006706237793, "epoch": 52 }, { "hidden_norms_cls": [ 33.58127212524414, 28540952.0, 29607362.0, 31472670.0, 49191068.0 ], "hidden_norms_avg": [ 1259.4189453125, 40550800.0, 43364984.0, 45506960.0, 56297104.0 ], "bp_grad_per_sample_l2_med": [ 0.00018638238543644547, 5.299162220140374e-10, 3.2437005859087265e-10, 3.1624741714253446e-10, 3.1920088794379353e-10 ], "bp_grad_F": [ 0.21056434512138367, 3.217361381757655e-06, 5.1724125427199397e-08, 1.390105897058902e-08, 1.3961146017038573e-08 ], "gamma_dfa": 0.0018532263711676933, "gamma_dfa_per_layer": [ 0.006584585644304752, 0.0006806463352404535, 0.00032758695306256413, -0.00017991344793699682 ], "acc_eval": 0.19921875, "loss_eval": 2.167957067489624, "epoch": 53 }, { "hidden_norms_cls": [ 33.60611343383789, 27949698.0, 28918304.0, 31366946.0, 48876736.0 ], "hidden_norms_avg": [ 1260.694091796875, 41001392.0, 43744060.0, 45853688.0, 56636716.0 ], "bp_grad_per_sample_l2_med": [ 0.00021861983987037092, 5.396287861003657e-10, 3.377726154329963e-10, 3.201852394330018e-10, 3.237338452866112e-10 ], "bp_grad_F": [ 0.12415990233421326, 1.6796100226201816e-06, 6.823196940786147e-08, 1.384469427989643e-08, 1.3965705036866893e-08 ], "gamma_dfa": 0.0017868579998321366, "gamma_dfa_per_layer": [ 0.006317156832665205, 0.0006519090966321528, 0.0003622731601353735, -0.00018390709010418504 ], "acc_eval": 0.1953125, "loss_eval": 2.178144931793213, "epoch": 54 }, { "hidden_norms_cls": [ 33.620914459228516, 27607036.0, 28622492.0, 31370470.0, 48645068.0 ], "hidden_norms_avg": [ 1261.64208984375, 40948476.0, 43773536.0, 45888992.0, 56623536.0 ], "bp_grad_per_sample_l2_med": [ 0.0002112231741193682, 5.336073249928575e-10, 3.533912051878474e-10, 3.186636232666018e-10, 3.226934830458106e-10 ], "bp_grad_F": [ 0.1486925333738327, 3.3336793876515003e-06, 9.466339889740993e-08, 1.4568017014937595e-08, 1.4240884915750485e-08 ], "gamma_dfa": 0.0018792969822243322, "gamma_dfa_per_layer": [ 0.006730419583618641, 0.000605170032940805, 0.0003661802038550377, -0.00018458189151715487 ], "acc_eval": 0.1982421875, "loss_eval": 2.172356367111206, "epoch": 55 }, { "hidden_norms_cls": [ 33.63143539428711, 28410040.0, 29532286.0, 31697578.0, 48914624.0 ], "hidden_norms_avg": [ 1262.2918701171875, 40698620.0, 43622904.0, 45764712.0, 56531748.0 ], "bp_grad_per_sample_l2_med": [ 0.0002270409750053659, 5.479600106994553e-10, 3.2429942065093087e-10, 3.150284755282229e-10, 3.179212726411862e-10 ], "bp_grad_F": [ 0.10118122398853302, 2.5195840862579644e-06, 8.798109263352671e-08, 1.3570585544186997e-08, 1.3736383586149259e-08 ], "gamma_dfa": 0.0017859039653558284, "gamma_dfa_per_layer": [ 0.006382801569998264, 0.0005453285994008183, 0.00039217708399519324, -0.00017669139197096229 ], "acc_eval": 0.1943359375, "loss_eval": 2.1648902893066406, "epoch": 56 }, { "hidden_norms_cls": [ 33.63875961303711, 31114778.0, 32184654.0, 34278688.0, 50894352.0 ], "hidden_norms_avg": [ 1262.7132568359375, 40792528.0, 43713536.0, 45850224.0, 56615416.0 ], "bp_grad_per_sample_l2_med": [ 0.00019923689251299948, 5.368823718931992e-10, 3.306654117185559e-10, 3.113070912164062e-10, 3.1328556415743947e-10 ], "bp_grad_F": [ 0.3573400378227234, 1.249598790309392e-05, 1.6106491784739774e-07, 3.301076745287901e-08, 1.3328084413899433e-08 ], "gamma_dfa": 0.0016940671957854647, "gamma_dfa_per_layer": [ 0.006114102900028229, 0.0004918627091683447, 0.00032346430816687644, -0.00015316113422159106 ], "acc_eval": 0.201171875, "loss_eval": 2.1634349822998047, "epoch": 57 }, { "hidden_norms_cls": [ 33.642520904541016, 31868976.0, 32779660.0, 35005740.0, 51305220.0 ], "hidden_norms_avg": [ 1262.9461669921875, 41087592.0, 43928832.0, 46043268.0, 56839576.0 ], "bp_grad_per_sample_l2_med": [ 0.0002181618328904733, 5.162476557352136e-10, 3.3206276617292474e-10, 3.1130611977125966e-10, 3.1441516057384433e-10 ], "bp_grad_F": [ 0.12289460748434067, 1.5301338862627745e-05, 8.779379356838035e-08, 1.4331889452989799e-08, 1.318165843144925e-08 ], "gamma_dfa": 0.001529279034002684, "gamma_dfa_per_layer": [ 0.00539398193359375, 0.0005496743833646178, 0.00034435215638950467, -0.00017089233733713627 ], "acc_eval": 0.2021484375, "loss_eval": 2.164745807647705, "epoch": 58 }, { "hidden_norms_cls": [ 33.6442756652832, 31315430.0, 32160978.0, 34340796.0, 51077484.0 ], "hidden_norms_avg": [ 1263.062744140625, 41015680.0, 43882708.0, 46002096.0, 56770896.0 ], "bp_grad_per_sample_l2_med": [ 0.00021884885791223496, 5.177114292820306e-10, 3.350683897007656e-10, 3.101042200803761e-10, 3.12167347527037e-10 ], "bp_grad_F": [ 0.11127890646457672, 1.1515544429130387e-05, 8.542571805492116e-08, 1.319963871537766e-08, 1.3264477516372608e-08 ], "gamma_dfa": 0.0016308917693095282, "gamma_dfa_per_layer": [ 0.005676542408764362, 0.0006629846757277846, 0.0003523063496686518, -0.0001682663569226861 ], "acc_eval": 0.19921875, "loss_eval": 2.1635866165161133, "epoch": 59 }, { "hidden_norms_cls": [ 33.643985748291016, 31097308.0, 32052318.0, 34155804.0, 50803736.0 ], "hidden_norms_avg": [ 1263.064208984375, 40997444.0, 43870400.0, 45990872.0, 56755540.0 ], "bp_grad_per_sample_l2_med": [ 0.00021703331731259823, 5.1921633659191e-10, 3.35882821556055e-10, 3.102589296588576e-10, 3.1300673164480486e-10 ], "bp_grad_F": [ 0.1889268010854721, 1.0328590178687591e-05, 1.1096560825762936e-07, 1.3215729843807367e-08, 1.3306935997547953e-08 ], "gamma_dfa": 0.0016646812255203258, "gamma_dfa_per_layer": [ 0.005869406741112471, 0.0006016636616550386, 0.0003579354961402714, -0.00017028099682647735 ], "acc_eval": 0.2021484375, "loss_eval": 2.163691520690918, "epoch": 60 } ] }