summaryrefslogtreecommitdiff
path: root/results/snapshot_vit_v1/snapshot_vit_s123.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_vit_v1/snapshot_vit_s123.json')
-rw-r--r--results/snapshot_vit_v1/snapshot_vit_s123.json4594
1 files changed, 4594 insertions, 0 deletions
diff --git a/results/snapshot_vit_v1/snapshot_vit_s123.json b/results/snapshot_vit_v1/snapshot_vit_s123.json
new file mode 100644
index 0000000..93853cf
--- /dev/null
+++ b/results/snapshot_vit_v1/snapshot_vit_s123.json
@@ -0,0 +1,4594 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_vit_v1",
+ "epochs": 60,
+ "lr": 0.001,
+ "wd": 0.05,
+ "seed": 123,
+ "depth": 4,
+ "d_model": 128,
+ "n_heads": 4
+ },
+ "depth": 4,
+ "d_model": 128,
+ "architecture": "ViTMini",
+ "bp_log": [
+ {
+ "hidden_norms_cls": [
+ 0.3210873007774353,
+ 3.3568029403686523,
+ 4.891699314117432,
+ 6.200707912445068,
+ 7.5911865234375
+ ],
+ "hidden_norms_avg": [
+ 5.7549052238464355,
+ 6.750590801239014,
+ 7.9020819664001465,
+ 8.925304412841797,
+ 10.076716423034668
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.004074312746524811,
+ 0.0011155740357935429,
+ 0.0009667170234024525,
+ 0.0008621186716482043,
+ 0.0008127145702019334
+ ],
+ "bp_grad_F": [
+ 0.20160320401191711,
+ 0.039521340280771255,
+ 0.033098917454481125,
+ 0.029271923005580902,
+ 0.027136052027344704
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.125,
+ "loss_eval": 2.422111988067627,
+ "epoch": 0
+ },
+ {
+ "hidden_norms_cls": [
+ 0.4782717227935791,
+ 11.874238014221191,
+ 20.313709259033203,
+ 26.86528778076172,
+ 32.42327880859375
+ ],
+ "hidden_norms_avg": [
+ 3.8830745220184326,
+ 11.266603469848633,
+ 17.881502151489258,
+ 23.234352111816406,
+ 28.51181411743164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002827065996825695,
+ 0.00024586476502008736,
+ 0.00014567613834515214,
+ 0.00013882767234463245,
+ 0.0001400413311785087
+ ],
+ "bp_grad_F": [
+ 0.12621107697486877,
+ 0.009982436895370483,
+ 0.00507162231951952,
+ 0.004677945747971535,
+ 0.004658848978579044
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4697265625,
+ "loss_eval": 1.4472862482070923,
+ "epoch": 1
+ },
+ {
+ "hidden_norms_cls": [
+ 0.6104467511177063,
+ 13.787332534790039,
+ 22.073436737060547,
+ 28.480369567871094,
+ 33.141117095947266
+ ],
+ "hidden_norms_avg": [
+ 3.951775074005127,
+ 12.005932807922363,
+ 18.336896896362305,
+ 23.67597198486328,
+ 27.899608612060547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.002604336943477392,
+ 0.00026667251950129867,
+ 0.00014805165119469166,
+ 0.00013079405471216887,
+ 0.00012911780504509807
+ ],
+ "bp_grad_F": [
+ 0.12487494200468063,
+ 0.010650832206010818,
+ 0.005604646634310484,
+ 0.004644650500267744,
+ 0.00448915408924222
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5146484375,
+ "loss_eval": 1.291869878768921,
+ "epoch": 2
+ },
+ {
+ "hidden_norms_cls": [
+ 0.7104504108428955,
+ 13.74225902557373,
+ 21.90972328186035,
+ 28.958967208862305,
+ 33.262393951416016
+ ],
+ "hidden_norms_avg": [
+ 3.9180142879486084,
+ 13.097892761230469,
+ 19.570770263671875,
+ 24.899248123168945,
+ 28.65104866027832
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020766372326761484,
+ 0.00025831969105638564,
+ 0.00014769421250093728,
+ 0.00012920337030664086,
+ 0.00012324318231549114
+ ],
+ "bp_grad_F": [
+ 0.09676238149404526,
+ 0.010603155009448528,
+ 0.005832126829773188,
+ 0.00465927692130208,
+ 0.004435759503394365
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.529296875,
+ "loss_eval": 1.2694497108459473,
+ "epoch": 3
+ },
+ {
+ "hidden_norms_cls": [
+ 0.801612377166748,
+ 12.882991790771484,
+ 20.474157333374023,
+ 27.37413215637207,
+ 32.06389617919922
+ ],
+ "hidden_norms_avg": [
+ 3.8871910572052,
+ 13.333250999450684,
+ 19.042104721069336,
+ 24.029348373413086,
+ 27.96086311340332
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020045258570462465,
+ 0.000285606540273875,
+ 0.00016217664233408868,
+ 0.00013080642384011298,
+ 0.00011968115722993389
+ ],
+ "bp_grad_F": [
+ 0.09496191889047623,
+ 0.011928788386285305,
+ 0.006509022321552038,
+ 0.005044482182711363,
+ 0.004537967965006828
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.58203125,
+ "loss_eval": 1.119094967842102,
+ "epoch": 4
+ },
+ {
+ "hidden_norms_cls": [
+ 0.8653663396835327,
+ 12.994612693786621,
+ 20.49618148803711,
+ 26.709278106689453,
+ 30.303852081298828
+ ],
+ "hidden_norms_avg": [
+ 4.018242835998535,
+ 13.520885467529297,
+ 19.090721130371094,
+ 23.6751651763916,
+ 26.93212890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018953323597088456,
+ 0.000296358106425032,
+ 0.00017310198745690286,
+ 0.0001364975469186902,
+ 0.00012098452862119302
+ ],
+ "bp_grad_F": [
+ 0.09499228745698929,
+ 0.012825642712414265,
+ 0.007407570723444223,
+ 0.005570532754063606,
+ 0.004951393231749535
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.595703125,
+ "loss_eval": 1.0847156047821045,
+ "epoch": 5
+ },
+ {
+ "hidden_norms_cls": [
+ 0.9313029646873474,
+ 13.966381072998047,
+ 21.648372650146484,
+ 28.33364486694336,
+ 32.91484069824219
+ ],
+ "hidden_norms_avg": [
+ 4.053382396697998,
+ 15.042261123657227,
+ 20.74883270263672,
+ 25.032489776611328,
+ 28.55679702758789
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001841629622504115,
+ 0.0002753600711002946,
+ 0.0001624371943762526,
+ 0.0001305017649428919,
+ 0.00011278261081315577
+ ],
+ "bp_grad_F": [
+ 0.09068351984024048,
+ 0.0128449946641922,
+ 0.007257991470396519,
+ 0.005361978895962238,
+ 0.004660472739487886
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6103515625,
+ "loss_eval": 1.095273494720459,
+ "epoch": 6
+ },
+ {
+ "hidden_norms_cls": [
+ 0.9818395972251892,
+ 13.022477149963379,
+ 20.385391235351562,
+ 27.03214454650879,
+ 31.324769973754883
+ ],
+ "hidden_norms_avg": [
+ 4.1024041175842285,
+ 14.697205543518066,
+ 19.634239196777344,
+ 23.90021324157715,
+ 27.306678771972656
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015902157174423337,
+ 0.00027956697158515453,
+ 0.0001692597143119201,
+ 0.0001353132538497448,
+ 0.00011523282591952011
+ ],
+ "bp_grad_F": [
+ 0.07967441529035568,
+ 0.012528380379080772,
+ 0.007520876359194517,
+ 0.00570708978921175,
+ 0.004875381011515856
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.62890625,
+ "loss_eval": 1.0069011449813843,
+ "epoch": 7
+ },
+ {
+ "hidden_norms_cls": [
+ 1.0194361209869385,
+ 13.912450790405273,
+ 20.85824203491211,
+ 27.968477249145508,
+ 32.243431091308594
+ ],
+ "hidden_norms_avg": [
+ 4.178755283355713,
+ 14.875143051147461,
+ 20.261545181274414,
+ 24.636741638183594,
+ 27.893512725830078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001506888889707625,
+ 0.00028421770548447967,
+ 0.0001727779454085976,
+ 0.00013076694449409842,
+ 0.00010860477777896449
+ ],
+ "bp_grad_F": [
+ 0.07398127764463425,
+ 0.013124965131282806,
+ 0.007798053789883852,
+ 0.005717460531741381,
+ 0.004830002784729004
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.638671875,
+ "loss_eval": 0.9834396839141846,
+ "epoch": 8
+ },
+ {
+ "hidden_norms_cls": [
+ 1.077261209487915,
+ 12.524529457092285,
+ 19.766538619995117,
+ 25.7626895904541,
+ 30.03727149963379
+ ],
+ "hidden_norms_avg": [
+ 4.1816864013671875,
+ 14.304539680480957,
+ 19.208524703979492,
+ 23.25862693786621,
+ 26.313356399536133
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0014360174536705017,
+ 0.0003003668098244816,
+ 0.0001815372525015846,
+ 0.0001390709658153355,
+ 0.00011320491466904059
+ ],
+ "bp_grad_F": [
+ 0.0756259635090828,
+ 0.014865156263113022,
+ 0.008982912637293339,
+ 0.006551471073180437,
+ 0.005398898851126432
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6494140625,
+ "loss_eval": 0.971701979637146,
+ "epoch": 9
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1200045347213745,
+ 12.160452842712402,
+ 19.172168731689453,
+ 25.067665100097656,
+ 28.764787673950195
+ ],
+ "hidden_norms_avg": [
+ 4.289422035217285,
+ 15.51036262512207,
+ 20.407268524169922,
+ 24.061931610107422,
+ 26.493688583374023
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012870824430137873,
+ 0.00027074789977632463,
+ 0.0001742457679938525,
+ 0.0001348328951280564,
+ 0.000104573555290699
+ ],
+ "bp_grad_F": [
+ 0.07437644153833389,
+ 0.015084434300661087,
+ 0.009522279724478722,
+ 0.0069595095701515675,
+ 0.0055610560812056065
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6767578125,
+ "loss_eval": 0.8734689354896545,
+ "epoch": 10
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1509246826171875,
+ 12.219743728637695,
+ 19.352998733520508,
+ 25.70184326171875,
+ 29.580278396606445
+ ],
+ "hidden_norms_avg": [
+ 4.315939426422119,
+ 15.6610689163208,
+ 20.42215347290039,
+ 24.016841888427734,
+ 26.62118911743164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013146374840289354,
+ 0.0002733681467361748,
+ 0.0001865291123976931,
+ 0.00013389455853030086,
+ 0.00010298956476617604
+ ],
+ "bp_grad_F": [
+ 0.07836466282606125,
+ 0.015104672871530056,
+ 0.009902945719659328,
+ 0.0069915857166051865,
+ 0.005596037954092026
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6767578125,
+ "loss_eval": 0.917751669883728,
+ "epoch": 11
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2017452716827393,
+ 12.72107219696045,
+ 18.952699661254883,
+ 25.067615509033203,
+ 29.466550827026367
+ ],
+ "hidden_norms_avg": [
+ 4.358119487762451,
+ 15.672205924987793,
+ 20.140914916992188,
+ 24.013885498046875,
+ 26.668514251708984
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011630960507318377,
+ 0.00025659528910182416,
+ 0.0001693729282123968,
+ 0.0001237613905686885,
+ 9.384296572534367e-05
+ ],
+ "bp_grad_F": [
+ 0.07334695011377335,
+ 0.015075902454555035,
+ 0.009827414527535439,
+ 0.007068648934364319,
+ 0.005549146793782711
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6982421875,
+ "loss_eval": 0.8279671669006348,
+ "epoch": 12
+ },
+ {
+ "hidden_norms_cls": [
+ 1.234994649887085,
+ 12.283885955810547,
+ 18.62163543701172,
+ 24.3900203704834,
+ 28.36040496826172
+ ],
+ "hidden_norms_avg": [
+ 4.369320869445801,
+ 15.747625350952148,
+ 19.76953887939453,
+ 23.351999282836914,
+ 25.69841194152832
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011812442680820823,
+ 0.0002851892786566168,
+ 0.0001940266229212284,
+ 0.00013827465591020882,
+ 0.00010182376718148589
+ ],
+ "bp_grad_F": [
+ 0.07158326357603073,
+ 0.01604902744293213,
+ 0.010893523693084717,
+ 0.007844515144824982,
+ 0.005985426716506481
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.689453125,
+ "loss_eval": 0.8679210543632507,
+ "epoch": 13
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2675292491912842,
+ 11.706314086914062,
+ 18.347841262817383,
+ 24.01951789855957,
+ 28.1114501953125
+ ],
+ "hidden_norms_avg": [
+ 4.390969753265381,
+ 15.140497207641602,
+ 19.62596893310547,
+ 23.22857666015625,
+ 25.681791305541992
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010449079563841224,
+ 0.0002611770760267973,
+ 0.00017687672516331077,
+ 0.00012088462244719267,
+ 8.996625547297299e-05
+ ],
+ "bp_grad_F": [
+ 0.06979352980852127,
+ 0.016320781782269478,
+ 0.01088168565183878,
+ 0.007916715927422047,
+ 0.006064872723072767
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6884765625,
+ "loss_eval": 0.8092349767684937,
+ "epoch": 14
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2957582473754883,
+ 11.933137893676758,
+ 18.238237380981445,
+ 23.88395118713379,
+ 27.868513107299805
+ ],
+ "hidden_norms_avg": [
+ 4.4383697509765625,
+ 15.46267318725586,
+ 19.841346740722656,
+ 23.529712677001953,
+ 25.852684020996094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009947444777935743,
+ 0.00024384066637139767,
+ 0.00016608397709205747,
+ 0.0001234996016137302,
+ 9.023427992360666e-05
+ ],
+ "bp_grad_F": [
+ 0.07019422203302383,
+ 0.016806265339255333,
+ 0.011433122679591179,
+ 0.008135766722261906,
+ 0.006158903241157532
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.712890625,
+ "loss_eval": 0.7795700430870056,
+ "epoch": 15
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3391923904418945,
+ 11.329567909240723,
+ 17.184999465942383,
+ 22.353059768676758,
+ 26.889299392700195
+ ],
+ "hidden_norms_avg": [
+ 4.53090238571167,
+ 15.341407775878906,
+ 19.109649658203125,
+ 22.223899841308594,
+ 24.45347023010254
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001086357282474637,
+ 0.00030167572549544275,
+ 0.0002114812668878585,
+ 0.00015480270667467266,
+ 0.00010993685282301158
+ ],
+ "bp_grad_F": [
+ 0.06569939106702805,
+ 0.017201317474246025,
+ 0.012068319134414196,
+ 0.008909368887543678,
+ 0.006427914369851351
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7314453125,
+ "loss_eval": 0.7724976539611816,
+ "epoch": 16
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3643215894699097,
+ 10.724340438842773,
+ 16.144981384277344,
+ 21.656490325927734,
+ 25.777481079101562
+ ],
+ "hidden_norms_avg": [
+ 4.520992279052734,
+ 15.036820411682129,
+ 18.98927879333496,
+ 22.688859939575195,
+ 24.71843910217285
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000967099389526993,
+ 0.0002715744194574654,
+ 0.00019328886992298067,
+ 0.00013628297892864794,
+ 9.314809722127393e-05
+ ],
+ "bp_grad_F": [
+ 0.06768078356981277,
+ 0.01841692440211773,
+ 0.012980606406927109,
+ 0.009295133873820305,
+ 0.006698420271277428
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.73828125,
+ "loss_eval": 0.7337102890014648,
+ "epoch": 17
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3963993787765503,
+ 11.463358879089355,
+ 16.49429702758789,
+ 21.585325241088867,
+ 25.636695861816406
+ ],
+ "hidden_norms_avg": [
+ 4.539251327514648,
+ 14.975208282470703,
+ 18.360631942749023,
+ 21.586400985717773,
+ 23.561830520629883
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008780099451541901,
+ 0.00024953793035820127,
+ 0.00017615300021134317,
+ 0.00012566034274641424,
+ 8.528940088581294e-05
+ ],
+ "bp_grad_F": [
+ 0.07198558002710342,
+ 0.019673649221658707,
+ 0.013869633898139,
+ 0.009656366892158985,
+ 0.006824122741818428
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7451171875,
+ "loss_eval": 0.7211208343505859,
+ "epoch": 18
+ },
+ {
+ "hidden_norms_cls": [
+ 1.421103835105896,
+ 9.9105806350708,
+ 15.361790657043457,
+ 20.334768295288086,
+ 24.506919860839844
+ ],
+ "hidden_norms_avg": [
+ 4.622361660003662,
+ 14.7937650680542,
+ 18.042116165161133,
+ 21.208105087280273,
+ 23.21940040588379
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007793674594722688,
+ 0.0002331113355467096,
+ 0.00016331924416590482,
+ 0.00011330798588460311,
+ 7.215427467599511e-05
+ ],
+ "bp_grad_F": [
+ 0.07613872736692429,
+ 0.022306306287646294,
+ 0.015858706086874008,
+ 0.011275039985775948,
+ 0.007263499312102795
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7392578125,
+ "loss_eval": 0.7346716523170471,
+ "epoch": 19
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4554439783096313,
+ 10.118419647216797,
+ 15.106456756591797,
+ 20.052860260009766,
+ 24.34604263305664
+ ],
+ "hidden_norms_avg": [
+ 4.584441661834717,
+ 14.634279251098633,
+ 17.785133361816406,
+ 21.110010147094727,
+ 22.89650535583496
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007524031680077314,
+ 0.0002260785986436531,
+ 0.00016854463319759816,
+ 0.00011997718684142455,
+ 7.738151180092245e-05
+ ],
+ "bp_grad_F": [
+ 0.07370379567146301,
+ 0.021284889429807663,
+ 0.015382407233119011,
+ 0.010745048522949219,
+ 0.007394883316010237
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.74609375,
+ "loss_eval": 0.7024286389350891,
+ "epoch": 20
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4652466773986816,
+ 10.145299911499023,
+ 15.15330982208252,
+ 20.131061553955078,
+ 23.987186431884766
+ ],
+ "hidden_norms_avg": [
+ 4.602361679077148,
+ 14.532269477844238,
+ 17.825733184814453,
+ 21.43619728088379,
+ 23.12371253967285
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008222013129852712,
+ 0.0002455596113577485,
+ 0.00017989490879699588,
+ 0.00012026322656311095,
+ 8.26524556032382e-05
+ ],
+ "bp_grad_F": [
+ 0.0741497054696083,
+ 0.020758304744958878,
+ 0.01482379250228405,
+ 0.010753357782959938,
+ 0.007582026533782482
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7412109375,
+ "loss_eval": 0.7016957402229309,
+ "epoch": 21
+ },
+ {
+ "hidden_norms_cls": [
+ 1.480756402015686,
+ 10.028592109680176,
+ 14.573174476623535,
+ 19.24639320373535,
+ 23.3629150390625
+ ],
+ "hidden_norms_avg": [
+ 4.621757984161377,
+ 14.29589557647705,
+ 17.4040470123291,
+ 20.71320343017578,
+ 22.405963897705078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000667835003696382,
+ 0.00020642780873458833,
+ 0.0001538341457489878,
+ 0.00010652844503056258,
+ 6.964046770008281e-05
+ ],
+ "bp_grad_F": [
+ 0.07375485450029373,
+ 0.021967202425003052,
+ 0.016106218099594116,
+ 0.011507184244692326,
+ 0.007651185616850853
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7607421875,
+ "loss_eval": 0.6544591188430786,
+ "epoch": 22
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5069013833999634,
+ 9.897040367126465,
+ 14.096169471740723,
+ 18.488874435424805,
+ 22.214311599731445
+ ],
+ "hidden_norms_avg": [
+ 4.621402263641357,
+ 13.978808403015137,
+ 16.55535888671875,
+ 19.729736328125,
+ 21.272388458251953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007426440715789795,
+ 0.0002414636837784201,
+ 0.00018161055049858987,
+ 0.00012697202328126878,
+ 8.096778037725016e-05
+ ],
+ "bp_grad_F": [
+ 0.07682260870933533,
+ 0.02333010919392109,
+ 0.017287475988268852,
+ 0.012499523349106312,
+ 0.008510846644639969
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7568359375,
+ "loss_eval": 0.6971542835235596,
+ "epoch": 23
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5169755220413208,
+ 9.5064058303833,
+ 13.812594413757324,
+ 17.95937156677246,
+ 21.51923370361328
+ ],
+ "hidden_norms_avg": [
+ 4.612667083740234,
+ 13.86723804473877,
+ 16.418981552124023,
+ 19.12198257446289,
+ 20.565521240234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007257908000610769,
+ 0.00024720808141864836,
+ 0.0001871327986009419,
+ 0.00013439780741464347,
+ 8.671147952554747e-05
+ ],
+ "bp_grad_F": [
+ 0.07474599778652191,
+ 0.024257108569145203,
+ 0.01782340556383133,
+ 0.01281843613833189,
+ 0.008487668819725513
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.763671875,
+ "loss_eval": 0.6618016958236694,
+ "epoch": 24
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5133440494537354,
+ 9.023777961730957,
+ 13.088467597961426,
+ 17.324251174926758,
+ 21.083759307861328
+ ],
+ "hidden_norms_avg": [
+ 4.670994281768799,
+ 13.658943176269531,
+ 16.629199981689453,
+ 19.75893783569336,
+ 21.12710952758789
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005614451365545392,
+ 0.0001914121676236391,
+ 0.00014186649059411138,
+ 0.00010088241106132045,
+ 6.150588887976483e-05
+ ],
+ "bp_grad_F": [
+ 0.08172759413719177,
+ 0.027048049494624138,
+ 0.019993988797068596,
+ 0.014050732366740704,
+ 0.009047404862940311
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7626953125,
+ "loss_eval": 0.6708824634552002,
+ "epoch": 25
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5329865217208862,
+ 8.596381187438965,
+ 12.645307540893555,
+ 16.668807983398438,
+ 20.51462745666504
+ ],
+ "hidden_norms_avg": [
+ 4.642580986022949,
+ 13.140735626220703,
+ 15.32632064819336,
+ 17.985010147094727,
+ 19.472858428955078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005455430946312845,
+ 0.00019156686903443187,
+ 0.00014253854169510305,
+ 0.00010098751954501495,
+ 6.338314415188506e-05
+ ],
+ "bp_grad_F": [
+ 0.08767001330852509,
+ 0.029545463621616364,
+ 0.021587952971458435,
+ 0.014973495155572891,
+ 0.009515349753201008
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.767578125,
+ "loss_eval": 0.6813780069351196,
+ "epoch": 26
+ },
+ {
+ "hidden_norms_cls": [
+ 1.554770588874817,
+ 8.98424243927002,
+ 12.76674747467041,
+ 16.438858032226562,
+ 19.893146514892578
+ ],
+ "hidden_norms_avg": [
+ 4.635522365570068,
+ 13.039203643798828,
+ 15.419903755187988,
+ 18.176319122314453,
+ 19.39232635498047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005697832675650716,
+ 0.0001985357521334663,
+ 0.0001536469644634053,
+ 0.00010455933079356328,
+ 6.821998249506578e-05
+ ],
+ "bp_grad_F": [
+ 0.07977671921253204,
+ 0.02706393413245678,
+ 0.020037846639752388,
+ 0.014591805636882782,
+ 0.009512925520539284
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.794921875,
+ "loss_eval": 0.628034770488739,
+ "epoch": 27
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5515426397323608,
+ 8.19682788848877,
+ 11.861184120178223,
+ 15.59919548034668,
+ 18.893400192260742
+ ],
+ "hidden_norms_avg": [
+ 4.5841450691223145,
+ 12.511472702026367,
+ 14.583609580993652,
+ 16.949586868286133,
+ 18.082292556762695
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005373116582632065,
+ 0.0001997901708818972,
+ 0.0001489907590439543,
+ 0.00010373342229286209,
+ 6.318451050901785e-05
+ ],
+ "bp_grad_F": [
+ 0.09340352565050125,
+ 0.03397079557180405,
+ 0.025108041241765022,
+ 0.017669958993792534,
+ 0.010975479148328304
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.767578125,
+ "loss_eval": 0.7042175531387329,
+ "epoch": 28
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5542187690734863,
+ 8.489326477050781,
+ 11.786734580993652,
+ 15.331045150756836,
+ 18.48196792602539
+ ],
+ "hidden_norms_avg": [
+ 4.615735054016113,
+ 12.620647430419922,
+ 14.822388648986816,
+ 17.454334259033203,
+ 18.677461624145508
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005812083836644888,
+ 0.00021461205324158072,
+ 0.00015997944865375757,
+ 0.00011693408305291086,
+ 7.380295573966578e-05
+ ],
+ "bp_grad_F": [
+ 0.09380948543548584,
+ 0.03345760330557823,
+ 0.025129586458206177,
+ 0.01789030432701111,
+ 0.011130682192742825
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7666015625,
+ "loss_eval": 0.6850110292434692,
+ "epoch": 29
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5533884763717651,
+ 8.01724910736084,
+ 11.423017501831055,
+ 15.046612739562988,
+ 18.549089431762695
+ ],
+ "hidden_norms_avg": [
+ 4.590519428253174,
+ 12.431540489196777,
+ 14.243208885192871,
+ 16.609176635742188,
+ 18.00058937072754
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004959268844686449,
+ 0.00020078590023331344,
+ 0.00015426705067511648,
+ 0.00010096926416736096,
+ 5.95865749346558e-05
+ ],
+ "bp_grad_F": [
+ 0.09663982689380646,
+ 0.036162860691547394,
+ 0.02716146595776081,
+ 0.01926880143582821,
+ 0.011334826238453388
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7783203125,
+ "loss_eval": 0.6707749366760254,
+ "epoch": 30
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5530469417572021,
+ 7.959159851074219,
+ 11.2805757522583,
+ 14.567391395568848,
+ 17.63263511657715
+ ],
+ "hidden_norms_avg": [
+ 4.583434581756592,
+ 11.983453750610352,
+ 13.4386625289917,
+ 15.498583793640137,
+ 16.631824493408203
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005142099689692259,
+ 0.00020230942755006254,
+ 0.00015552931290585548,
+ 0.00011007695866283029,
+ 6.233472959138453e-05
+ ],
+ "bp_grad_F": [
+ 0.09787525236606598,
+ 0.037690743803977966,
+ 0.028980012983083725,
+ 0.02064511366188526,
+ 0.012224731035530567
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7763671875,
+ "loss_eval": 0.6748013496398926,
+ "epoch": 31
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5515272617340088,
+ 7.847743988037109,
+ 10.868992805480957,
+ 14.282126426696777,
+ 17.300424575805664
+ ],
+ "hidden_norms_avg": [
+ 4.579150199890137,
+ 11.951078414916992,
+ 13.621748924255371,
+ 15.971713066101074,
+ 17.04889488220215
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004585929855238646,
+ 0.00017806614050641656,
+ 0.0001380510366288945,
+ 9.63187703746371e-05,
+ 5.829996371176094e-05
+ ],
+ "bp_grad_F": [
+ 0.10181005299091339,
+ 0.038575656712055206,
+ 0.02964734099805355,
+ 0.020979750901460648,
+ 0.01240287534892559
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.78125,
+ "loss_eval": 0.648021936416626,
+ "epoch": 32
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5606788396835327,
+ 7.502675533294678,
+ 10.430459022521973,
+ 13.642136573791504,
+ 16.445953369140625
+ ],
+ "hidden_norms_avg": [
+ 4.601283550262451,
+ 11.615697860717773,
+ 13.472222328186035,
+ 15.831238746643066,
+ 16.856765747070312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004074577009305358,
+ 0.00017814920283854008,
+ 0.00013730341743212193,
+ 9.565176151227206e-05,
+ 5.229458474786952e-05
+ ],
+ "bp_grad_F": [
+ 0.11506060510873795,
+ 0.04695325344800949,
+ 0.03571247681975365,
+ 0.025198202580213547,
+ 0.013851121068000793
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.755859375,
+ "loss_eval": 0.7299192547798157,
+ "epoch": 33
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5404834747314453,
+ 7.528626441955566,
+ 10.384718894958496,
+ 13.326257705688477,
+ 16.41958999633789
+ ],
+ "hidden_norms_avg": [
+ 4.533090591430664,
+ 11.6575345993042,
+ 13.231060028076172,
+ 15.337231636047363,
+ 16.463298797607422
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00042279696208424866,
+ 0.00016955600585788488,
+ 0.00012915951083414257,
+ 8.976108074421063e-05,
+ 4.930083014187403e-05
+ ],
+ "bp_grad_F": [
+ 0.11639728397130966,
+ 0.047109171748161316,
+ 0.03660130873322487,
+ 0.02588750049471855,
+ 0.013930009678006172
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.7065586447715759,
+ "epoch": 34
+ },
+ {
+ "hidden_norms_cls": [
+ 1.539638638496399,
+ 7.26485013961792,
+ 9.96584701538086,
+ 13.003418922424316,
+ 16.14008140563965
+ ],
+ "hidden_norms_avg": [
+ 4.537028789520264,
+ 11.146146774291992,
+ 12.836923599243164,
+ 14.992585182189941,
+ 16.076574325561523
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00039646061486564577,
+ 0.00017108044994529337,
+ 0.00013601842510979623,
+ 9.225023677572608e-05,
+ 4.893271398032084e-05
+ ],
+ "bp_grad_F": [
+ 0.11648086458444595,
+ 0.04862738400697708,
+ 0.0374443456530571,
+ 0.026762915775179863,
+ 0.014388044364750385
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7939453125,
+ "loss_eval": 0.6772804260253906,
+ "epoch": 35
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5278778076171875,
+ 7.107171058654785,
+ 9.836174011230469,
+ 12.691095352172852,
+ 15.726043701171875
+ ],
+ "hidden_norms_avg": [
+ 4.5205254554748535,
+ 10.983088493347168,
+ 12.684239387512207,
+ 14.876561164855957,
+ 15.817031860351562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003774319775402546,
+ 0.00015706375415902585,
+ 0.0001264828024432063,
+ 8.857168722897768e-05,
+ 4.440043630893342e-05
+ ],
+ "bp_grad_F": [
+ 0.12492093443870544,
+ 0.053397826850414276,
+ 0.040937285870313644,
+ 0.029012493789196014,
+ 0.015446576289832592
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7724609375,
+ "loss_eval": 0.707297146320343,
+ "epoch": 36
+ },
+ {
+ "hidden_norms_cls": [
+ 1.51571524143219,
+ 7.153889179229736,
+ 9.856640815734863,
+ 12.511648178100586,
+ 15.47674560546875
+ ],
+ "hidden_norms_avg": [
+ 4.51829719543457,
+ 10.948126792907715,
+ 12.496319770812988,
+ 14.353506088256836,
+ 15.267280578613281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003654273459687829,
+ 0.00015038737910799682,
+ 0.00011584001913433895,
+ 8.340556814800948e-05,
+ 4.3377422116464004e-05
+ ],
+ "bp_grad_F": [
+ 0.13914552330970764,
+ 0.0589178130030632,
+ 0.04522731155157089,
+ 0.0323280394077301,
+ 0.016300896182656288
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7626953125,
+ "loss_eval": 0.729290246963501,
+ "epoch": 37
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5081822872161865,
+ 6.952159404754639,
+ 9.558011054992676,
+ 12.107258796691895,
+ 15.05250358581543
+ ],
+ "hidden_norms_avg": [
+ 4.481203556060791,
+ 10.740157127380371,
+ 12.00869083404541,
+ 13.831336975097656,
+ 14.76778507232666
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003083393967244774,
+ 0.00012594371219165623,
+ 0.00010108885180670768,
+ 7.270355854416266e-05,
+ 3.639453643700108e-05
+ ],
+ "bp_grad_F": [
+ 0.14465992152690887,
+ 0.061646901071071625,
+ 0.047660429030656815,
+ 0.03381076827645302,
+ 0.01706051267683506
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7685546875,
+ "loss_eval": 0.7395438551902771,
+ "epoch": 38
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5159180164337158,
+ 6.878056526184082,
+ 9.382442474365234,
+ 11.969950675964355,
+ 15.129233360290527
+ ],
+ "hidden_norms_avg": [
+ 4.494526386260986,
+ 10.639691352844238,
+ 12.291059494018555,
+ 14.28632640838623,
+ 15.170000076293945
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028951463173143566,
+ 0.00012502263416536152,
+ 0.00010040518827736378,
+ 7.046512473607436e-05,
+ 3.719307642313652e-05
+ ],
+ "bp_grad_F": [
+ 0.1406005620956421,
+ 0.06109313294291496,
+ 0.047722309827804565,
+ 0.033977217972278595,
+ 0.01711316779255867
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7802734375,
+ "loss_eval": 0.7057114839553833,
+ "epoch": 39
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5058479309082031,
+ 6.699619770050049,
+ 9.136896133422852,
+ 11.609856605529785,
+ 14.701480865478516
+ ],
+ "hidden_norms_avg": [
+ 4.482093811035156,
+ 10.446189880371094,
+ 12.056195259094238,
+ 13.87569522857666,
+ 14.783234596252441
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002856751380022615,
+ 0.00013275284436531365,
+ 0.00010139105870621279,
+ 6.966136425035074e-05,
+ 3.293903864687309e-05
+ ],
+ "bp_grad_F": [
+ 0.1529398262500763,
+ 0.06890096515417099,
+ 0.052683208137750626,
+ 0.03734185919165611,
+ 0.01789216138422489
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.7478293180465698,
+ "epoch": 40
+ },
+ {
+ "hidden_norms_cls": [
+ 1.490049123764038,
+ 6.627772331237793,
+ 9.019189834594727,
+ 11.385313987731934,
+ 14.173355102539062
+ ],
+ "hidden_norms_avg": [
+ 4.458098411560059,
+ 10.279450416564941,
+ 11.593936920166016,
+ 13.30923080444336,
+ 14.155406951904297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00021343027765396982,
+ 9.837630932452157e-05,
+ 8.006956340977922e-05,
+ 5.6768003560137004e-05,
+ 2.7385456633055583e-05
+ ],
+ "bp_grad_F": [
+ 0.15772707760334015,
+ 0.07120667397975922,
+ 0.05564703419804573,
+ 0.03953033685684204,
+ 0.018776116892695427
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7724609375,
+ "loss_eval": 0.7677009105682373,
+ "epoch": 41
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4904595613479614,
+ 6.347933769226074,
+ 8.674281120300293,
+ 11.007567405700684,
+ 14.106690406799316
+ ],
+ "hidden_norms_avg": [
+ 4.430132865905762,
+ 10.265702247619629,
+ 11.588266372680664,
+ 13.410375595092773,
+ 14.36179256439209
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002224426862085238,
+ 0.00010000570182455704,
+ 7.794459816068411e-05,
+ 5.595289985649288e-05,
+ 2.7256841349299066e-05
+ ],
+ "bp_grad_F": [
+ 0.16928334534168243,
+ 0.07747916132211685,
+ 0.06056727096438408,
+ 0.04274875670671463,
+ 0.019731448963284492
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.771484375,
+ "loss_eval": 0.7774850726127625,
+ "epoch": 42
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4839239120483398,
+ 6.341518878936768,
+ 8.600671768188477,
+ 10.991724014282227,
+ 14.061833381652832
+ ],
+ "hidden_norms_avg": [
+ 4.403061866760254,
+ 10.020040512084961,
+ 11.371668815612793,
+ 13.18271255493164,
+ 14.007345199584961
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002152575325453654,
+ 0.00010309015488019213,
+ 7.964189717313275e-05,
+ 5.283725113258697e-05,
+ 2.479495196894277e-05
+ ],
+ "bp_grad_F": [
+ 0.17190901935100555,
+ 0.080362468957901,
+ 0.06201368197798729,
+ 0.042563296854496,
+ 0.019763268530368805
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.791015625,
+ "loss_eval": 0.7503129243850708,
+ "epoch": 43
+ },
+ {
+ "hidden_norms_cls": [
+ 1.479953408241272,
+ 6.386821269989014,
+ 8.521474838256836,
+ 10.847907066345215,
+ 13.541037559509277
+ ],
+ "hidden_norms_avg": [
+ 4.399942874908447,
+ 9.979388236999512,
+ 11.251038551330566,
+ 12.998858451843262,
+ 13.76570987701416
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000195752116269432,
+ 9.365259029436857e-05,
+ 7.282401929842308e-05,
+ 5.209222945268266e-05,
+ 2.3047552531352267e-05
+ ],
+ "bp_grad_F": [
+ 0.16316288709640503,
+ 0.07674747705459595,
+ 0.06052006781101227,
+ 0.04277755320072174,
+ 0.020131859928369522
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7978515625,
+ "loss_eval": 0.732360303401947,
+ "epoch": 44
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4770045280456543,
+ 6.249807834625244,
+ 8.36440658569336,
+ 10.429434776306152,
+ 13.045490264892578
+ ],
+ "hidden_norms_avg": [
+ 4.391754627227783,
+ 9.821492195129395,
+ 10.789708137512207,
+ 12.3140869140625,
+ 13.067754745483398
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002329840644961223,
+ 0.00011798225023085251,
+ 9.261347440769896e-05,
+ 6.294570630416274e-05,
+ 2.9543562050093897e-05
+ ],
+ "bp_grad_F": [
+ 0.1812749058008194,
+ 0.08621949702501297,
+ 0.067754827439785,
+ 0.04831995815038681,
+ 0.021977350115776062
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.7784227132797241,
+ "epoch": 45
+ },
+ {
+ "hidden_norms_cls": [
+ 1.467228651046753,
+ 6.0983357429504395,
+ 8.231528282165527,
+ 10.333056449890137,
+ 13.266757011413574
+ ],
+ "hidden_norms_avg": [
+ 4.390368461608887,
+ 9.647501945495605,
+ 10.692501068115234,
+ 12.274677276611328,
+ 13.044783592224121
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001511751615907997,
+ 7.784536137478426e-05,
+ 6.136627780506387e-05,
+ 4.35807196481619e-05,
+ 2.014869824051857e-05
+ ],
+ "bp_grad_F": [
+ 0.18805110454559326,
+ 0.09124159067869186,
+ 0.07224944978952408,
+ 0.050726212561130524,
+ 0.02254536561667919
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.814141571521759,
+ "epoch": 46
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4649879932403564,
+ 6.082813739776611,
+ 8.131811141967773,
+ 10.158056259155273,
+ 13.049956321716309
+ ],
+ "hidden_norms_avg": [
+ 4.377193927764893,
+ 9.599099159240723,
+ 10.660999298095703,
+ 12.21728801727295,
+ 12.965741157531738
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001712174853309989,
+ 8.400671504205093e-05,
+ 6.461612792918459e-05,
+ 4.6120971092022955e-05,
+ 2.0111323465243913e-05
+ ],
+ "bp_grad_F": [
+ 0.19550266861915588,
+ 0.09418290108442307,
+ 0.07462290674448013,
+ 0.053083814680576324,
+ 0.02292729914188385
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7890625,
+ "loss_eval": 0.7999259233474731,
+ "epoch": 47
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4617111682891846,
+ 6.058816432952881,
+ 8.100686073303223,
+ 10.085453987121582,
+ 12.920005798339844
+ ],
+ "hidden_norms_avg": [
+ 4.367196559906006,
+ 9.56169605255127,
+ 10.609153747558594,
+ 12.135587692260742,
+ 12.871316909790039
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015642307698726654,
+ 7.727487536612898e-05,
+ 5.90925665164832e-05,
+ 4.136386633035727e-05,
+ 1.6983105524559505e-05
+ ],
+ "bp_grad_F": [
+ 0.202835351228714,
+ 0.09727983921766281,
+ 0.07683655619621277,
+ 0.05471916124224663,
+ 0.02326873689889908
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.783203125,
+ "loss_eval": 0.8152254223823547,
+ "epoch": 48
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4593255519866943,
+ 6.017489433288574,
+ 7.96034049987793,
+ 9.983046531677246,
+ 12.839889526367188
+ ],
+ "hidden_norms_avg": [
+ 4.349035739898682,
+ 9.508291244506836,
+ 10.475739479064941,
+ 12.025425910949707,
+ 12.764323234558105
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00013039771874900907,
+ 6.479993317043409e-05,
+ 5.060105831944384e-05,
+ 3.637294139480218e-05,
+ 1.4738084246346261e-05
+ ],
+ "bp_grad_F": [
+ 0.2170599102973938,
+ 0.10417382419109344,
+ 0.08229079097509384,
+ 0.05735529586672783,
+ 0.024290865287184715
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7841796875,
+ "loss_eval": 0.8357614278793335,
+ "epoch": 49
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4566220045089722,
+ 5.9422221183776855,
+ 7.888944149017334,
+ 9.933752059936523,
+ 12.817610740661621
+ ],
+ "hidden_norms_avg": [
+ 4.346043109893799,
+ 9.43443489074707,
+ 10.415618896484375,
+ 11.964469909667969,
+ 12.66396713256836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00011193535465281457,
+ 5.694849824067205e-05,
+ 4.533635365078226e-05,
+ 3.3492226066300645e-05,
+ 1.4018894034961704e-05
+ ],
+ "bp_grad_F": [
+ 0.21774698793888092,
+ 0.1065358892083168,
+ 0.08431421220302582,
+ 0.05883141607046127,
+ 0.024615641683340073
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.8349668979644775,
+ "epoch": 50
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4569600820541382,
+ 5.859008312225342,
+ 7.792572498321533,
+ 9.738831520080566,
+ 12.622002601623535
+ ],
+ "hidden_norms_avg": [
+ 4.331563472747803,
+ 9.398598670959473,
+ 10.273933410644531,
+ 11.764141082763672,
+ 12.436033248901367
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00012003595475107431,
+ 5.908689126954414e-05,
+ 4.746428385260515e-05,
+ 3.251975431339815e-05,
+ 1.3768915778200608e-05
+ ],
+ "bp_grad_F": [
+ 0.2144007831811905,
+ 0.10626016557216644,
+ 0.08404342085123062,
+ 0.05926896259188652,
+ 0.024889416992664337
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7861328125,
+ "loss_eval": 0.840790331363678,
+ "epoch": 51
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4559087753295898,
+ 5.8081440925598145,
+ 7.735576629638672,
+ 9.665096282958984,
+ 12.462581634521484
+ ],
+ "hidden_norms_avg": [
+ 4.331978797912598,
+ 9.35647964477539,
+ 10.206826210021973,
+ 11.663065910339355,
+ 12.307528495788574
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010101464431500062,
+ 5.143512680660933e-05,
+ 4.1592236811993644e-05,
+ 3.0060553399380296e-05,
+ 1.2701412742899265e-05
+ ],
+ "bp_grad_F": [
+ 0.22189198434352875,
+ 0.11008423566818237,
+ 0.08644267171621323,
+ 0.0603644996881485,
+ 0.025003522634506226
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7900390625,
+ "loss_eval": 0.8574135303497314,
+ "epoch": 52
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4537159204483032,
+ 5.80010461807251,
+ 7.719310760498047,
+ 9.681657791137695,
+ 12.724189758300781
+ ],
+ "hidden_norms_avg": [
+ 4.318180084228516,
+ 9.302933692932129,
+ 10.182857513427734,
+ 11.675416946411133,
+ 12.381869316101074
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.399914415553212e-05,
+ 4.920759965898469e-05,
+ 3.82029902539216e-05,
+ 2.4410484911641106e-05,
+ 9.912354471453e-06
+ ],
+ "bp_grad_F": [
+ 0.2312120646238327,
+ 0.11490234732627869,
+ 0.09031722694635391,
+ 0.06280362606048584,
+ 0.02546737529337406
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7900390625,
+ "loss_eval": 0.8825892210006714,
+ "epoch": 53
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4533940553665161,
+ 5.765341758728027,
+ 7.664762496948242,
+ 9.541180610656738,
+ 12.46136474609375
+ ],
+ "hidden_norms_avg": [
+ 4.321633815765381,
+ 9.284127235412598,
+ 10.135884284973145,
+ 11.603636741638184,
+ 12.27259635925293
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010168847802560776,
+ 5.239037636783905e-05,
+ 4.169415478827432e-05,
+ 2.8813867174903862e-05,
+ 1.1632122550508939e-05
+ ],
+ "bp_grad_F": [
+ 0.23138603568077087,
+ 0.11581514030694962,
+ 0.09145721793174744,
+ 0.06368965655565262,
+ 0.025816213339567184
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7900390625,
+ "loss_eval": 0.8627672791481018,
+ "epoch": 54
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4520151615142822,
+ 5.752710342407227,
+ 7.6372294425964355,
+ 9.493330001831055,
+ 12.49281120300293
+ ],
+ "hidden_norms_avg": [
+ 4.314420223236084,
+ 9.275971412658691,
+ 10.131872177124023,
+ 11.594268798828125,
+ 12.271230697631836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010349372314522043,
+ 5.0890805141534656e-05,
+ 4.167861698078923e-05,
+ 2.9301188988029025e-05,
+ 1.1288396308373194e-05
+ ],
+ "bp_grad_F": [
+ 0.23472057282924652,
+ 0.11708012968301773,
+ 0.09245092421770096,
+ 0.06478185206651688,
+ 0.025885937735438347
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.791015625,
+ "loss_eval": 0.8611111640930176,
+ "epoch": 55
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4508332014083862,
+ 5.741517066955566,
+ 7.59091329574585,
+ 9.493820190429688,
+ 12.553393363952637
+ ],
+ "hidden_norms_avg": [
+ 4.315334320068359,
+ 9.272273063659668,
+ 10.107754707336426,
+ 11.5936279296875,
+ 12.266173362731934
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.209421114064753e-05,
+ 4.9557409511180595e-05,
+ 3.8665639294777066e-05,
+ 2.703870450204704e-05,
+ 1.0333649697713554e-05
+ ],
+ "bp_grad_F": [
+ 0.23745231330394745,
+ 0.11897031217813492,
+ 0.09419847279787064,
+ 0.06559450179338455,
+ 0.02597379870712757
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.794921875,
+ "loss_eval": 0.8737660646438599,
+ "epoch": 56
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4514665603637695,
+ 5.724127292633057,
+ 7.567911624908447,
+ 9.464110374450684,
+ 12.53247356414795
+ ],
+ "hidden_norms_avg": [
+ 4.312892436981201,
+ 9.258728981018066,
+ 10.092171669006348,
+ 11.559837341308594,
+ 12.241935729980469
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.842872193781659e-05,
+ 4.636628364096396e-05,
+ 3.5660887078847736e-05,
+ 2.4343042241525836e-05,
+ 9.563225830788724e-06
+ ],
+ "bp_grad_F": [
+ 0.23917540907859802,
+ 0.12006859481334686,
+ 0.09492167085409164,
+ 0.06607519090175629,
+ 0.02614584006369114
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7939453125,
+ "loss_eval": 0.8743407130241394,
+ "epoch": 57
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4513946771621704,
+ 5.7332282066345215,
+ 7.562880992889404,
+ 9.466405868530273,
+ 12.53167724609375
+ ],
+ "hidden_norms_avg": [
+ 4.3138651847839355,
+ 9.26041316986084,
+ 10.077324867248535,
+ 11.538521766662598,
+ 12.218836784362793
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.282731480197981e-05,
+ 4.6137181925587356e-05,
+ 3.7237725337035954e-05,
+ 2.553310514485929e-05,
+ 9.964967830455862e-06
+ ],
+ "bp_grad_F": [
+ 0.24150457978248596,
+ 0.12129233777523041,
+ 0.09592130035161972,
+ 0.06674522906541824,
+ 0.026258554309606552
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7890625,
+ "loss_eval": 0.8750766515731812,
+ "epoch": 58
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4510550498962402,
+ 5.730595111846924,
+ 7.558650493621826,
+ 9.460441589355469,
+ 12.49626636505127
+ ],
+ "hidden_norms_avg": [
+ 4.311552047729492,
+ 9.2510347366333,
+ 10.070302963256836,
+ 11.530484199523926,
+ 12.212501525878906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.91910312930122e-05,
+ 4.6800774725852534e-05,
+ 3.584511432563886e-05,
+ 2.5313198420917615e-05,
+ 9.680608854978345e-06
+ ],
+ "bp_grad_F": [
+ 0.24175073206424713,
+ 0.12143565714359283,
+ 0.09590216726064682,
+ 0.06680992990732193,
+ 0.026268428191542625
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.787109375,
+ "loss_eval": 0.8746636509895325,
+ "epoch": 59
+ },
+ {
+ "hidden_norms_cls": [
+ 1.450972557067871,
+ 5.727794647216797,
+ 7.5582756996154785,
+ 9.462045669555664,
+ 12.50033187866211
+ ],
+ "hidden_norms_avg": [
+ 4.311238765716553,
+ 9.248146057128906,
+ 10.065601348876953,
+ 11.523144721984863,
+ 12.206249237060547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 8.883981354301795e-05,
+ 4.730010550701991e-05,
+ 3.57187855115626e-05,
+ 2.4922017473727465e-05,
+ 9.98118775896728e-06
+ ],
+ "bp_grad_F": [
+ 0.24178682267665863,
+ 0.12154776602983475,
+ 0.09598654508590698,
+ 0.06685590744018555,
+ 0.026261666789650917
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.787109375,
+ "loss_eval": 0.8750864863395691,
+ "epoch": 60
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms_cls": [
+ 0.3210873007774353,
+ 3.3568029403686523,
+ 4.891699314117432,
+ 6.200707912445068,
+ 7.5911865234375
+ ],
+ "hidden_norms_avg": [
+ 5.7549052238464355,
+ 6.750590801239014,
+ 7.9020819664001465,
+ 8.925304412841797,
+ 10.076716423034668
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.004074312746524811,
+ 0.0011155740357935429,
+ 0.0009667170234024525,
+ 0.0008621186716482043,
+ 0.0008127145702019334
+ ],
+ "bp_grad_F": [
+ 0.20160320401191711,
+ 0.039521340280771255,
+ 0.033098917454481125,
+ 0.029271923005580902,
+ 0.027136052027344704
+ ],
+ "gamma_dfa": 0.0011031709145754576,
+ "gamma_dfa_per_layer": [
+ -0.004096934571862221,
+ -0.003170878393575549,
+ 0.003171987598761916,
+ 0.008508509024977684
+ ],
+ "acc_eval": 0.125,
+ "loss_eval": 2.422111988067627,
+ "epoch": 0
+ },
+ {
+ "hidden_norms_cls": [
+ 1.7445409297943115,
+ 3393.872314453125,
+ 8096.7275390625,
+ 11786.4453125,
+ 15317.9609375
+ ],
+ "hidden_norms_avg": [
+ 46.059967041015625,
+ 2908.78857421875,
+ 9192.9140625,
+ 12480.814453125,
+ 15843.904296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007700070273131132,
+ 5.177932962396881e-07,
+ 4.354141651674581e-07,
+ 4.0796010125632165e-07,
+ 4.096184795798763e-07
+ ],
+ "bp_grad_F": [
+ 0.14847944676876068,
+ 7.175570499384776e-05,
+ 1.7355905583826825e-05,
+ 1.4375820683198981e-05,
+ 1.4468741937889718e-05
+ ],
+ "gamma_dfa": 0.00903075491078198,
+ "gamma_dfa_per_layer": [
+ 0.014700280502438545,
+ 0.007455145940184593,
+ 0.009132559411227703,
+ 0.004835033789277077
+ ],
+ "acc_eval": 0.2158203125,
+ "loss_eval": 2.072723388671875,
+ "epoch": 1
+ },
+ {
+ "hidden_norms_cls": [
+ 3.5329439640045166,
+ 17943.025390625,
+ 46227.09765625,
+ 60098.9921875,
+ 105510.8828125
+ ],
+ "hidden_norms_avg": [
+ 95.54289245605469,
+ 14775.4267578125,
+ 44856.01953125,
+ 59234.35546875,
+ 87862.078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00029628784977830946,
+ 1.0676165373979529e-07,
+ 7.34040170868866e-08,
+ 6.658416396021494e-08,
+ 6.750254044618487e-08
+ ],
+ "bp_grad_F": [
+ 0.12055971473455429,
+ 8.933278149925172e-05,
+ 3.910079612978734e-06,
+ 3.3086737403209554e-06,
+ 3.354543650857522e-06
+ ],
+ "gamma_dfa": 0.007886230800068006,
+ "gamma_dfa_per_layer": [
+ 0.016902755945920944,
+ 0.003473796183243394,
+ 0.009775697253644466,
+ 0.0013926738174632192
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 2.0924925804138184,
+ "epoch": 2
+ },
+ {
+ "hidden_norms_cls": [
+ 5.165565013885498,
+ 33863.33203125,
+ 93132.8515625,
+ 145828.34375,
+ 276496.0
+ ],
+ "hidden_norms_avg": [
+ 142.7160186767578,
+ 36882.9296875,
+ 93356.96875,
+ 138199.0625,
+ 216913.359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00022745825117453933,
+ 4.267175768291054e-08,
+ 3.181965624321492e-08,
+ 2.8314032007870082e-08,
+ 2.8843814448009653e-08
+ ],
+ "bp_grad_F": [
+ 0.06954267621040344,
+ 0.00012680335203185678,
+ 2.0300262804084923e-06,
+ 1.8529049157223199e-06,
+ 1.8672349142434541e-06
+ ],
+ "gamma_dfa": 0.00556139531545341,
+ "gamma_dfa_per_layer": [
+ 0.01000538095831871,
+ 0.0014471756294369698,
+ 0.011906315572559834,
+ -0.001113290898501873
+ ],
+ "acc_eval": 0.2412109375,
+ "loss_eval": 2.0521552562713623,
+ "epoch": 3
+ },
+ {
+ "hidden_norms_cls": [
+ 6.674264907836914,
+ 43835.6796875,
+ 150229.609375,
+ 253133.515625,
+ 481876.5
+ ],
+ "hidden_norms_avg": [
+ 186.87832641601562,
+ 74412.015625,
+ 150159.890625,
+ 253252.734375,
+ 439077.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003350951592437923,
+ 2.7693221937852286e-08,
+ 1.989219278186738e-08,
+ 1.704596108709211e-08,
+ 1.7547710839949104e-08
+ ],
+ "bp_grad_F": [
+ 0.058595605194568634,
+ 0.0002476655936334282,
+ 1.0984595064655878e-06,
+ 1.0368654557169066e-06,
+ 1.0405622106191004e-06
+ ],
+ "gamma_dfa": 0.002481349220033735,
+ "gamma_dfa_per_layer": [
+ 3.730843309313059e-05,
+ 0.0014904557028785348,
+ 0.011494583450257778,
+ -0.0030969507060945034
+ ],
+ "acc_eval": 0.232421875,
+ "loss_eval": 2.058844566345215,
+ "epoch": 4
+ },
+ {
+ "hidden_norms_cls": [
+ 8.061405181884766,
+ 102865.78125,
+ 229004.390625,
+ 413580.59375,
+ 706253.625
+ ],
+ "hidden_norms_avg": [
+ 228.99224853515625,
+ 131342.546875,
+ 229257.390625,
+ 410435.25,
+ 727001.6875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00029934433405287564,
+ 1.670629679040303e-08,
+ 1.3200744497510186e-08,
+ 1.1068386207568892e-08,
+ 1.1248447506773118e-08
+ ],
+ "bp_grad_F": [
+ 0.49810686707496643,
+ 0.0004038630868308246,
+ 1.391591922583757e-06,
+ 6.11680206930032e-07,
+ 5.242948759587307e-07
+ ],
+ "gamma_dfa": 0.0009187236428260803,
+ "gamma_dfa_per_layer": [
+ -0.003027769736945629,
+ 0.002294017933309078,
+ 0.00904145184904337,
+ -0.004632805474102497
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 2.091141700744629,
+ "epoch": 5
+ },
+ {
+ "hidden_norms_cls": [
+ 9.400635719299316,
+ 164205.859375,
+ 302756.3125,
+ 584338.25,
+ 1250749.125
+ ],
+ "hidden_norms_avg": [
+ 270.8563232421875,
+ 190832.34375,
+ 307117.59375,
+ 620500.3125,
+ 1149191.375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00034470504033379257,
+ 1.3897826889319731e-08,
+ 8.662226491651381e-09,
+ 6.850678690994982e-09,
+ 7.0105756755367565e-09
+ ],
+ "bp_grad_F": [
+ 0.08854538202285767,
+ 0.0002125167811755091,
+ 3.9876397295302013e-07,
+ 2.9177280680414697e-07,
+ 2.903063318626664e-07
+ ],
+ "gamma_dfa": 0.0008902656263671815,
+ "gamma_dfa_per_layer": [
+ -0.004116768017411232,
+ 0.004187953192740679,
+ 0.007109872996807098,
+ -0.003619995666667819
+ ],
+ "acc_eval": 0.208984375,
+ "loss_eval": 2.09378981590271,
+ "epoch": 6
+ },
+ {
+ "hidden_norms_cls": [
+ 10.676177978515625,
+ 216327.671875,
+ 429372.28125,
+ 910110.1875,
+ 1955787.375
+ ],
+ "hidden_norms_avg": [
+ 311.3556823730469,
+ 279124.65625,
+ 434169.5,
+ 917506.125,
+ 1714750.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002802011731546372,
+ 8.183582700382885e-09,
+ 5.617039278149605e-09,
+ 4.765932093420133e-09,
+ 4.884364024348997e-09
+ ],
+ "bp_grad_F": [
+ 0.2021757811307907,
+ 0.00017153903900180012,
+ 2.627296851187566e-07,
+ 1.9583571031489555e-07,
+ 1.9719628596703842e-07
+ ],
+ "gamma_dfa": 0.00245969754178077,
+ "gamma_dfa_per_layer": [
+ 0.0030665153171867132,
+ 0.0039703575894236565,
+ 0.005591260269284248,
+ -0.0027893430087715387
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 2.0816030502319336,
+ "epoch": 7
+ },
+ {
+ "hidden_norms_cls": [
+ 11.970849990844727,
+ 282019.0,
+ 553729.25,
+ 1250316.5,
+ 2676136.75
+ ],
+ "hidden_norms_avg": [
+ 350.0874938964844,
+ 367917.96875,
+ 563719.125,
+ 1231394.75,
+ 2379567.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015754146443214267,
+ 7.837374305097455e-09,
+ 4.1749870227647534e-09,
+ 3.572480755664742e-09,
+ 3.6429026462059255e-09
+ ],
+ "bp_grad_F": [
+ 0.06816119700670242,
+ 0.0002165154874091968,
+ 1.8739321205885062e-07,
+ 1.4396131575722393e-07,
+ 1.449055417879208e-07
+ ],
+ "gamma_dfa": 0.0018902571755461395,
+ "gamma_dfa_per_layer": [
+ 0.0010774387046694756,
+ 0.004019944928586483,
+ 0.004736708011478186,
+ -0.0022730629425495863
+ ],
+ "acc_eval": 0.2236328125,
+ "loss_eval": 2.069587469100952,
+ "epoch": 8
+ },
+ {
+ "hidden_norms_cls": [
+ 13.234355926513672,
+ 498576.65625,
+ 747356.3125,
+ 1569417.0,
+ 3492356.0
+ ],
+ "hidden_norms_avg": [
+ 390.34356689453125,
+ 517596.5,
+ 755798.625,
+ 1559863.25,
+ 3087860.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00012954612611792982,
+ 6.955718223622398e-09,
+ 3.3238092278509157e-09,
+ 2.7362234700234467e-09,
+ 2.7891511322764018e-09
+ ],
+ "bp_grad_F": [
+ 0.03943011909723282,
+ 0.00019621588580776006,
+ 1.9796995331944345e-07,
+ 1.1484767270530938e-07,
+ 1.1313876058238748e-07
+ ],
+ "gamma_dfa": 0.002013051969697699,
+ "gamma_dfa_per_layer": [
+ 0.0007974229520186782,
+ 0.0045172227546572685,
+ 0.004162413999438286,
+ -0.0014248518273234367
+ ],
+ "acc_eval": 0.21484375,
+ "loss_eval": 2.0846829414367676,
+ "epoch": 9
+ },
+ {
+ "hidden_norms_cls": [
+ 14.412362098693848,
+ 653898.875,
+ 962527.9375,
+ 1974772.75,
+ 4235229.0
+ ],
+ "hidden_norms_avg": [
+ 426.1747741699219,
+ 660897.75,
+ 954217.625,
+ 1992937.5,
+ 3912584.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001297950657317415,
+ 8.463428180505161e-09,
+ 2.735849546908753e-09,
+ 2.2942541200166033e-09,
+ 2.329255233135541e-09
+ ],
+ "bp_grad_F": [
+ 0.07335253059864044,
+ 0.0002778704511001706,
+ 2.1924184068211616e-07,
+ 1.5885484572208952e-07,
+ 9.551467172741468e-08
+ ],
+ "gamma_dfa": 0.001994484744500369,
+ "gamma_dfa_per_layer": [
+ 0.0028600264340639114,
+ 0.0031631651800125837,
+ 0.0033731083385646343,
+ -0.0014183609746396542
+ ],
+ "acc_eval": 0.2373046875,
+ "loss_eval": 2.0768301486968994,
+ "epoch": 10
+ },
+ {
+ "hidden_norms_cls": [
+ 15.627301216125488,
+ 805321.625,
+ 1191654.25,
+ 2375967.75,
+ 5068243.5
+ ],
+ "hidden_norms_avg": [
+ 464.92144775390625,
+ 870169.75,
+ 1209570.75,
+ 2342305.5,
+ 4797491.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014358766202349216,
+ 6.655038742309216e-09,
+ 2.213497385383789e-09,
+ 1.8578552030135143e-09,
+ 1.8845198734851465e-09
+ ],
+ "bp_grad_F": [
+ 0.22341646254062653,
+ 0.0010545816039666533,
+ 3.022053363110899e-07,
+ 8.581165644727662e-08,
+ 7.942276880612553e-08
+ ],
+ "gamma_dfa": 0.0012935771082993597,
+ "gamma_dfa_per_layer": [
+ -0.00014482985716313124,
+ 0.0035164642613381147,
+ 0.002910400740802288,
+ -0.0011077267117798328
+ ],
+ "acc_eval": 0.2138671875,
+ "loss_eval": 2.076242446899414,
+ "epoch": 11
+ },
+ {
+ "hidden_norms_cls": [
+ 16.751590728759766,
+ 758638.375,
+ 1437438.0,
+ 2779040.25,
+ 5662257.0
+ ],
+ "hidden_norms_avg": [
+ 501.60235595703125,
+ 1119163.625,
+ 1513203.375,
+ 2677392.25,
+ 5339190.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00020390149438753724,
+ 5.5311413227343564e-09,
+ 1.8890189412701375e-09,
+ 1.6241474831701908e-09,
+ 1.6578916017806478e-09
+ ],
+ "bp_grad_F": [
+ 1.734735369682312,
+ 0.000374374445527792,
+ 1.2862761877840967e-07,
+ 1.1062630989044919e-07,
+ 6.887377423936414e-08
+ ],
+ "gamma_dfa": 0.0020944410644005984,
+ "gamma_dfa_per_layer": [
+ 0.0036250988487154245,
+ 0.0027163547929376364,
+ 0.0028407545760273933,
+ -0.0008044439600780606
+ ],
+ "acc_eval": 0.23046875,
+ "loss_eval": 2.083003520965576,
+ "epoch": 12
+ },
+ {
+ "hidden_norms_cls": [
+ 17.76032066345215,
+ 1093088.5,
+ 1739864.0,
+ 3080344.5,
+ 6632118.5
+ ],
+ "hidden_norms_avg": [
+ 539.1420288085938,
+ 1433551.75,
+ 1843404.125,
+ 3096921.75,
+ 6237853.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014031230239197612,
+ 4.252878937904825e-09,
+ 1.704668295410272e-09,
+ 1.518661418842271e-09,
+ 1.5263605934734414e-09
+ ],
+ "bp_grad_F": [
+ 0.05247655138373375,
+ 0.00048432740732096136,
+ 1.395327586806161e-07,
+ 8.375257465331742e-08,
+ 5.970760241780226e-08
+ ],
+ "gamma_dfa": 0.0018704376125242561,
+ "gamma_dfa_per_layer": [
+ 0.0021162822376936674,
+ 0.003257386852055788,
+ 0.002796958899125457,
+ -0.0006888775387778878
+ ],
+ "acc_eval": 0.2177734375,
+ "loss_eval": 2.1021971702575684,
+ "epoch": 13
+ },
+ {
+ "hidden_norms_cls": [
+ 18.760025024414062,
+ 2223954.75,
+ 2460609.0,
+ 3718541.25,
+ 7618764.0
+ ],
+ "hidden_norms_avg": [
+ 577.8324584960938,
+ 1908819.625,
+ 2348359.5,
+ 3542983.0,
+ 6779725.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010403544729342684,
+ 2.662567277766925e-09,
+ 1.6195218499603925e-09,
+ 1.422262307926303e-09,
+ 1.433551610752204e-09
+ ],
+ "bp_grad_F": [
+ 0.08673901855945587,
+ 0.0001567020226502791,
+ 8.41187173250546e-08,
+ 5.8843131256480774e-08,
+ 5.371895994699116e-08
+ ],
+ "gamma_dfa": 0.003976444830186665,
+ "gamma_dfa_per_layer": [
+ 0.010876781307160854,
+ 0.0029237696435302496,
+ 0.0026041539385914803,
+ -0.000498925568535924
+ ],
+ "acc_eval": 0.2177734375,
+ "loss_eval": 2.138009548187256,
+ "epoch": 14
+ },
+ {
+ "hidden_norms_cls": [
+ 19.738407135009766,
+ 2339586.0,
+ 2696652.5,
+ 4235438.5,
+ 7955372.0
+ ],
+ "hidden_norms_avg": [
+ 619.4888916015625,
+ 2243613.75,
+ 2801893.5,
+ 4018190.75,
+ 7143025.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014718857710249722,
+ 2.6654392026870255e-09,
+ 1.4668186665289795e-09,
+ 1.3113429231381701e-09,
+ 1.3212382299343517e-09
+ ],
+ "bp_grad_F": [
+ 0.1564428061246872,
+ 0.00024187436792999506,
+ 2.621962664761668e-07,
+ 5.580703898999673e-08,
+ 5.442945649747344e-08
+ ],
+ "gamma_dfa": 0.0019682426573126577,
+ "gamma_dfa_per_layer": [
+ 0.003052386222407222,
+ 0.0027148486115038395,
+ 0.0025699653197079897,
+ -0.00046422952436842024
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.145447254180908,
+ "epoch": 15
+ },
+ {
+ "hidden_norms_cls": [
+ 20.727081298828125,
+ 2753822.5,
+ 3114285.75,
+ 4713040.0,
+ 8652256.0
+ ],
+ "hidden_norms_avg": [
+ 660.8045654296875,
+ 2684893.0,
+ 3331407.5,
+ 4614215.5,
+ 7864381.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00013858993770554662,
+ 2.7730009399817845e-09,
+ 1.344458322449782e-09,
+ 1.2393497339502346e-09,
+ 1.2431760065823028e-09
+ ],
+ "bp_grad_F": [
+ 0.1324291080236435,
+ 0.00022225745487958193,
+ 9.285694346772289e-08,
+ 4.7669061586930184e-08,
+ 4.746264181676452e-08
+ ],
+ "gamma_dfa": 0.001855946145951748,
+ "gamma_dfa_per_layer": [
+ 0.004218719433993101,
+ 0.001718730665743351,
+ 0.0019668969325721264,
+ -0.0004805624485015869
+ ],
+ "acc_eval": 0.251953125,
+ "loss_eval": 2.101409673690796,
+ "epoch": 16
+ },
+ {
+ "hidden_norms_cls": [
+ 21.603151321411133,
+ 3877476.75,
+ 4156743.75,
+ 5474745.5,
+ 10299149.0
+ ],
+ "hidden_norms_avg": [
+ 698.7645263671875,
+ 3523264.5,
+ 4085091.75,
+ 5354783.0,
+ 9094561.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000199332891497761,
+ 1.9098649328697093e-09,
+ 1.2144363292776461e-09,
+ 1.1166952917918138e-09,
+ 1.1315383074972374e-09
+ ],
+ "bp_grad_F": [
+ 0.15142236649990082,
+ 4.2183397454209626e-05,
+ 7.309424887580462e-08,
+ 5.2962114693855256e-08,
+ 4.2337880756804225e-08
+ ],
+ "gamma_dfa": 0.0013709207050851546,
+ "gamma_dfa_per_layer": [
+ 0.0023175266105681658,
+ 0.0016730788629502058,
+ 0.0018372924532741308,
+ -0.0003442151064518839
+ ],
+ "acc_eval": 0.220703125,
+ "loss_eval": 2.1280713081359863,
+ "epoch": 17
+ },
+ {
+ "hidden_norms_cls": [
+ 22.48230743408203,
+ 3581296.5,
+ 4024996.25,
+ 6183271.0,
+ 11393130.0
+ ],
+ "hidden_norms_avg": [
+ 735.2485961914062,
+ 4017679.75,
+ 4751523.5,
+ 6215236.0,
+ 10366257.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00018803548300638795,
+ 1.895784862426808e-09,
+ 1.1237420993737146e-09,
+ 1.0378963244406236e-09,
+ 1.0573794062551656e-09
+ ],
+ "bp_grad_F": [
+ 0.12878409028053284,
+ 4.194497887510806e-05,
+ 4.941083631138099e-08,
+ 3.9714532107382183e-08,
+ 3.994472663748638e-08
+ ],
+ "gamma_dfa": 0.0012161588310846128,
+ "gamma_dfa_per_layer": [
+ 0.0021385664585977793,
+ 0.0015012789517641068,
+ 0.0016565187834203243,
+ -0.0004317288694437593
+ ],
+ "acc_eval": 0.2158203125,
+ "loss_eval": 2.1137895584106445,
+ "epoch": 18
+ },
+ {
+ "hidden_norms_cls": [
+ 23.29258155822754,
+ 4616424.5,
+ 5061994.0,
+ 6831782.5,
+ 12437102.0
+ ],
+ "hidden_norms_avg": [
+ 768.5599975585938,
+ 4586839.5,
+ 5567332.5,
+ 6953557.0,
+ 11342041.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00021542877948377281,
+ 1.9688994878919175e-09,
+ 1.0831572305747272e-09,
+ 9.59386015075836e-10,
+ 9.76972058808201e-10
+ ],
+ "bp_grad_F": [
+ 0.09346769750118256,
+ 4.979455843567848e-05,
+ 4.6927411290198506e-08,
+ 3.8312244043936516e-08,
+ 3.882623289541698e-08
+ ],
+ "gamma_dfa": 0.0011904535058420151,
+ "gamma_dfa_per_layer": [
+ 0.0024171490222215652,
+ 0.0012326111318543553,
+ 0.0015420420095324516,
+ -0.0004299881402403116
+ ],
+ "acc_eval": 0.2333984375,
+ "loss_eval": 2.0970499515533447,
+ "epoch": 19
+ },
+ {
+ "hidden_norms_cls": [
+ 24.054462432861328,
+ 5806660.5,
+ 6270370.0,
+ 7861086.0,
+ 14600824.0
+ ],
+ "hidden_norms_avg": [
+ 801.1851806640625,
+ 5855518.5,
+ 6747570.0,
+ 8137969.0,
+ 13373154.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00012799039541278034,
+ 1.5442244150065676e-09,
+ 9.774002718287989e-10,
+ 8.729071909741037e-10,
+ 8.921305361120346e-10
+ ],
+ "bp_grad_F": [
+ 0.9552626609802246,
+ 1.163827892014524e-05,
+ 2.461903250150499e-07,
+ 3.4675800009154045e-08,
+ 3.4831803219503854e-08
+ ],
+ "gamma_dfa": 0.0018355100764892995,
+ "gamma_dfa_per_layer": [
+ 0.004604285582900047,
+ 0.00167210737708956,
+ 0.001404301729053259,
+ -0.0003386543830856681
+ ],
+ "acc_eval": 0.2138671875,
+ "loss_eval": 2.11769700050354,
+ "epoch": 20
+ },
+ {
+ "hidden_norms_cls": [
+ 24.826902389526367,
+ 6414338.0,
+ 6989573.0,
+ 8609765.0,
+ 15368301.0
+ ],
+ "hidden_norms_avg": [
+ 830.1490478515625,
+ 6946265.5,
+ 7916239.0,
+ 9224772.0,
+ 14431417.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015248128329403698,
+ 1.4729809594271615e-09,
+ 9.462167716023373e-10,
+ 8.629364445233989e-10,
+ 8.805687845558907e-10
+ ],
+ "bp_grad_F": [
+ 0.1705506592988968,
+ 0.00016797611897345632,
+ 4.810285503253908e-08,
+ 3.399246040203252e-08,
+ 3.436711182303043e-08
+ ],
+ "gamma_dfa": 0.0015317398574552499,
+ "gamma_dfa_per_layer": [
+ 0.004021936096251011,
+ 0.0012830595951527357,
+ 0.0012305387062951922,
+ -0.00040857496787793934
+ ],
+ "acc_eval": 0.2236328125,
+ "loss_eval": 2.102954864501953,
+ "epoch": 21
+ },
+ {
+ "hidden_norms_cls": [
+ 25.52900505065918,
+ 8152435.5,
+ 8736555.0,
+ 9881049.0,
+ 16997340.0
+ ],
+ "hidden_norms_avg": [
+ 858.3137817382812,
+ 7544203.0,
+ 8860779.0,
+ 10224814.0,
+ 15607154.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001363755582133308,
+ 1.2969386675720784e-09,
+ 9.174655479782245e-10,
+ 8.421383035361885e-10,
+ 8.538599827190296e-10
+ ],
+ "bp_grad_F": [
+ 0.07549053430557251,
+ 2.9420058126561344e-05,
+ 5.8904493727141016e-08,
+ 3.187446395713778e-08,
+ 3.1860317051268794e-08
+ ],
+ "gamma_dfa": 0.0023631651129107922,
+ "gamma_dfa_per_layer": [
+ 0.007739294320344925,
+ 0.0009300304809585214,
+ 0.001171439653262496,
+ -0.00038810400292277336
+ ],
+ "acc_eval": 0.2080078125,
+ "loss_eval": 2.1162400245666504,
+ "epoch": 22
+ },
+ {
+ "hidden_norms_cls": [
+ 26.122589111328125,
+ 9255466.0,
+ 9964734.0,
+ 11054792.0,
+ 18565818.0
+ ],
+ "hidden_norms_avg": [
+ 884.7098388671875,
+ 8814330.0,
+ 10177720.0,
+ 11552646.0,
+ 17489728.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014142012514639646,
+ 1.3653665975610352e-09,
+ 8.580440802319345e-10,
+ 7.922714151398225e-10,
+ 8.032630116616701e-10
+ ],
+ "bp_grad_F": [
+ 0.11926258355379105,
+ 1.2633940968953539e-05,
+ 3.893048727832138e-08,
+ 3.075604126934195e-08,
+ 3.043995278062539e-08
+ ],
+ "gamma_dfa": 0.0013515961618395522,
+ "gamma_dfa_per_layer": [
+ 0.0038036422338336706,
+ 0.0009011125075630844,
+ 0.0010650388430804014,
+ -0.0003634089371189475
+ ],
+ "acc_eval": 0.201171875,
+ "loss_eval": 2.134256362915039,
+ "epoch": 23
+ },
+ {
+ "hidden_norms_cls": [
+ 26.71797752380371,
+ 8691604.0,
+ 9652268.0,
+ 11413482.0,
+ 19342164.0
+ ],
+ "hidden_norms_avg": [
+ 908.3400268554688,
+ 9418884.0,
+ 11132975.0,
+ 12548590.0,
+ 18516546.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00016020517796278,
+ 1.5232745065318909e-09,
+ 8.103306359252826e-10,
+ 7.392123024807518e-10,
+ 7.529800671868259e-10
+ ],
+ "bp_grad_F": [
+ 0.08055854588747025,
+ 1.5452902516699396e-05,
+ 3.9288735820264264e-08,
+ 3.091117406484045e-08,
+ 2.9865013573271426e-08
+ ],
+ "gamma_dfa": 0.0012649961790884845,
+ "gamma_dfa_per_layer": [
+ 0.0036856848746538162,
+ 0.0008738536853343248,
+ 0.0009324033162556589,
+ -0.00043195715988986194
+ ],
+ "acc_eval": 0.216796875,
+ "loss_eval": 2.1074087619781494,
+ "epoch": 24
+ },
+ {
+ "hidden_norms_cls": [
+ 27.27407455444336,
+ 9931691.0,
+ 10836582.0,
+ 12350148.0,
+ 20677670.0
+ ],
+ "hidden_norms_avg": [
+ 931.8362426757812,
+ 10575293.0,
+ 12476721.0,
+ 13979366.0,
+ 20145220.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002644142950884998,
+ 1.4137412351900025e-09,
+ 7.711813965194381e-10,
+ 7.245293809354791e-10,
+ 7.329452600401964e-10
+ ],
+ "bp_grad_F": [
+ 0.08752908557653427,
+ 3.3139032893814147e-05,
+ 4.584432744536571e-08,
+ 2.996421955003825e-08,
+ 2.8689356668110122e-08
+ ],
+ "gamma_dfa": 0.0013240749976830557,
+ "gamma_dfa_per_layer": [
+ 0.003940493334084749,
+ 0.0008323215297423303,
+ 0.0009093738626688719,
+ -0.0003858887357637286
+ ],
+ "acc_eval": 0.2080078125,
+ "loss_eval": 2.1011557579040527,
+ "epoch": 25
+ },
+ {
+ "hidden_norms_cls": [
+ 27.817367553710938,
+ 12253263.0,
+ 13105294.0,
+ 14345712.0,
+ 22455440.0
+ ],
+ "hidden_norms_avg": [
+ 953.0517578125,
+ 12373978.0,
+ 14141729.0,
+ 15597335.0,
+ 22309104.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014759604528080672,
+ 1.123480086739903e-09,
+ 7.102037291595309e-10,
+ 6.690955567378865e-10,
+ 6.791667228611686e-10
+ ],
+ "bp_grad_F": [
+ 0.05615593492984772,
+ 0.00010146480053663254,
+ 3.714368190799178e-08,
+ 2.748037175592799e-08,
+ 2.6385574614096186e-08
+ ],
+ "gamma_dfa": 0.0012311612081248313,
+ "gamma_dfa_per_layer": [
+ 0.003369898535311222,
+ 0.0009893677197396755,
+ 0.0009041082230396569,
+ -0.0003387296455912292
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 2.105236291885376,
+ "epoch": 26
+ },
+ {
+ "hidden_norms_cls": [
+ 28.32236099243164,
+ 13643201.0,
+ 14611628.0,
+ 15764247.0,
+ 24160378.0
+ ],
+ "hidden_norms_avg": [
+ 973.9281616210938,
+ 13221320.0,
+ 15394035.0,
+ 16890642.0,
+ 23678466.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00016657183005008847,
+ 9.720990679085162e-10,
+ 6.881580305595492e-10,
+ 6.496979620962406e-10,
+ 6.5528305004392e-10
+ ],
+ "bp_grad_F": [
+ 0.21266740560531616,
+ 1.0097430276800878e-05,
+ 5.8009760550703504e-08,
+ 2.5056060337647068e-08,
+ 2.5318335872270836e-08
+ ],
+ "gamma_dfa": 0.0010233484499622136,
+ "gamma_dfa_per_layer": [
+ 0.0030805980786681175,
+ 0.0005203179316595197,
+ 0.000822446309030056,
+ -0.00032996851950883865
+ ],
+ "acc_eval": 0.212890625,
+ "loss_eval": 2.137085437774658,
+ "epoch": 27
+ },
+ {
+ "hidden_norms_cls": [
+ 28.79292106628418,
+ 13177481.0,
+ 14299000.0,
+ 15555998.0,
+ 23304192.0
+ ],
+ "hidden_norms_avg": [
+ 992.415771484375,
+ 14624837.0,
+ 16826644.0,
+ 18325902.0,
+ 25292966.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00020211696391925216,
+ 1.1425522750130312e-09,
+ 6.55300591567709e-10,
+ 6.094423854463571e-10,
+ 6.189129764244683e-10
+ ],
+ "bp_grad_F": [
+ 0.17359277606010437,
+ 1.2817296010325663e-05,
+ 7.396955936656013e-08,
+ 2.5667416636565576e-08,
+ 2.485118777428852e-08
+ ],
+ "gamma_dfa": 0.0013693289074581116,
+ "gamma_dfa_per_layer": [
+ 0.004313473589718342,
+ 0.0007373306434601545,
+ 0.000740988994948566,
+ -0.00031447759829461575
+ ],
+ "acc_eval": 0.2255859375,
+ "loss_eval": 2.095831871032715,
+ "epoch": 28
+ },
+ {
+ "hidden_norms_cls": [
+ 29.206546783447266,
+ 13026473.0,
+ 14086985.0,
+ 16207103.0,
+ 25752542.0
+ ],
+ "hidden_norms_avg": [
+ 1012.0676879882812,
+ 14977745.0,
+ 17788350.0,
+ 19459138.0,
+ 26297900.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002467916056048125,
+ 1.5415436704913077e-09,
+ 6.588643519656046e-10,
+ 6.053296752739357e-10,
+ 6.112412798131572e-10
+ ],
+ "bp_grad_F": [
+ 0.042935822159051895,
+ 9.192503966914956e-06,
+ 3.478140442325639e-08,
+ 2.366191687031005e-08,
+ 2.384759412166204e-08
+ ],
+ "gamma_dfa": 0.0008732089045224711,
+ "gamma_dfa_per_layer": [
+ 0.002771018771454692,
+ 0.00032788922544568777,
+ 0.0007068651611916721,
+ -0.0003129375400021672
+ ],
+ "acc_eval": 0.2294921875,
+ "loss_eval": 2.0877132415771484,
+ "epoch": 29
+ },
+ {
+ "hidden_norms_cls": [
+ 29.655010223388672,
+ 18104814.0,
+ 18959442.0,
+ 20352136.0,
+ 30115644.0
+ ],
+ "hidden_norms_avg": [
+ 1030.1336669921875,
+ 17704192.0,
+ 19945910.0,
+ 21540694.0,
+ 29199112.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00019920141494367272,
+ 8.472024748407136e-10,
+ 5.961620086480934e-10,
+ 5.578593698096768e-10,
+ 5.602495689593923e-10
+ ],
+ "bp_grad_F": [
+ 0.05658308416604996,
+ 2.5135868781944737e-05,
+ 4.3493169954444966e-08,
+ 2.1390142990185268e-08,
+ 2.1341643119399123e-08
+ ],
+ "gamma_dfa": 0.0010463381186127663,
+ "gamma_dfa_per_layer": [
+ 0.0027386434376239777,
+ 0.0009209397248923779,
+ 0.0007645037840120494,
+ -0.0002387344720773399
+ ],
+ "acc_eval": 0.2138671875,
+ "loss_eval": 2.1298673152923584,
+ "epoch": 30
+ },
+ {
+ "hidden_norms_cls": [
+ 30.063920974731445,
+ 20103628.0,
+ 20986630.0,
+ 22120356.0,
+ 31195618.0
+ ],
+ "hidden_norms_avg": [
+ 1046.1927490234375,
+ 18906620.0,
+ 21404482.0,
+ 23038508.0,
+ 30526688.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002040969266090542,
+ 9.528980937645315e-10,
+ 5.700001026731627e-10,
+ 5.158900528989818e-10,
+ 5.214851328538828e-10
+ ],
+ "bp_grad_F": [
+ 0.0816737711429596,
+ 5.908617822569795e-05,
+ 3.4592272157851767e-08,
+ 2.022995992945198e-08,
+ 2.0381063947638722e-08
+ ],
+ "gamma_dfa": 0.001085347576008644,
+ "gamma_dfa_per_layer": [
+ 0.0035934830084443092,
+ 0.0002959886915050447,
+ 0.0007062341319397092,
+ -0.0002543155278544873
+ ],
+ "acc_eval": 0.2041015625,
+ "loss_eval": 2.116055965423584,
+ "epoch": 31
+ },
+ {
+ "hidden_norms_cls": [
+ 30.392677307128906,
+ 21290946.0,
+ 22100456.0,
+ 23440498.0,
+ 32839040.0
+ ],
+ "hidden_norms_avg": [
+ 1062.797119140625,
+ 20072588.0,
+ 22866046.0,
+ 24608556.0,
+ 32259930.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00022883246128913015,
+ 1.3679187782500435e-09,
+ 5.444520945196984e-10,
+ 5.043216955158414e-10,
+ 5.114720313947885e-10
+ ],
+ "bp_grad_F": [
+ 0.2192479968070984,
+ 0.0001256070681847632,
+ 1.2757884348957305e-07,
+ 2.0006645229386777e-08,
+ 1.9971306386423748e-08
+ ],
+ "gamma_dfa": 0.0019978012933279388,
+ "gamma_dfa_per_layer": [
+ 0.0072806887328624725,
+ 0.0002412673202343285,
+ 0.000707695260643959,
+ -0.00023844614042900503
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 2.1034791469573975,
+ "epoch": 32
+ },
+ {
+ "hidden_norms_cls": [
+ 30.711090087890625,
+ 22272344.0,
+ 23036462.0,
+ 24462584.0,
+ 35130192.0
+ ],
+ "hidden_norms_avg": [
+ 1082.3468017578125,
+ 20945452.0,
+ 23993758.0,
+ 25838460.0,
+ 33448582.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005148049676790833,
+ 2.304462176638822e-09,
+ 5.340937136999457e-10,
+ 4.950916898671665e-10,
+ 5.010572512453848e-10
+ ],
+ "bp_grad_F": [
+ 0.15110087394714355,
+ 3.209088754374534e-05,
+ 1.0334197497741116e-07,
+ 2.0131187383753968e-08,
+ 1.9814510920923567e-08
+ ],
+ "gamma_dfa": 0.003046433750569122,
+ "gamma_dfa_per_layer": [
+ 0.011593285948038101,
+ 0.00019314857490826398,
+ 0.0006439671851694584,
+ -0.0002446667058393359
+ ],
+ "acc_eval": 0.208984375,
+ "loss_eval": 2.112250328063965,
+ "epoch": 33
+ },
+ {
+ "hidden_norms_cls": [
+ 31.0146427154541,
+ 29106790.0,
+ 29617952.0,
+ 31075512.0,
+ 42307980.0
+ ],
+ "hidden_norms_avg": [
+ 1102.4920654296875,
+ 22080922.0,
+ 25255976.0,
+ 27220448.0,
+ 35072796.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003266549902036786,
+ 3.0358568992028268e-09,
+ 4.893331295718895e-10,
+ 4.395950825575312e-10,
+ 4.4405815136094873e-10
+ ],
+ "bp_grad_F": [
+ 1.0139163732528687,
+ 1.6822159523144364e-05,
+ 1.2544650473955699e-07,
+ 1.6449900996917677e-08,
+ 1.5756539184508256e-08
+ ],
+ "gamma_dfa": 0.004347974703705404,
+ "gamma_dfa_per_layer": [
+ 0.016904333606362343,
+ -2.5271147023886442e-05,
+ 0.0006614690646529198,
+ -0.00014863270916976035
+ ],
+ "acc_eval": 0.1806640625,
+ "loss_eval": 2.1869568824768066,
+ "epoch": 34
+ },
+ {
+ "hidden_norms_cls": [
+ 31.282560348510742,
+ 30793450.0,
+ 31273076.0,
+ 33029836.0,
+ 44659544.0
+ ],
+ "hidden_norms_avg": [
+ 1120.8310546875,
+ 23223250.0,
+ 26597348.0,
+ 28740710.0,
+ 37219140.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004533866886049509,
+ 8.621259817154225e-10,
+ 4.717314872060285e-10,
+ 4.43607900413312e-10,
+ 4.492739236194865e-10
+ ],
+ "bp_grad_F": [
+ 0.8242164254188538,
+ 9.425415555597283e-06,
+ 6.696246401816097e-08,
+ 1.4385987512355314e-08,
+ 1.456661191667763e-08
+ ],
+ "gamma_dfa": 0.004019053936644923,
+ "gamma_dfa_per_layer": [
+ 0.015497363172471523,
+ 0.0001274545502383262,
+ 0.0006036070408299565,
+ -0.00015220901696011424
+ ],
+ "acc_eval": 0.1396484375,
+ "loss_eval": 2.199540615081787,
+ "epoch": 35
+ },
+ {
+ "hidden_norms_cls": [
+ 31.512802124023438,
+ 21969868.0,
+ 22884238.0,
+ 24682478.0,
+ 38405980.0
+ ],
+ "hidden_norms_avg": [
+ 1138.61962890625,
+ 23861642.0,
+ 27547416.0,
+ 29877192.0,
+ 38524416.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00065120670478791,
+ 1.8789774181016128e-09,
+ 5.075246334307337e-10,
+ 4.637440431665141e-10,
+ 4.687980004192127e-10
+ ],
+ "bp_grad_F": [
+ 0.22404567897319794,
+ 6.978048531891545e-06,
+ 5.974419536869391e-08,
+ 1.854446907145757e-08,
+ 1.8726453276940447e-08
+ ],
+ "gamma_dfa": 0.0030916051182430238,
+ "gamma_dfa_per_layer": [
+ 0.011011095717549324,
+ 0.0010498585179448128,
+ 0.0005736061139032245,
+ -0.00026813987642526627
+ ],
+ "acc_eval": 0.20703125,
+ "loss_eval": 2.1297407150268555,
+ "epoch": 36
+ },
+ {
+ "hidden_norms_cls": [
+ 31.728811264038086,
+ 29299954.0,
+ 29843046.0,
+ 31522240.0,
+ 44597740.0
+ ],
+ "hidden_norms_avg": [
+ 1154.2742919921875,
+ 26176784.0,
+ 29361794.0,
+ 31622036.0,
+ 40631524.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00057179294526577,
+ 8.620974489836897e-10,
+ 4.3859474385676833e-10,
+ 4.131678610352907e-10,
+ 4.158901834028228e-10
+ ],
+ "bp_grad_F": [
+ 0.1988120824098587,
+ 6.200312782311812e-06,
+ 7.633398269035752e-08,
+ 1.800971105581084e-08,
+ 1.6420651505200112e-08
+ ],
+ "gamma_dfa": 0.0036353242212499026,
+ "gamma_dfa_per_layer": [
+ 0.013258620165288448,
+ 0.0009053392568603158,
+ 0.0005595044931396842,
+ -0.00018216703028883785
+ ],
+ "acc_eval": 0.193359375,
+ "loss_eval": 2.162503719329834,
+ "epoch": 37
+ },
+ {
+ "hidden_norms_cls": [
+ 31.93093490600586,
+ 24153264.0,
+ 24958016.0,
+ 27164164.0,
+ 41821856.0
+ ],
+ "hidden_norms_avg": [
+ 1168.3504638671875,
+ 25251302.0,
+ 29331440.0,
+ 31888322.0,
+ 40732864.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007007869426161051,
+ 3.803806603031035e-09,
+ 4.6435830181046356e-10,
+ 4.2823591894780577e-10,
+ 4.335505288111108e-10
+ ],
+ "bp_grad_F": [
+ 0.23370306193828583,
+ 5.834654530190164e-06,
+ 4.249230300956697e-08,
+ 1.778762737103534e-08,
+ 1.7575523258983594e-08
+ ],
+ "gamma_dfa": 0.003036663241800852,
+ "gamma_dfa_per_layer": [
+ 0.010693107731640339,
+ 0.001166085829026997,
+ 0.0005278221797198057,
+ -0.00024036277318373322
+ ],
+ "acc_eval": 0.2060546875,
+ "loss_eval": 2.145090103149414,
+ "epoch": 38
+ },
+ {
+ "hidden_norms_cls": [
+ 32.11568069458008,
+ 30941254.0,
+ 31479742.0,
+ 33270594.0,
+ 46886708.0
+ ],
+ "hidden_norms_avg": [
+ 1180.89794921875,
+ 26732550.0,
+ 30676362.0,
+ 33269292.0,
+ 42382468.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006622264045290649,
+ 1.5328843749884413e-09,
+ 4.1302217201888425e-10,
+ 3.8878930630481534e-10,
+ 3.9369618676232676e-10
+ ],
+ "bp_grad_F": [
+ 0.7251601815223694,
+ 2.9320523026399314e-05,
+ 1.0578004605577007e-07,
+ 1.5190060764780355e-08,
+ 1.538120386612718e-08
+ ],
+ "gamma_dfa": 0.0034242832334712148,
+ "gamma_dfa_per_layer": [
+ 0.012806901708245277,
+ 0.0005313451401889324,
+ 0.0005365218385122716,
+ -0.00017763575306162238
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 2.1417269706726074,
+ "epoch": 39
+ },
+ {
+ "hidden_norms_cls": [
+ 32.295955657958984,
+ 33935232.0,
+ 34368956.0,
+ 35934572.0,
+ 47697056.0
+ ],
+ "hidden_norms_avg": [
+ 1192.405517578125,
+ 27784236.0,
+ 31654758.0,
+ 34253712.0,
+ 43239588.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000609845039434731,
+ 1.1788049425476288e-09,
+ 4.4074988103659507e-10,
+ 3.883143528948807e-10,
+ 3.8990835560248627e-10
+ ],
+ "bp_grad_F": [
+ 0.3570167124271393,
+ 5.2556606533471495e-06,
+ 6.658066098452764e-08,
+ 1.6441132899558397e-08,
+ 1.5662063646004754e-08
+ ],
+ "gamma_dfa": 0.0031971330136002507,
+ "gamma_dfa_per_layer": [
+ 0.011760826222598553,
+ 0.000679977354593575,
+ 0.0005443703266791999,
+ -0.00019664184947032481
+ ],
+ "acc_eval": 0.1962890625,
+ "loss_eval": 2.159468173980713,
+ "epoch": 40
+ },
+ {
+ "hidden_norms_cls": [
+ 32.446258544921875,
+ 19652562.0,
+ 21036314.0,
+ 25921266.0,
+ 40927384.0
+ ],
+ "hidden_norms_avg": [
+ 1203.144287109375,
+ 31749304.0,
+ 34556376.0,
+ 36976868.0,
+ 47059032.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006137214368209243,
+ 8.001962981118993e-10,
+ 4.3686718131930036e-10,
+ 4.163595301864831e-10,
+ 4.1693556940280985e-10
+ ],
+ "bp_grad_F": [
+ 0.12317141890525818,
+ 1.0874373401748016e-05,
+ 3.419825134187704e-08,
+ 1.7081790204542813e-08,
+ 1.7078438219186864e-08
+ ],
+ "gamma_dfa": 0.002385696723649744,
+ "gamma_dfa_per_layer": [
+ 0.008561503142118454,
+ 0.000761325703933835,
+ 0.00044924806570634246,
+ -0.0002292900171596557
+ ],
+ "acc_eval": 0.1943359375,
+ "loss_eval": 2.1486196517944336,
+ "epoch": 41
+ },
+ {
+ "hidden_norms_cls": [
+ 32.65601348876953,
+ 18852588.0,
+ 20806824.0,
+ 26129350.0,
+ 41854136.0
+ ],
+ "hidden_norms_avg": [
+ 1211.216064453125,
+ 33512262.0,
+ 36150576.0,
+ 38488828.0,
+ 48876332.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00041886867256835103,
+ 6.960994003435417e-10,
+ 3.895795075425923e-10,
+ 3.7316269518861134e-10,
+ 3.8092326515304364e-10
+ ],
+ "bp_grad_F": [
+ 0.14164908230304718,
+ 1.2379082363622729e-06,
+ 2.6289937338219715e-08,
+ 1.6158612226035984e-08,
+ 1.6345055087185756e-08
+ ],
+ "gamma_dfa": 0.0026270662965544034,
+ "gamma_dfa_per_layer": [
+ 0.009110232815146446,
+ 0.0011993220541626215,
+ 0.00041866287938319147,
+ -0.00021995256247464567
+ ],
+ "acc_eval": 0.19140625,
+ "loss_eval": 2.1592655181884766,
+ "epoch": 42
+ },
+ {
+ "hidden_norms_cls": [
+ 32.8077507019043,
+ 13604255.0,
+ 20737208.0,
+ 26201736.0,
+ 38498212.0
+ ],
+ "hidden_norms_avg": [
+ 1218.5357666015625,
+ 34337856.0,
+ 37186496.0,
+ 39492900.0,
+ 49837356.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00024631666019558907,
+ 7.821958081244418e-10,
+ 3.8121927836698433e-10,
+ 3.6691791271969976e-10,
+ 3.7013728193535655e-10
+ ],
+ "bp_grad_F": [
+ 0.16077305376529694,
+ 4.323472239775583e-06,
+ 3.772007772795405e-08,
+ 1.5986831414238623e-08,
+ 1.5948634413121e-08
+ ],
+ "gamma_dfa": 0.002168099657865241,
+ "gamma_dfa_per_layer": [
+ 0.007105600088834763,
+ 0.0013786349445581436,
+ 0.00041434637387283146,
+ -0.00022618277580477297
+ ],
+ "acc_eval": 0.193359375,
+ "loss_eval": 2.1537227630615234,
+ "epoch": 43
+ },
+ {
+ "hidden_norms_cls": [
+ 32.95870590209961,
+ 17278438.0,
+ 21010234.0,
+ 26451948.0,
+ 41976576.0
+ ],
+ "hidden_norms_avg": [
+ 1225.39501953125,
+ 36196112.0,
+ 38833272.0,
+ 41042520.0,
+ 51415488.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00017274360288865864,
+ 7.227461407133262e-10,
+ 3.619011756939017e-10,
+ 3.5793992769761473e-10,
+ 3.6092046018509905e-10
+ ],
+ "bp_grad_F": [
+ 0.9672663807868958,
+ 3.41643476531317e-06,
+ 5.25712664511957e-08,
+ 1.5481989024124232e-08,
+ 1.548605688128646e-08
+ ],
+ "gamma_dfa": 0.001979457345441915,
+ "gamma_dfa_per_layer": [
+ 0.006772718392312527,
+ 0.0009743775590322912,
+ 0.00037397228879854083,
+ -0.00020323885837569833
+ ],
+ "acc_eval": 0.208984375,
+ "loss_eval": 2.1646997928619385,
+ "epoch": 44
+ },
+ {
+ "hidden_norms_cls": [
+ 33.06986999511719,
+ 23368844.0,
+ 24521804.0,
+ 27230594.0,
+ 45358652.0
+ ],
+ "hidden_norms_avg": [
+ 1231.394287109375,
+ 38020996.0,
+ 40414464.0,
+ 42538228.0,
+ 53283596.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015840897685848176,
+ 6.067092384043349e-10,
+ 3.4933173020945674e-10,
+ 3.3962907486362326e-10,
+ 3.42745692938351e-10
+ ],
+ "bp_grad_F": [
+ 0.3695656955242157,
+ 2.3579739263368538e-06,
+ 5.5092176154403205e-08,
+ 1.777137192959799e-08,
+ 1.4559810246339566e-08
+ ],
+ "gamma_dfa": 0.0020704490307252854,
+ "gamma_dfa_per_layer": [
+ 0.007164421491324902,
+ 0.0009055124246515334,
+ 0.0003939281450584531,
+ -0.00018206593813374639
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 2.1666717529296875,
+ "epoch": 45
+ },
+ {
+ "hidden_norms_cls": [
+ 33.164432525634766,
+ 29174184.0,
+ 30089798.0,
+ 32367896.0,
+ 48892740.0
+ ],
+ "hidden_norms_avg": [
+ 1237.1142578125,
+ 37470168.0,
+ 40219512.0,
+ 42356984.0,
+ 52772660.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00024464691523462534,
+ 5.441591066634999e-10,
+ 3.6414088411262924e-10,
+ 3.320065611323031e-10,
+ 3.387692348866267e-10
+ ],
+ "bp_grad_F": [
+ 0.20688536763191223,
+ 4.435638402355835e-06,
+ 8.288016317692382e-08,
+ 1.4215274291018432e-08,
+ 1.4331217101926086e-08
+ ],
+ "gamma_dfa": 0.0017712319058773573,
+ "gamma_dfa_per_layer": [
+ 0.006079941056668758,
+ 0.0008057263912633061,
+ 0.00038248312193900347,
+ -0.0001832229463616386
+ ],
+ "acc_eval": 0.1806640625,
+ "loss_eval": 2.173765182495117,
+ "epoch": 46
+ },
+ {
+ "hidden_norms_cls": [
+ 33.24842071533203,
+ 33830332.0,
+ 34499304.0,
+ 36673048.0,
+ 51963528.0
+ ],
+ "hidden_norms_avg": [
+ 1242.226318359375,
+ 38073352.0,
+ 40806512.0,
+ 42901500.0,
+ 53437180.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002524294250179082,
+ 5.388652302151797e-10,
+ 3.6845529405304944e-10,
+ 3.3760005901939394e-10,
+ 3.4174474361492457e-10
+ ],
+ "bp_grad_F": [
+ 0.12659014761447906,
+ 2.532647158659529e-06,
+ 5.97612910269163e-08,
+ 1.3431267653629675e-08,
+ 1.3499856343912597e-08
+ ],
+ "gamma_dfa": 0.0021579467684205156,
+ "gamma_dfa_per_layer": [
+ 0.007928929291665554,
+ 0.00047530903248116374,
+ 0.00039780279621481895,
+ -0.0001702540466794744
+ ],
+ "acc_eval": 0.2099609375,
+ "loss_eval": 2.161896228790283,
+ "epoch": 47
+ },
+ {
+ "hidden_norms_cls": [
+ 33.338741302490234,
+ 19795148.0,
+ 21916948.0,
+ 27189936.0,
+ 43588712.0
+ ],
+ "hidden_norms_avg": [
+ 1246.7552490234375,
+ 38983196.0,
+ 41658504.0,
+ 43769460.0,
+ 54177164.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002599447325337678,
+ 6.2289540192495e-10,
+ 3.6807956682594067e-10,
+ 3.4037242468976103e-10,
+ 3.472495624379235e-10
+ ],
+ "bp_grad_F": [
+ 0.11130323261022568,
+ 6.972830760787474e-06,
+ 5.447330764241087e-08,
+ 1.4756569299834155e-08,
+ 1.4917180379825368e-08
+ ],
+ "gamma_dfa": 0.0021847522366442718,
+ "gamma_dfa_per_layer": [
+ 0.007594278547912836,
+ 0.0009666476398706436,
+ 0.0003712670295499265,
+ -0.00019318427075631917
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 2.1626296043395996,
+ "epoch": 48
+ },
+ {
+ "hidden_norms_cls": [
+ 33.42045974731445,
+ 24898126.0,
+ 26009376.0,
+ 28516464.0,
+ 47394980.0
+ ],
+ "hidden_norms_avg": [
+ 1250.1884765625,
+ 39632580.0,
+ 42285708.0,
+ 44390100.0,
+ 55233620.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001829452667152509,
+ 5.726033536213038e-10,
+ 3.5659752928296484e-10,
+ 3.292066619309253e-10,
+ 3.31846911061362e-10
+ ],
+ "bp_grad_F": [
+ 0.23442988097667694,
+ 3.2595114589639707e-06,
+ 1.0605135969399271e-07,
+ 1.4677630666426467e-08,
+ 1.445219677265186e-08
+ ],
+ "gamma_dfa": 0.0021932553718215786,
+ "gamma_dfa_per_layer": [
+ 0.007973091676831245,
+ 0.0006458763382397592,
+ 0.00032728860969655216,
+ -0.00017323513748124242
+ ],
+ "acc_eval": 0.1923828125,
+ "loss_eval": 2.175835609436035,
+ "epoch": 49
+ },
+ {
+ "hidden_norms_cls": [
+ 33.47613525390625,
+ 25550002.0,
+ 26776384.0,
+ 28507352.0,
+ 47268464.0
+ ],
+ "hidden_norms_avg": [
+ 1253.279541015625,
+ 39494300.0,
+ 42348356.0,
+ 44479368.0,
+ 55121100.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00012893354869447649,
+ 5.787402224122218e-10,
+ 3.341840137949248e-10,
+ 3.2919431069977634e-10,
+ 3.3201591476128556e-10
+ ],
+ "bp_grad_F": [
+ 0.10876749455928802,
+ 4.772132342623081e-06,
+ 7.90316647680811e-08,
+ 1.4042406348835357e-08,
+ 1.4153799909877307e-08
+ ],
+ "gamma_dfa": 0.001727514507365413,
+ "gamma_dfa_per_layer": [
+ 0.0062596434727311134,
+ 0.0004772312822751701,
+ 0.000357049866579473,
+ -0.0001838665921241045
+ ],
+ "acc_eval": 0.1904296875,
+ "loss_eval": 2.164583444595337,
+ "epoch": 50
+ },
+ {
+ "hidden_norms_cls": [
+ 33.52043914794922,
+ 28050636.0,
+ 29099278.0,
+ 31227182.0,
+ 49045872.0
+ ],
+ "hidden_norms_avg": [
+ 1255.7454833984375,
+ 40231008.0,
+ 42960368.0,
+ 45079784.0,
+ 55989944.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015386792074423283,
+ 5.41802436249128e-10,
+ 3.373940293815991e-10,
+ 3.3321326253776817e-10,
+ 3.361276257329848e-10
+ ],
+ "bp_grad_F": [
+ 0.2656819522380829,
+ 2.482481932020164e-06,
+ 8.287289432473699e-08,
+ 1.3792345932017724e-08,
+ 1.3917338392843703e-08
+ ],
+ "gamma_dfa": 0.001938080065883696,
+ "gamma_dfa_per_layer": [
+ 0.006978346034884453,
+ 0.0005946386372670531,
+ 0.00036033656215295196,
+ -0.00018100097076967359
+ ],
+ "acc_eval": 0.1962890625,
+ "loss_eval": 2.176473379135132,
+ "epoch": 51
+ },
+ {
+ "hidden_norms_cls": [
+ 33.55419921875,
+ 25508434.0,
+ 26505134.0,
+ 29051658.0,
+ 47339916.0
+ ],
+ "hidden_norms_avg": [
+ 1257.7822265625,
+ 40388772.0,
+ 43162480.0,
+ 45217960.0,
+ 55966100.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00018102869216818362,
+ 5.443374639924059e-10,
+ 3.9548594954474936e-10,
+ 3.679410942591943e-10,
+ 3.717116892065775e-10
+ ],
+ "bp_grad_F": [
+ 0.28429684042930603,
+ 3.3983885714405915e-06,
+ 8.993236377818903e-08,
+ 1.4510244561449781e-08,
+ 1.4562592021150067e-08
+ ],
+ "gamma_dfa": 0.001642326584260445,
+ "gamma_dfa_per_layer": [
+ 0.006192460190504789,
+ 0.00019942648941650987,
+ 0.00037004181649535894,
+ -0.0001926221593748778
+ ],
+ "acc_eval": 0.2001953125,
+ "loss_eval": 2.1743006706237793,
+ "epoch": 52
+ },
+ {
+ "hidden_norms_cls": [
+ 33.58127212524414,
+ 28540952.0,
+ 29607362.0,
+ 31472670.0,
+ 49191068.0
+ ],
+ "hidden_norms_avg": [
+ 1259.4189453125,
+ 40550800.0,
+ 43364984.0,
+ 45506960.0,
+ 56297104.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00018638238543644547,
+ 5.299162220140374e-10,
+ 3.2437005859087265e-10,
+ 3.1624741714253446e-10,
+ 3.1920088794379353e-10
+ ],
+ "bp_grad_F": [
+ 0.21056434512138367,
+ 3.217361381757655e-06,
+ 5.1724125427199397e-08,
+ 1.390105897058902e-08,
+ 1.3961146017038573e-08
+ ],
+ "gamma_dfa": 0.0018532263711676933,
+ "gamma_dfa_per_layer": [
+ 0.006584585644304752,
+ 0.0006806463352404535,
+ 0.00032758695306256413,
+ -0.00017991344793699682
+ ],
+ "acc_eval": 0.19921875,
+ "loss_eval": 2.167957067489624,
+ "epoch": 53
+ },
+ {
+ "hidden_norms_cls": [
+ 33.60611343383789,
+ 27949698.0,
+ 28918304.0,
+ 31366946.0,
+ 48876736.0
+ ],
+ "hidden_norms_avg": [
+ 1260.694091796875,
+ 41001392.0,
+ 43744060.0,
+ 45853688.0,
+ 56636716.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00021861983987037092,
+ 5.396287861003657e-10,
+ 3.377726154329963e-10,
+ 3.201852394330018e-10,
+ 3.237338452866112e-10
+ ],
+ "bp_grad_F": [
+ 0.12415990233421326,
+ 1.6796100226201816e-06,
+ 6.823196940786147e-08,
+ 1.384469427989643e-08,
+ 1.3965705036866893e-08
+ ],
+ "gamma_dfa": 0.0017868579998321366,
+ "gamma_dfa_per_layer": [
+ 0.006317156832665205,
+ 0.0006519090966321528,
+ 0.0003622731601353735,
+ -0.00018390709010418504
+ ],
+ "acc_eval": 0.1953125,
+ "loss_eval": 2.178144931793213,
+ "epoch": 54
+ },
+ {
+ "hidden_norms_cls": [
+ 33.620914459228516,
+ 27607036.0,
+ 28622492.0,
+ 31370470.0,
+ 48645068.0
+ ],
+ "hidden_norms_avg": [
+ 1261.64208984375,
+ 40948476.0,
+ 43773536.0,
+ 45888992.0,
+ 56623536.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002112231741193682,
+ 5.336073249928575e-10,
+ 3.533912051878474e-10,
+ 3.186636232666018e-10,
+ 3.226934830458106e-10
+ ],
+ "bp_grad_F": [
+ 0.1486925333738327,
+ 3.3336793876515003e-06,
+ 9.466339889740993e-08,
+ 1.4568017014937595e-08,
+ 1.4240884915750485e-08
+ ],
+ "gamma_dfa": 0.0018792969822243322,
+ "gamma_dfa_per_layer": [
+ 0.006730419583618641,
+ 0.000605170032940805,
+ 0.0003661802038550377,
+ -0.00018458189151715487
+ ],
+ "acc_eval": 0.1982421875,
+ "loss_eval": 2.172356367111206,
+ "epoch": 55
+ },
+ {
+ "hidden_norms_cls": [
+ 33.63143539428711,
+ 28410040.0,
+ 29532286.0,
+ 31697578.0,
+ 48914624.0
+ ],
+ "hidden_norms_avg": [
+ 1262.2918701171875,
+ 40698620.0,
+ 43622904.0,
+ 45764712.0,
+ 56531748.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002270409750053659,
+ 5.479600106994553e-10,
+ 3.2429942065093087e-10,
+ 3.150284755282229e-10,
+ 3.179212726411862e-10
+ ],
+ "bp_grad_F": [
+ 0.10118122398853302,
+ 2.5195840862579644e-06,
+ 8.798109263352671e-08,
+ 1.3570585544186997e-08,
+ 1.3736383586149259e-08
+ ],
+ "gamma_dfa": 0.0017859039653558284,
+ "gamma_dfa_per_layer": [
+ 0.006382801569998264,
+ 0.0005453285994008183,
+ 0.00039217708399519324,
+ -0.00017669139197096229
+ ],
+ "acc_eval": 0.1943359375,
+ "loss_eval": 2.1648902893066406,
+ "epoch": 56
+ },
+ {
+ "hidden_norms_cls": [
+ 33.63875961303711,
+ 31114778.0,
+ 32184654.0,
+ 34278688.0,
+ 50894352.0
+ ],
+ "hidden_norms_avg": [
+ 1262.7132568359375,
+ 40792528.0,
+ 43713536.0,
+ 45850224.0,
+ 56615416.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00019923689251299948,
+ 5.368823718931992e-10,
+ 3.306654117185559e-10,
+ 3.113070912164062e-10,
+ 3.1328556415743947e-10
+ ],
+ "bp_grad_F": [
+ 0.3573400378227234,
+ 1.249598790309392e-05,
+ 1.6106491784739774e-07,
+ 3.301076745287901e-08,
+ 1.3328084413899433e-08
+ ],
+ "gamma_dfa": 0.0016940671957854647,
+ "gamma_dfa_per_layer": [
+ 0.006114102900028229,
+ 0.0004918627091683447,
+ 0.00032346430816687644,
+ -0.00015316113422159106
+ ],
+ "acc_eval": 0.201171875,
+ "loss_eval": 2.1634349822998047,
+ "epoch": 57
+ },
+ {
+ "hidden_norms_cls": [
+ 33.642520904541016,
+ 31868976.0,
+ 32779660.0,
+ 35005740.0,
+ 51305220.0
+ ],
+ "hidden_norms_avg": [
+ 1262.9461669921875,
+ 41087592.0,
+ 43928832.0,
+ 46043268.0,
+ 56839576.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002181618328904733,
+ 5.162476557352136e-10,
+ 3.3206276617292474e-10,
+ 3.1130611977125966e-10,
+ 3.1441516057384433e-10
+ ],
+ "bp_grad_F": [
+ 0.12289460748434067,
+ 1.5301338862627745e-05,
+ 8.779379356838035e-08,
+ 1.4331889452989799e-08,
+ 1.318165843144925e-08
+ ],
+ "gamma_dfa": 0.001529279034002684,
+ "gamma_dfa_per_layer": [
+ 0.00539398193359375,
+ 0.0005496743833646178,
+ 0.00034435215638950467,
+ -0.00017089233733713627
+ ],
+ "acc_eval": 0.2021484375,
+ "loss_eval": 2.164745807647705,
+ "epoch": 58
+ },
+ {
+ "hidden_norms_cls": [
+ 33.6442756652832,
+ 31315430.0,
+ 32160978.0,
+ 34340796.0,
+ 51077484.0
+ ],
+ "hidden_norms_avg": [
+ 1263.062744140625,
+ 41015680.0,
+ 43882708.0,
+ 46002096.0,
+ 56770896.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00021884885791223496,
+ 5.177114292820306e-10,
+ 3.350683897007656e-10,
+ 3.101042200803761e-10,
+ 3.12167347527037e-10
+ ],
+ "bp_grad_F": [
+ 0.11127890646457672,
+ 1.1515544429130387e-05,
+ 8.542571805492116e-08,
+ 1.319963871537766e-08,
+ 1.3264477516372608e-08
+ ],
+ "gamma_dfa": 0.0016308917693095282,
+ "gamma_dfa_per_layer": [
+ 0.005676542408764362,
+ 0.0006629846757277846,
+ 0.0003523063496686518,
+ -0.0001682663569226861
+ ],
+ "acc_eval": 0.19921875,
+ "loss_eval": 2.1635866165161133,
+ "epoch": 59
+ },
+ {
+ "hidden_norms_cls": [
+ 33.643985748291016,
+ 31097308.0,
+ 32052318.0,
+ 34155804.0,
+ 50803736.0
+ ],
+ "hidden_norms_avg": [
+ 1263.064208984375,
+ 40997444.0,
+ 43870400.0,
+ 45990872.0,
+ 56755540.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00021703331731259823,
+ 5.1921633659191e-10,
+ 3.35882821556055e-10,
+ 3.102589296588576e-10,
+ 3.1300673164480486e-10
+ ],
+ "bp_grad_F": [
+ 0.1889268010854721,
+ 1.0328590178687591e-05,
+ 1.1096560825762936e-07,
+ 1.3215729843807367e-08,
+ 1.3306935997547953e-08
+ ],
+ "gamma_dfa": 0.0016646812255203258,
+ "gamma_dfa_per_layer": [
+ 0.005869406741112471,
+ 0.0006016636616550386,
+ 0.0003579354961402714,
+ -0.00017028099682647735
+ ],
+ "acc_eval": 0.2021484375,
+ "loss_eval": 2.163691520690918,
+ "epoch": 60
+ }
+ ]
+} \ No newline at end of file