summaryrefslogtreecommitdiff
path: root/results/snapshot_vit_v1/snapshot_vit_s456.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_vit_v1/snapshot_vit_s456.json')
-rw-r--r--results/snapshot_vit_v1/snapshot_vit_s456.json4594
1 files changed, 4594 insertions, 0 deletions
diff --git a/results/snapshot_vit_v1/snapshot_vit_s456.json b/results/snapshot_vit_v1/snapshot_vit_s456.json
new file mode 100644
index 0000000..1b43b92
--- /dev/null
+++ b/results/snapshot_vit_v1/snapshot_vit_s456.json
@@ -0,0 +1,4594 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_vit_v1",
+ "epochs": 60,
+ "lr": 0.001,
+ "wd": 0.05,
+ "seed": 456,
+ "depth": 4,
+ "d_model": 128,
+ "n_heads": 4
+ },
+ "depth": 4,
+ "d_model": 128,
+ "architecture": "ViTMini",
+ "bp_log": [
+ {
+ "hidden_norms_cls": [
+ 0.3042769432067871,
+ 3.2273340225219727,
+ 4.6926493644714355,
+ 6.003997802734375,
+ 6.652705669403076
+ ],
+ "hidden_norms_avg": [
+ 6.027750492095947,
+ 7.1044697761535645,
+ 7.910475730895996,
+ 8.79189682006836,
+ 9.458833694458008
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.005248428788036108,
+ 0.0012287507997825742,
+ 0.0010387187357991934,
+ 0.0009678652859292924,
+ 0.0009174557635560632
+ ],
+ "bp_grad_F": [
+ 0.248850479722023,
+ 0.0424945093691349,
+ 0.0348997563123703,
+ 0.03202275559306145,
+ 0.030239813029766083
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.0791015625,
+ "loss_eval": 2.544933319091797,
+ "epoch": 0
+ },
+ {
+ "hidden_norms_cls": [
+ 0.47296053171157837,
+ 11.65749454498291,
+ 18.3483943939209,
+ 24.296405792236328,
+ 29.94684410095215
+ ],
+ "hidden_norms_avg": [
+ 4.04442834854126,
+ 9.927255630493164,
+ 14.762720108032227,
+ 19.817049026489258,
+ 24.69188690185547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0025219416711479425,
+ 0.00024655580637045205,
+ 0.00017099862452596426,
+ 0.0001493149611633271,
+ 0.00015047143097035587
+ ],
+ "bp_grad_F": [
+ 0.11354690045118332,
+ 0.00995445717126131,
+ 0.006139951758086681,
+ 0.005140931811183691,
+ 0.005088545847684145
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.458984375,
+ "loss_eval": 1.4817876815795898,
+ "epoch": 1
+ },
+ {
+ "hidden_norms_cls": [
+ 0.6174129843711853,
+ 12.388140678405762,
+ 20.656904220581055,
+ 27.073535919189453,
+ 32.43647003173828
+ ],
+ "hidden_norms_avg": [
+ 3.8196825981140137,
+ 10.982677459716797,
+ 17.020437240600586,
+ 22.471168518066406,
+ 27.064218521118164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0020673249382525682,
+ 0.0002501676499377936,
+ 0.00015905944746918976,
+ 0.00013718422269448638,
+ 0.0001328626531176269
+ ],
+ "bp_grad_F": [
+ 0.09556808322668076,
+ 0.01051106583327055,
+ 0.005822391714900732,
+ 0.004766201134771109,
+ 0.004577947780489922
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.498046875,
+ "loss_eval": 1.356250286102295,
+ "epoch": 2
+ },
+ {
+ "hidden_norms_cls": [
+ 0.7216586470603943,
+ 12.527997016906738,
+ 19.815393447875977,
+ 26.452791213989258,
+ 30.71564483642578
+ ],
+ "hidden_norms_avg": [
+ 3.8907485008239746,
+ 11.261369705200195,
+ 16.61492156982422,
+ 21.57110023498535,
+ 24.978900909423828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0021546317730098963,
+ 0.00030062923906371,
+ 0.00018509272194933146,
+ 0.00013865686196368188,
+ 0.00012920796871185303
+ ],
+ "bp_grad_F": [
+ 0.10040326416492462,
+ 0.012564396485686302,
+ 0.007171053439378738,
+ 0.005316051654517651,
+ 0.004880763124674559
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5263671875,
+ "loss_eval": 1.2655537128448486,
+ "epoch": 3
+ },
+ {
+ "hidden_norms_cls": [
+ 0.8026084899902344,
+ 12.023736953735352,
+ 20.35123062133789,
+ 26.937381744384766,
+ 31.122047424316406
+ ],
+ "hidden_norms_avg": [
+ 3.9065797328948975,
+ 11.544925689697266,
+ 17.131011962890625,
+ 22.292007446289062,
+ 25.61225128173828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0019258656539022923,
+ 0.00027825392317026854,
+ 0.00017385024693794549,
+ 0.0001323536125710234,
+ 0.00012172113929409534
+ ],
+ "bp_grad_F": [
+ 0.09238748997449875,
+ 0.01207020040601492,
+ 0.007036368828266859,
+ 0.005208354443311691,
+ 0.0047498126514256
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5673828125,
+ "loss_eval": 1.1375834941864014,
+ "epoch": 4
+ },
+ {
+ "hidden_norms_cls": [
+ 0.8784403204917908,
+ 11.689644813537598,
+ 20.318578720092773,
+ 27.47210121154785,
+ 30.616111755371094
+ ],
+ "hidden_norms_avg": [
+ 3.991969585418701,
+ 11.499222755432129,
+ 17.010013580322266,
+ 21.869060516357422,
+ 24.784456253051758
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017466156277805567,
+ 0.00030884172883816063,
+ 0.00018451173673383892,
+ 0.00013519970525521785,
+ 0.00011779358464991674
+ ],
+ "bp_grad_F": [
+ 0.0881652981042862,
+ 0.014197942800819874,
+ 0.008167672902345657,
+ 0.00570154283195734,
+ 0.0048713223077356815
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.611328125,
+ "loss_eval": 1.078152060508728,
+ "epoch": 5
+ },
+ {
+ "hidden_norms_cls": [
+ 0.9501535892486572,
+ 12.59860610961914,
+ 20.491111755371094,
+ 27.280519485473633,
+ 30.350204467773438
+ ],
+ "hidden_norms_avg": [
+ 4.104201793670654,
+ 12.098063468933105,
+ 17.173715591430664,
+ 21.416263580322266,
+ 24.0885066986084
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001603498705662787,
+ 0.0003018827992491424,
+ 0.00017963100981432945,
+ 0.00013513887824956328,
+ 0.00010907831892836839
+ ],
+ "bp_grad_F": [
+ 0.08621370792388916,
+ 0.01517424639314413,
+ 0.008794959634542465,
+ 0.006117440760135651,
+ 0.0050094337202608585
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6337890625,
+ "loss_eval": 1.0198562145233154,
+ "epoch": 6
+ },
+ {
+ "hidden_norms_cls": [
+ 1.000899076461792,
+ 12.766633987426758,
+ 21.096908569335938,
+ 28.377235412597656,
+ 31.630756378173828
+ ],
+ "hidden_norms_avg": [
+ 4.143934726715088,
+ 13.046825408935547,
+ 18.295841217041016,
+ 23.147098541259766,
+ 25.70033836364746
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015043691964820027,
+ 0.00027919537387788296,
+ 0.0001850408734753728,
+ 0.0001339056616416201,
+ 0.00011227549111936241
+ ],
+ "bp_grad_F": [
+ 0.07296615093946457,
+ 0.012746848165988922,
+ 0.00809843186289072,
+ 0.005660817492753267,
+ 0.00492064468562603
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6357421875,
+ "loss_eval": 1.0125277042388916,
+ "epoch": 7
+ },
+ {
+ "hidden_norms_cls": [
+ 1.0544841289520264,
+ 10.223775863647461,
+ 18.59557342529297,
+ 26.47129249572754,
+ 29.77008819580078
+ ],
+ "hidden_norms_avg": [
+ 4.213057994842529,
+ 13.021050453186035,
+ 18.172080993652344,
+ 22.743032455444336,
+ 25.225244522094727
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001364147407002747,
+ 0.0002890345931518823,
+ 0.00017917664081323892,
+ 0.000133156034280546,
+ 0.00011372177687007934
+ ],
+ "bp_grad_F": [
+ 0.07409710437059402,
+ 0.015113108791410923,
+ 0.00921319704502821,
+ 0.006366679444909096,
+ 0.005320113617926836
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6376953125,
+ "loss_eval": 0.9630928039550781,
+ "epoch": 8
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1071640253067017,
+ 12.073644638061523,
+ 19.524917602539062,
+ 26.858781814575195,
+ 30.318849563598633
+ ],
+ "hidden_norms_avg": [
+ 4.280055522918701,
+ 13.520170211791992,
+ 18.620624542236328,
+ 22.658164978027344,
+ 25.25646209716797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012990576215088367,
+ 0.00027366873109713197,
+ 0.00016998387582134455,
+ 0.00012336595682427287,
+ 9.77109739324078e-05
+ ],
+ "bp_grad_F": [
+ 0.07662060856819153,
+ 0.015166237019002438,
+ 0.0096206646412611,
+ 0.006477049086242914,
+ 0.005294579081237316
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.654296875,
+ "loss_eval": 0.9390516877174377,
+ "epoch": 9
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1426520347595215,
+ 12.005794525146484,
+ 20.33642578125,
+ 27.80829429626465,
+ 31.22698974609375
+ ],
+ "hidden_norms_avg": [
+ 4.328567981719971,
+ 13.725446701049805,
+ 19.644866943359375,
+ 23.91346549987793,
+ 26.409910202026367
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012125002685934305,
+ 0.00027867915923707187,
+ 0.00017298922466579825,
+ 0.0001231397909577936,
+ 0.00010014672443503514
+ ],
+ "bp_grad_F": [
+ 0.06728038191795349,
+ 0.014830472879111767,
+ 0.008772061206400394,
+ 0.006222804542630911,
+ 0.00518346531316638
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6708984375,
+ "loss_eval": 0.8987849950790405,
+ "epoch": 10
+ },
+ {
+ "hidden_norms_cls": [
+ 1.182861089706421,
+ 11.343650817871094,
+ 19.158103942871094,
+ 26.537256240844727,
+ 29.248126983642578
+ ],
+ "hidden_norms_avg": [
+ 4.343320846557617,
+ 13.940053939819336,
+ 19.19382667541504,
+ 23.443157196044922,
+ 25.7342529296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012841055868193507,
+ 0.00029811219428665936,
+ 0.00019176788919139653,
+ 0.0001351374085061252,
+ 0.00010611475590849295
+ ],
+ "bp_grad_F": [
+ 0.07373103499412537,
+ 0.015750709921121597,
+ 0.010071114636957645,
+ 0.007257349323481321,
+ 0.00578929902985692
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6708984375,
+ "loss_eval": 0.9137783646583557,
+ "epoch": 11
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2363859415054321,
+ 11.583894729614258,
+ 18.828346252441406,
+ 26.30917739868164,
+ 29.363861083984375
+ ],
+ "hidden_norms_avg": [
+ 4.441896915435791,
+ 13.568662643432617,
+ 18.774181365966797,
+ 22.73027801513672,
+ 24.84675407409668
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011289563262835145,
+ 0.00029387036920525134,
+ 0.0001886928512249142,
+ 0.00013024669897276908,
+ 9.712533210404217e-05
+ ],
+ "bp_grad_F": [
+ 0.06850193440914154,
+ 0.016727343201637268,
+ 0.010432050563395023,
+ 0.00744031835347414,
+ 0.0057919141836464405
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6865234375,
+ "loss_eval": 0.8655319809913635,
+ "epoch": 12
+ },
+ {
+ "hidden_norms_cls": [
+ 1.276246428489685,
+ 11.161674499511719,
+ 18.18111801147461,
+ 24.498512268066406,
+ 28.472366333007812
+ ],
+ "hidden_norms_avg": [
+ 4.438092231750488,
+ 13.71449089050293,
+ 18.358896255493164,
+ 21.998794555664062,
+ 24.44672966003418
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.001100392546504736,
+ 0.0002873367629945278,
+ 0.00018384194117970765,
+ 0.0001337265275651589,
+ 9.951705578714609e-05
+ ],
+ "bp_grad_F": [
+ 0.06749056279659271,
+ 0.01716373674571514,
+ 0.010762249119579792,
+ 0.007881316356360912,
+ 0.005892573855817318
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6982421875,
+ "loss_eval": 0.8163608908653259,
+ "epoch": 13
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3131792545318604,
+ 11.034884452819824,
+ 17.936412811279297,
+ 24.541194915771484,
+ 28.02472496032715
+ ],
+ "hidden_norms_avg": [
+ 4.504117012023926,
+ 13.86273193359375,
+ 18.456012725830078,
+ 22.296085357666016,
+ 24.57513427734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010489820269867778,
+ 0.0002784461830742657,
+ 0.00018129698582924902,
+ 0.00013628850865643471,
+ 0.00010334269609302282
+ ],
+ "bp_grad_F": [
+ 0.06553377211093903,
+ 0.016712775453925133,
+ 0.010981550440192223,
+ 0.007675213273614645,
+ 0.006061363499611616
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.69921875,
+ "loss_eval": 0.8088906407356262,
+ "epoch": 14
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3631325960159302,
+ 10.72367000579834,
+ 17.147600173950195,
+ 23.750171661376953,
+ 26.97018051147461
+ ],
+ "hidden_norms_avg": [
+ 4.5338335037231445,
+ 13.55031967163086,
+ 17.503305435180664,
+ 21.003847122192383,
+ 23.168630599975586
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0010022176429629326,
+ 0.0002914569922722876,
+ 0.00018890199135057628,
+ 0.00013593978655990213,
+ 0.00010251985804643482
+ ],
+ "bp_grad_F": [
+ 0.06372744590044022,
+ 0.017576243728399277,
+ 0.011715950444340706,
+ 0.008481587283313274,
+ 0.006441249046474695
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.701171875,
+ "loss_eval": 0.815929651260376,
+ "epoch": 15
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3926054239273071,
+ 10.609240531921387,
+ 17.234729766845703,
+ 23.659292221069336,
+ 27.24931526184082
+ ],
+ "hidden_norms_avg": [
+ 4.513574600219727,
+ 13.48448371887207,
+ 17.66766929626465,
+ 21.098644256591797,
+ 23.213909149169922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008784966776147485,
+ 0.0002452125190757215,
+ 0.0001629967155167833,
+ 0.00012193062138976529,
+ 8.820713992463425e-05
+ ],
+ "bp_grad_F": [
+ 0.06515656411647797,
+ 0.017664309591054916,
+ 0.011493389494717121,
+ 0.008405888453125954,
+ 0.006338838487863541
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.71875,
+ "loss_eval": 0.7755489349365234,
+ "epoch": 16
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4288005828857422,
+ 9.991934776306152,
+ 16.30902671813965,
+ 22.53181266784668,
+ 25.98328971862793
+ ],
+ "hidden_norms_avg": [
+ 4.606818199157715,
+ 13.761014938354492,
+ 18.061887741088867,
+ 21.805465698242188,
+ 23.856918334960938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008885160204954445,
+ 0.00026409278507344425,
+ 0.0001749310758896172,
+ 0.00012756467913277447,
+ 8.965048618847504e-05
+ ],
+ "bp_grad_F": [
+ 0.07283030450344086,
+ 0.01973560079932213,
+ 0.013354410417377949,
+ 0.009586230851709843,
+ 0.006897584535181522
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.693359375,
+ "loss_eval": 0.8082709908485413,
+ "epoch": 17
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4623849391937256,
+ 9.794211387634277,
+ 16.102649688720703,
+ 21.62982940673828,
+ 25.186201095581055
+ ],
+ "hidden_norms_avg": [
+ 4.6317901611328125,
+ 13.527764320373535,
+ 17.6087589263916,
+ 21.295202255249023,
+ 23.361501693725586
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008634055848233402,
+ 0.0002727442770265043,
+ 0.00018466924666427076,
+ 0.00013278424739837646,
+ 8.995016105473042e-05
+ ],
+ "bp_grad_F": [
+ 0.06913765519857407,
+ 0.02126000076532364,
+ 0.014007972553372383,
+ 0.010056250728666782,
+ 0.00732502993196249
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.720703125,
+ "loss_eval": 0.7786685824394226,
+ "epoch": 18
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4771180152893066,
+ 9.776408195495605,
+ 15.485087394714355,
+ 21.054513931274414,
+ 25.07387351989746
+ ],
+ "hidden_norms_avg": [
+ 4.570744514465332,
+ 13.13935375213623,
+ 16.70624351501465,
+ 20.002471923828125,
+ 22.400487899780273
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008809147984720767,
+ 0.00026235057157464325,
+ 0.0001801249454729259,
+ 0.0001285924663534388,
+ 8.227767830248922e-05
+ ],
+ "bp_grad_F": [
+ 0.07356031239032745,
+ 0.02142982743680477,
+ 0.014684871770441532,
+ 0.010477974079549313,
+ 0.007170504424721003
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7412109375,
+ "loss_eval": 0.7548146843910217,
+ "epoch": 19
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4932866096496582,
+ 9.586905479431152,
+ 15.190006256103516,
+ 20.53044891357422,
+ 23.871917724609375
+ ],
+ "hidden_norms_avg": [
+ 4.640237808227539,
+ 13.333914756774902,
+ 16.603134155273438,
+ 19.70735740661621,
+ 21.712968826293945
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008201555465348065,
+ 0.00025074987206608057,
+ 0.00018013773660641164,
+ 0.0001373633131152019,
+ 8.871335012372583e-05
+ ],
+ "bp_grad_F": [
+ 0.07453557848930359,
+ 0.02180560864508152,
+ 0.015117364004254341,
+ 0.010920760221779346,
+ 0.007648298051208258
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7294921875,
+ "loss_eval": 0.7338082790374756,
+ "epoch": 20
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5380369424819946,
+ 8.941458702087402,
+ 14.383026123046875,
+ 19.64396858215332,
+ 23.333805084228516
+ ],
+ "hidden_norms_avg": [
+ 4.57804012298584,
+ 12.777068138122559,
+ 15.852535247802734,
+ 19.008466720581055,
+ 21.123043060302734
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007403296767733991,
+ 0.00023140048142522573,
+ 0.0001578826195327565,
+ 0.00011260491737630218,
+ 7.754044054308906e-05
+ ],
+ "bp_grad_F": [
+ 0.07555028051137924,
+ 0.024111615493893623,
+ 0.01656532846391201,
+ 0.01178746297955513,
+ 0.007888367399573326
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.744140625,
+ "loss_eval": 0.7344021201133728,
+ "epoch": 21
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5561290979385376,
+ 9.454068183898926,
+ 14.400370597839355,
+ 19.253843307495117,
+ 22.27718734741211
+ ],
+ "hidden_norms_avg": [
+ 4.687749862670898,
+ 12.994861602783203,
+ 15.969095230102539,
+ 18.976381301879883,
+ 20.873851776123047
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008383935783058405,
+ 0.0002680755569599569,
+ 0.000193025975022465,
+ 0.00013935549941379577,
+ 9.83258432825096e-05
+ ],
+ "bp_grad_F": [
+ 0.06634547561407089,
+ 0.021603766828775406,
+ 0.01579204760491848,
+ 0.011702721007168293,
+ 0.008362310007214546
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.734375,
+ "loss_eval": 0.7299590110778809,
+ "epoch": 22
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5774884223937988,
+ 8.741745948791504,
+ 13.803518295288086,
+ 18.90570831298828,
+ 22.218149185180664
+ ],
+ "hidden_norms_avg": [
+ 4.594933032989502,
+ 12.66419506072998,
+ 15.714310646057129,
+ 19.085254669189453,
+ 21.135629653930664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006682098028250039,
+ 0.00022848948719911277,
+ 0.00016414522542618215,
+ 0.0001115989507525228,
+ 7.056116737658158e-05
+ ],
+ "bp_grad_F": [
+ 0.07456765323877335,
+ 0.024261610582470894,
+ 0.01710386760532856,
+ 0.012147205881774426,
+ 0.008177526295185089
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7763671875,
+ "loss_eval": 0.699420154094696,
+ "epoch": 23
+ },
+ {
+ "hidden_norms_cls": [
+ 1.576693058013916,
+ 8.762345314025879,
+ 13.443113327026367,
+ 18.230920791625977,
+ 22.07720375061035
+ ],
+ "hidden_norms_avg": [
+ 4.667433738708496,
+ 12.606098175048828,
+ 15.544108390808105,
+ 18.674053192138672,
+ 20.65712547302246
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006520473980344832,
+ 0.00022687950695399195,
+ 0.0001629517209948972,
+ 0.00011739470210159197,
+ 7.377319707302377e-05
+ ],
+ "bp_grad_F": [
+ 0.08037886768579483,
+ 0.026545122265815735,
+ 0.0190938338637352,
+ 0.013439938426017761,
+ 0.00869175884872675
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7353515625,
+ "loss_eval": 0.733207106590271,
+ "epoch": 24
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5915056467056274,
+ 8.431538581848145,
+ 13.075739860534668,
+ 17.782840728759766,
+ 20.799991607666016
+ ],
+ "hidden_norms_avg": [
+ 4.626980304718018,
+ 12.152971267700195,
+ 14.936114311218262,
+ 18.13477325439453,
+ 19.853097915649414
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007118558278307319,
+ 0.00024262107035610825,
+ 0.0001753592659952119,
+ 0.00012127246736781672,
+ 7.87421886343509e-05
+ ],
+ "bp_grad_F": [
+ 0.0734892264008522,
+ 0.025602566078305244,
+ 0.018658706918358803,
+ 0.013666817918419838,
+ 0.009108936414122581
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7578125,
+ "loss_eval": 0.6893049478530884,
+ "epoch": 25
+ },
+ {
+ "hidden_norms_cls": [
+ 1.589570164680481,
+ 8.064777374267578,
+ 12.609880447387695,
+ 17.195837020874023,
+ 20.27288818359375
+ ],
+ "hidden_norms_avg": [
+ 4.651576995849609,
+ 12.02392578125,
+ 14.5856351852417,
+ 17.578563690185547,
+ 19.327190399169922
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006660808576270938,
+ 0.0002373493480263278,
+ 0.0001695255923550576,
+ 0.00012064678594470024,
+ 7.89113255450502e-05
+ ],
+ "bp_grad_F": [
+ 0.08072065562009811,
+ 0.02827218733727932,
+ 0.020335549488663673,
+ 0.014427169226109982,
+ 0.009556911885738373
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.755859375,
+ "loss_eval": 0.7047942876815796,
+ "epoch": 26
+ },
+ {
+ "hidden_norms_cls": [
+ 1.6077263355255127,
+ 7.734760284423828,
+ 11.882841110229492,
+ 15.991426467895508,
+ 19.111549377441406
+ ],
+ "hidden_norms_avg": [
+ 4.672310829162598,
+ 11.994673728942871,
+ 14.48837661743164,
+ 16.922487258911133,
+ 18.498437881469727
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005716760642826557,
+ 0.00020494087948463857,
+ 0.0001548439176985994,
+ 0.00011144367454107851,
+ 6.537805165862665e-05
+ ],
+ "bp_grad_F": [
+ 0.08237622678279877,
+ 0.03036416694521904,
+ 0.022357620298862457,
+ 0.01651921682059765,
+ 0.010484294034540653
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7548828125,
+ "loss_eval": 0.6863161325454712,
+ "epoch": 27
+ },
+ {
+ "hidden_norms_cls": [
+ 1.6167913675308228,
+ 7.661223411560059,
+ 11.857555389404297,
+ 16.11384391784668,
+ 19.207155227661133
+ ],
+ "hidden_norms_avg": [
+ 4.6568603515625,
+ 11.916447639465332,
+ 14.127670288085938,
+ 16.765464782714844,
+ 18.548715591430664
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006015675025992095,
+ 0.00022187062131706625,
+ 0.00015665855607949197,
+ 0.00011372221342753619,
+ 6.673130701528862e-05
+ ],
+ "bp_grad_F": [
+ 0.08522997796535492,
+ 0.03222256526350975,
+ 0.023626696318387985,
+ 0.01693013124167919,
+ 0.010611210018396378
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.75390625,
+ "loss_eval": 0.6998279094696045,
+ "epoch": 28
+ },
+ {
+ "hidden_norms_cls": [
+ 1.6032800674438477,
+ 7.3315229415893555,
+ 11.458590507507324,
+ 15.827820777893066,
+ 19.03597640991211
+ ],
+ "hidden_norms_avg": [
+ 4.592748641967773,
+ 11.431793212890625,
+ 13.694733619689941,
+ 16.380725860595703,
+ 17.913341522216797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006015695980750024,
+ 0.00023376141325570643,
+ 0.00015724304830655456,
+ 0.00010976113844662905,
+ 6.412796210497618e-05
+ ],
+ "bp_grad_F": [
+ 0.09064542502164841,
+ 0.03456525132060051,
+ 0.02491987682878971,
+ 0.01721413992345333,
+ 0.010797572322189808
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7734375,
+ "loss_eval": 0.6845672130584717,
+ "epoch": 29
+ },
+ {
+ "hidden_norms_cls": [
+ 1.6067036390304565,
+ 7.343894004821777,
+ 11.072548866271973,
+ 15.027584075927734,
+ 17.731834411621094
+ ],
+ "hidden_norms_avg": [
+ 4.656601428985596,
+ 11.393535614013672,
+ 13.465471267700195,
+ 15.975980758666992,
+ 17.53518295288086
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005384382093325257,
+ 0.00021189975086599588,
+ 0.0001552984758745879,
+ 0.00010658086830517277,
+ 6.326750008156523e-05
+ ],
+ "bp_grad_F": [
+ 0.08886278420686722,
+ 0.03500310331583023,
+ 0.025932280346751213,
+ 0.018638672307133675,
+ 0.011571940965950489
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7666015625,
+ "loss_eval": 0.6816176772117615,
+ "epoch": 30
+ },
+ {
+ "hidden_norms_cls": [
+ 1.6034201383590698,
+ 7.28795051574707,
+ 10.777915000915527,
+ 14.885525703430176,
+ 17.61635398864746
+ ],
+ "hidden_norms_avg": [
+ 4.614856719970703,
+ 11.156272888183594,
+ 13.103291511535645,
+ 15.514464378356934,
+ 16.799636840820312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005928887985646725,
+ 0.0002398774668108672,
+ 0.00018353872292209417,
+ 0.00012629387492779642,
+ 8.196983981179073e-05
+ ],
+ "bp_grad_F": [
+ 0.09026212245225906,
+ 0.03624382242560387,
+ 0.027555860579013824,
+ 0.019604889675974846,
+ 0.012266743928194046
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7578125,
+ "loss_eval": 0.6996170878410339,
+ "epoch": 31
+ },
+ {
+ "hidden_norms_cls": [
+ 1.611714243888855,
+ 7.183743953704834,
+ 10.724074363708496,
+ 14.5570650100708,
+ 17.022544860839844
+ ],
+ "hidden_norms_avg": [
+ 4.623075485229492,
+ 11.19589614868164,
+ 13.009132385253906,
+ 15.365489959716797,
+ 16.62962532043457
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00036223753704689443,
+ 0.00014417112106457353,
+ 0.00010984936670865864,
+ 8.023829286685213e-05,
+ 4.624977009370923e-05
+ ],
+ "bp_grad_F": [
+ 0.09605100005865097,
+ 0.03848516568541527,
+ 0.029046298936009407,
+ 0.021008647978305817,
+ 0.012804670259356499
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7666015625,
+ "loss_eval": 0.6707476377487183,
+ "epoch": 32
+ },
+ {
+ "hidden_norms_cls": [
+ 1.6100214719772339,
+ 6.872183322906494,
+ 10.294036865234375,
+ 14.205705642700195,
+ 17.145418167114258
+ ],
+ "hidden_norms_avg": [
+ 4.6112518310546875,
+ 11.086106300354004,
+ 12.928976058959961,
+ 15.350056648254395,
+ 16.69057846069336
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00041789902024902403,
+ 0.00017518684035167098,
+ 0.0001297849084949121,
+ 8.867425640346482e-05,
+ 4.886053648078814e-05
+ ],
+ "bp_grad_F": [
+ 0.10439282655715942,
+ 0.04290134832262993,
+ 0.03223341330885887,
+ 0.02269606664776802,
+ 0.013486144132912159
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.759765625,
+ "loss_eval": 0.7303465604782104,
+ "epoch": 33
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5996708869934082,
+ 6.756699085235596,
+ 9.930717468261719,
+ 13.55428695678711,
+ 16.25560188293457
+ ],
+ "hidden_norms_avg": [
+ 4.561036109924316,
+ 10.72261905670166,
+ 12.331817626953125,
+ 14.622406005859375,
+ 16.10407829284668
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004882134380750358,
+ 0.0002138838026439771,
+ 0.00016901774506550282,
+ 0.0001125320850405842,
+ 6.579834007425234e-05
+ ],
+ "bp_grad_F": [
+ 0.10555483400821686,
+ 0.043922487646341324,
+ 0.03336327522993088,
+ 0.02399253286421299,
+ 0.013897648081183434
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7744140625,
+ "loss_eval": 0.71100252866745,
+ "epoch": 34
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5904232263565063,
+ 6.662050247192383,
+ 9.66409683227539,
+ 13.113885879516602,
+ 15.527644157409668
+ ],
+ "hidden_norms_avg": [
+ 4.5454936027526855,
+ 10.621905326843262,
+ 12.306397438049316,
+ 14.576898574829102,
+ 15.954529762268066
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004819612659048289,
+ 0.00020982844580430537,
+ 0.00015760491078253835,
+ 0.00010895934246946126,
+ 5.958566543995403e-05
+ ],
+ "bp_grad_F": [
+ 0.10991083830595016,
+ 0.047212228178977966,
+ 0.03634340688586235,
+ 0.02575613744556904,
+ 0.014786512590944767
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7705078125,
+ "loss_eval": 0.7015272378921509,
+ "epoch": 35
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5926766395568848,
+ 6.752022743225098,
+ 9.809683799743652,
+ 13.14870548248291,
+ 15.66618537902832
+ ],
+ "hidden_norms_avg": [
+ 4.554390907287598,
+ 10.59433650970459,
+ 12.38070011138916,
+ 14.597192764282227,
+ 15.870081901550293
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00043442551395855844,
+ 0.0001767174544511363,
+ 0.0001353291590930894,
+ 9.88640749710612e-05,
+ 5.115106250741519e-05
+ ],
+ "bp_grad_F": [
+ 0.11412353813648224,
+ 0.04936130344867706,
+ 0.03786878660321236,
+ 0.027230119332671165,
+ 0.015144454315304756
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7734375,
+ "loss_eval": 0.7246569395065308,
+ "epoch": 36
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5873360633850098,
+ 6.424077987670898,
+ 9.43139934539795,
+ 12.677597999572754,
+ 15.172491073608398
+ ],
+ "hidden_norms_avg": [
+ 4.4964070320129395,
+ 10.287262916564941,
+ 11.751147270202637,
+ 13.867583274841309,
+ 15.24795150756836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004166838189121336,
+ 0.0001985515555134043,
+ 0.00014922211994417012,
+ 0.0001073441599146463,
+ 5.765057721873745e-05
+ ],
+ "bp_grad_F": [
+ 0.11522030830383301,
+ 0.05126715078949928,
+ 0.039791759103536606,
+ 0.028239542618393898,
+ 0.015849631279706955
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.76953125,
+ "loss_eval": 0.7268451452255249,
+ "epoch": 37
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5890607833862305,
+ 6.295929431915283,
+ 9.119135856628418,
+ 12.20608901977539,
+ 14.642122268676758
+ ],
+ "hidden_norms_avg": [
+ 4.5021796226501465,
+ 10.095436096191406,
+ 11.7933988571167,
+ 13.924290657043457,
+ 15.25149917602539
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004105751868337393,
+ 0.00017681249300949275,
+ 0.00014306302182376385,
+ 9.77686358965002e-05,
+ 5.147796036908403e-05
+ ],
+ "bp_grad_F": [
+ 0.12662801146507263,
+ 0.057947222143411636,
+ 0.044759348034858704,
+ 0.03212600201368332,
+ 0.017064588144421577
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7587890625,
+ "loss_eval": 0.7464388012886047,
+ "epoch": 38
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5761758089065552,
+ 6.18004846572876,
+ 9.069403648376465,
+ 12.180702209472656,
+ 14.516327857971191
+ ],
+ "hidden_norms_avg": [
+ 4.492326736450195,
+ 9.971968650817871,
+ 11.50478744506836,
+ 13.5086669921875,
+ 14.760706901550293
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003273288893979043,
+ 0.00015071693633217365,
+ 0.00011665018246276304,
+ 8.30927092465572e-05,
+ 4.371673639980145e-05
+ ],
+ "bp_grad_F": [
+ 0.1212363913655281,
+ 0.055609479546546936,
+ 0.04309426248073578,
+ 0.0311796423047781,
+ 0.016882745549082756
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7783203125,
+ "loss_eval": 0.7176246643066406,
+ "epoch": 39
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5679142475128174,
+ 6.109372615814209,
+ 8.818140029907227,
+ 11.853668212890625,
+ 14.200343132019043
+ ],
+ "hidden_norms_avg": [
+ 4.478363037109375,
+ 9.777668952941895,
+ 11.217857360839844,
+ 13.170299530029297,
+ 14.35566520690918
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003435175749473274,
+ 0.00015563883061986417,
+ 0.00011927648301934823,
+ 8.298752072732896e-05,
+ 4.157157673034817e-05
+ ],
+ "bp_grad_F": [
+ 0.13136376440525055,
+ 0.06076597049832344,
+ 0.046719472855329514,
+ 0.033368490636348724,
+ 0.01777712069451809
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.78125,
+ "loss_eval": 0.7149413228034973,
+ "epoch": 40
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5576080083847046,
+ 6.149768829345703,
+ 8.711091041564941,
+ 11.498035430908203,
+ 13.903903007507324
+ ],
+ "hidden_norms_avg": [
+ 4.435859680175781,
+ 9.742182731628418,
+ 10.966800689697266,
+ 12.826833724975586,
+ 13.987249374389648
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002820935333147645,
+ 0.00013546310947276652,
+ 0.00010691316856537014,
+ 7.935341272968799e-05,
+ 4.027710747322999e-05
+ ],
+ "bp_grad_F": [
+ 0.1424364149570465,
+ 0.0660286620259285,
+ 0.05190045386552811,
+ 0.037452246993780136,
+ 0.019488148391246796
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.759765625,
+ "loss_eval": 0.7794969081878662,
+ "epoch": 41
+ },
+ {
+ "hidden_norms_cls": [
+ 1.55929696559906,
+ 6.027406215667725,
+ 8.56254768371582,
+ 11.315313339233398,
+ 13.816405296325684
+ ],
+ "hidden_norms_avg": [
+ 4.444095611572266,
+ 9.598461151123047,
+ 11.017721176147461,
+ 12.939472198486328,
+ 14.150469779968262
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028881963226012886,
+ 0.00014081982953939587,
+ 0.00010864014620892704,
+ 7.903494406491518e-05,
+ 3.460505831753835e-05
+ ],
+ "bp_grad_F": [
+ 0.14435029029846191,
+ 0.06792720407247543,
+ 0.05288391932845116,
+ 0.03809889778494835,
+ 0.0192741546779871
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7783203125,
+ "loss_eval": 0.7500836253166199,
+ "epoch": 42
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5569288730621338,
+ 5.83992338180542,
+ 8.285759925842285,
+ 11.15902328491211,
+ 13.44404125213623
+ ],
+ "hidden_norms_avg": [
+ 4.416918754577637,
+ 9.525116920471191,
+ 10.900503158569336,
+ 12.753186225891113,
+ 13.810358047485352
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003584402147680521,
+ 0.00016757070261519402,
+ 0.000135006892378442,
+ 8.858168439473957e-05,
+ 4.690655987360515e-05
+ ],
+ "bp_grad_F": [
+ 0.14751866459846497,
+ 0.07057010382413864,
+ 0.05518123507499695,
+ 0.039941366761922836,
+ 0.019994540140032768
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.783203125,
+ "loss_eval": 0.7740926146507263,
+ "epoch": 43
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5507482290267944,
+ 5.7182297706604,
+ 8.143424034118652,
+ 10.900334358215332,
+ 13.179159164428711
+ ],
+ "hidden_norms_avg": [
+ 4.415921688079834,
+ 9.42380142211914,
+ 10.672327995300293,
+ 12.439417839050293,
+ 13.481410026550293
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002743537479545921,
+ 0.00013802653120364994,
+ 0.00010440178448334336,
+ 7.395831926260144e-05,
+ 3.546295192791149e-05
+ ],
+ "bp_grad_F": [
+ 0.15799099206924438,
+ 0.0763181671500206,
+ 0.060047682374715805,
+ 0.043460771441459656,
+ 0.02125636488199234
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.78125,
+ "loss_eval": 0.7693630456924438,
+ "epoch": 44
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5424573421478271,
+ 5.688177585601807,
+ 7.995815753936768,
+ 10.642090797424316,
+ 12.71364688873291
+ ],
+ "hidden_norms_avg": [
+ 4.399099349975586,
+ 9.228434562683105,
+ 10.541167259216309,
+ 12.30521297454834,
+ 13.311983108520508
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00024789522285573184,
+ 0.0001290303043788299,
+ 9.614775626687333e-05,
+ 6.680067599518225e-05,
+ 3.041914533241652e-05
+ ],
+ "bp_grad_F": [
+ 0.16617916524410248,
+ 0.08274275809526443,
+ 0.06457101553678513,
+ 0.04608331620693207,
+ 0.02214660868048668
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.77734375,
+ "loss_eval": 0.7963705062866211,
+ "epoch": 45
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5373201370239258,
+ 5.651702880859375,
+ 7.870075702667236,
+ 10.383352279663086,
+ 12.742950439453125
+ ],
+ "hidden_norms_avg": [
+ 4.359274387359619,
+ 9.120989799499512,
+ 10.328361511230469,
+ 11.979691505432129,
+ 13.047332763671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00020789829432033002,
+ 0.00010236673551844433,
+ 8.31241559353657e-05,
+ 5.5589163821423426e-05,
+ 2.5046059818123467e-05
+ ],
+ "bp_grad_F": [
+ 0.1711728274822235,
+ 0.08452030271291733,
+ 0.06641850620508194,
+ 0.048034753650426865,
+ 0.022233933210372925
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.796875,
+ "loss_eval": 0.787158727645874,
+ "epoch": 46
+ },
+ {
+ "hidden_norms_cls": [
+ 1.534119725227356,
+ 5.64213752746582,
+ 7.87826681137085,
+ 10.351583480834961,
+ 12.802285194396973
+ ],
+ "hidden_norms_avg": [
+ 4.381091594696045,
+ 9.210761070251465,
+ 10.374320030212402,
+ 12.017292976379395,
+ 13.094472885131836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00020434240286704153,
+ 9.69645261648111e-05,
+ 7.39863608032465e-05,
+ 5.592328670900315e-05,
+ 2.489626240276266e-05
+ ],
+ "bp_grad_F": [
+ 0.17339713871479034,
+ 0.08632633090019226,
+ 0.06861955672502518,
+ 0.05006933584809303,
+ 0.022428762167692184
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7919921875,
+ "loss_eval": 0.7851632833480835,
+ "epoch": 47
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5289297103881836,
+ 5.52672004699707,
+ 7.675796985626221,
+ 10.204718589782715,
+ 12.873387336730957
+ ],
+ "hidden_norms_avg": [
+ 4.3382954597473145,
+ 8.994754791259766,
+ 10.112909317016602,
+ 11.741432189941406,
+ 12.863862037658691
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001689869095571339,
+ 8.723067730898038e-05,
+ 6.962454062886536e-05,
+ 4.9918842705665156e-05,
+ 2.0077559383935295e-05
+ ],
+ "bp_grad_F": [
+ 0.1893138736486435,
+ 0.09529414772987366,
+ 0.07472710311412811,
+ 0.053626082837581635,
+ 0.023708311840891838
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7802734375,
+ "loss_eval": 0.8306612968444824,
+ "epoch": 48
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5282790660858154,
+ 5.412533760070801,
+ 7.559310436248779,
+ 10.040712356567383,
+ 12.344849586486816
+ ],
+ "hidden_norms_avg": [
+ 4.344850063323975,
+ 8.943357467651367,
+ 10.036619186401367,
+ 11.63318157196045,
+ 12.690427780151367
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015994974819477648,
+ 8.589095523348078e-05,
+ 6.632162694586441e-05,
+ 4.7776728024473414e-05,
+ 1.923311901919078e-05
+ ],
+ "bp_grad_F": [
+ 0.19004860520362854,
+ 0.09673094749450684,
+ 0.07585947215557098,
+ 0.05484768748283386,
+ 0.02464146539568901
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7880859375,
+ "loss_eval": 0.8193543553352356,
+ "epoch": 49
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5247719287872314,
+ 5.414742469787598,
+ 7.496610164642334,
+ 9.884673118591309,
+ 12.301740646362305
+ ],
+ "hidden_norms_avg": [
+ 4.334397792816162,
+ 8.873777389526367,
+ 9.937097549438477,
+ 11.524014472961426,
+ 12.564128875732422
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00016137116472236812,
+ 8.459146192763001e-05,
+ 7.113611354725435e-05,
+ 4.750298467115499e-05,
+ 1.9900418919860385e-05
+ ],
+ "bp_grad_F": [
+ 0.1871533840894699,
+ 0.09687218815088272,
+ 0.0768747329711914,
+ 0.05509059876203537,
+ 0.024593451991677284
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.80078125,
+ "loss_eval": 0.810278058052063,
+ "epoch": 50
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5175530910491943,
+ 5.423762798309326,
+ 7.493518352508545,
+ 9.848480224609375,
+ 12.152653694152832
+ ],
+ "hidden_norms_avg": [
+ 4.333771228790283,
+ 8.846830368041992,
+ 9.895172119140625,
+ 11.470880508422852,
+ 12.51230239868164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00018688049749471247,
+ 9.502686589257792e-05,
+ 7.833576091798022e-05,
+ 5.505367516889237e-05,
+ 2.1109613953740336e-05
+ ],
+ "bp_grad_F": [
+ 0.19925038516521454,
+ 0.10273440927267075,
+ 0.08146088570356369,
+ 0.05800405889749527,
+ 0.025326546281576157
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.79296875,
+ "loss_eval": 0.8315975069999695,
+ "epoch": 51
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5154390335083008,
+ 5.332769870758057,
+ 7.351593971252441,
+ 9.726226806640625,
+ 12.217824935913086
+ ],
+ "hidden_norms_avg": [
+ 4.312089443206787,
+ 8.77189826965332,
+ 9.80828857421875,
+ 11.376079559326172,
+ 12.424320220947266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001625730947125703,
+ 8.300685294670984e-05,
+ 6.064521585358307e-05,
+ 4.498598718782887e-05,
+ 1.878884904726874e-05
+ ],
+ "bp_grad_F": [
+ 0.20003639161586761,
+ 0.10495735704898834,
+ 0.08297032862901688,
+ 0.059033025056123734,
+ 0.02547283098101616
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7890625,
+ "loss_eval": 0.8281288146972656,
+ "epoch": 52
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5136713981628418,
+ 5.367674827575684,
+ 7.355134963989258,
+ 9.682082176208496,
+ 12.047696113586426
+ ],
+ "hidden_norms_avg": [
+ 4.316784381866455,
+ 8.783827781677246,
+ 9.812792778015137,
+ 11.395760536193848,
+ 12.420063018798828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00016071743448264897,
+ 7.887884567026049e-05,
+ 6.097723598941229e-05,
+ 4.243743751430884e-05,
+ 1.8102018657373264e-05
+ ],
+ "bp_grad_F": [
+ 0.20199808478355408,
+ 0.10541712492704391,
+ 0.0835103914141655,
+ 0.05967256799340248,
+ 0.025771932676434517
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7890625,
+ "loss_eval": 0.8389135599136353,
+ "epoch": 53
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5129119157791138,
+ 5.326069355010986,
+ 7.275172233581543,
+ 9.633310317993164,
+ 12.064473152160645
+ ],
+ "hidden_norms_avg": [
+ 4.308472633361816,
+ 8.717856407165527,
+ 9.717677116394043,
+ 11.28734016418457,
+ 12.3176851272583
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015608215471729636,
+ 8.108095789793879e-05,
+ 6.294465129030868e-05,
+ 4.2116138502024114e-05,
+ 1.7733293134369887e-05
+ ],
+ "bp_grad_F": [
+ 0.20727074146270752,
+ 0.10958535224199295,
+ 0.08667060732841492,
+ 0.06113011762499809,
+ 0.026037005707621574
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.787109375,
+ "loss_eval": 0.8504288792610168,
+ "epoch": 54
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5120813846588135,
+ 5.313214302062988,
+ 7.253427982330322,
+ 9.583664894104004,
+ 12.01283073425293
+ ],
+ "hidden_norms_avg": [
+ 4.303354263305664,
+ 8.709893226623535,
+ 9.714727401733398,
+ 11.287162780761719,
+ 12.301621437072754
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014261712203733623,
+ 8.006545249372721e-05,
+ 6.104232306824997e-05,
+ 4.1361305193277076e-05,
+ 1.670202073000837e-05
+ ],
+ "bp_grad_F": [
+ 0.20587928593158722,
+ 0.10970292240381241,
+ 0.0869779959321022,
+ 0.06163511052727699,
+ 0.02630491554737091
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7919921875,
+ "loss_eval": 0.8500803709030151,
+ "epoch": 55
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5113301277160645,
+ 5.33270263671875,
+ 7.255039215087891,
+ 9.560588836669922,
+ 11.935233116149902
+ ],
+ "hidden_norms_avg": [
+ 4.311485767364502,
+ 8.737537384033203,
+ 9.710383415222168,
+ 11.27385425567627,
+ 12.309149742126465
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014448253205046058,
+ 7.629570609424263e-05,
+ 6.040706284693442e-05,
+ 4.236707536620088e-05,
+ 1.7641770682530478e-05
+ ],
+ "bp_grad_F": [
+ 0.20638784766197205,
+ 0.10957971960306168,
+ 0.08719436824321747,
+ 0.06181200593709946,
+ 0.026369713246822357
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7900390625,
+ "loss_eval": 0.8525989055633545,
+ "epoch": 56
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5115892887115479,
+ 5.313480377197266,
+ 7.247244834899902,
+ 9.550230979919434,
+ 11.989883422851562
+ ],
+ "hidden_norms_avg": [
+ 4.3022141456604,
+ 8.688987731933594,
+ 9.685582160949707,
+ 11.234566688537598,
+ 12.270132064819336
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001483379164710641,
+ 7.948598067741841e-05,
+ 6.1946535424795e-05,
+ 4.4680935388896614e-05,
+ 1.6852744010975584e-05
+ ],
+ "bp_grad_F": [
+ 0.21088635921478271,
+ 0.11181779950857162,
+ 0.08855349570512772,
+ 0.06269123405218124,
+ 0.026410162448883057
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7890625,
+ "loss_eval": 0.8474454879760742,
+ "epoch": 57
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5110703706741333,
+ 5.306856632232666,
+ 7.230412483215332,
+ 9.542105674743652,
+ 11.942556381225586
+ ],
+ "hidden_norms_avg": [
+ 4.305404186248779,
+ 8.697504997253418,
+ 9.679413795471191,
+ 11.226194381713867,
+ 12.25047492980957
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014003549586050212,
+ 7.460260530933738e-05,
+ 6.204132660059258e-05,
+ 3.912465035682544e-05,
+ 1.6441039406345226e-05
+ ],
+ "bp_grad_F": [
+ 0.20991134643554688,
+ 0.11143218725919724,
+ 0.08832813799381256,
+ 0.06269684433937073,
+ 0.026480402797460556
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.791015625,
+ "loss_eval": 0.8496487140655518,
+ "epoch": 58
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5111491680145264,
+ 5.304075717926025,
+ 7.234795093536377,
+ 9.53318977355957,
+ 11.964473724365234
+ ],
+ "hidden_norms_avg": [
+ 4.304405689239502,
+ 8.697833061218262,
+ 9.683843612670898,
+ 11.22890853881836,
+ 12.259684562683105
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014237761206459254,
+ 7.472094148397446e-05,
+ 5.683211929863319e-05,
+ 4.049929339089431e-05,
+ 1.4964447473175824e-05
+ ],
+ "bp_grad_F": [
+ 0.21009324491024017,
+ 0.11155029386281967,
+ 0.08846566081047058,
+ 0.06290413439273834,
+ 0.026488499715924263
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.794921875,
+ "loss_eval": 0.8498167395591736,
+ "epoch": 59
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5111573934555054,
+ 5.304897785186768,
+ 7.23397970199585,
+ 9.53254508972168,
+ 11.969621658325195
+ ],
+ "hidden_norms_avg": [
+ 4.304327964782715,
+ 8.696623802185059,
+ 9.681411743164062,
+ 11.225934982299805,
+ 12.255182266235352
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001376860454911366,
+ 7.4876043072436e-05,
+ 5.8659916248871014e-05,
+ 4.048796836286783e-05,
+ 1.5446972611243837e-05
+ ],
+ "bp_grad_F": [
+ 0.210032656788826,
+ 0.11159469932317734,
+ 0.08847951143980026,
+ 0.06288634985685349,
+ 0.02649829164147377
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.791015625,
+ "loss_eval": 0.8496516942977905,
+ "epoch": 60
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms_cls": [
+ 0.3042769432067871,
+ 3.2273340225219727,
+ 4.6926493644714355,
+ 6.003997802734375,
+ 6.652705669403076
+ ],
+ "hidden_norms_avg": [
+ 6.027750492095947,
+ 7.1044697761535645,
+ 7.910475730895996,
+ 8.79189682006836,
+ 9.458833694458008
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.005248428788036108,
+ 0.0012287507997825742,
+ 0.0010387187357991934,
+ 0.0009678652859292924,
+ 0.0009174557635560632
+ ],
+ "bp_grad_F": [
+ 0.248850479722023,
+ 0.0424945093691349,
+ 0.0348997563123703,
+ 0.03202275559306145,
+ 0.030239813029766083
+ ],
+ "gamma_dfa": -0.0027123973850393668,
+ "gamma_dfa_per_layer": [
+ -0.0010305923642590642,
+ -0.01111956313252449,
+ 0.0014823779929429293,
+ -0.00018181203631684184
+ ],
+ "acc_eval": 0.0791015625,
+ "loss_eval": 2.544933319091797,
+ "epoch": 0
+ },
+ {
+ "hidden_norms_cls": [
+ 1.8898234367370605,
+ 1755.5985107421875,
+ 3812.865966796875,
+ 4063.967529296875,
+ 6749.62646484375
+ ],
+ "hidden_norms_avg": [
+ 48.02373504638672,
+ 2610.970458984375,
+ 7442.5693359375,
+ 13001.9443359375,
+ 19569.59765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006367825553752482,
+ 1.061867237694969e-06,
+ 9.113553005590802e-07,
+ 8.042399599617056e-07,
+ 7.901451226643985e-07
+ ],
+ "bp_grad_F": [
+ 0.11358296871185303,
+ 5.570299981627613e-05,
+ 4.605366484611295e-05,
+ 3.752685370272957e-05,
+ 3.027659113286063e-05
+ ],
+ "gamma_dfa": 0.007312511210329831,
+ "gamma_dfa_per_layer": [
+ 0.01007317565381527,
+ 0.008024577051401138,
+ 0.008248038589954376,
+ 0.0029042535461485386
+ ],
+ "acc_eval": 0.2333984375,
+ "loss_eval": 2.0879125595092773,
+ "epoch": 1
+ },
+ {
+ "hidden_norms_cls": [
+ 3.704786777496338,
+ 7219.806640625,
+ 19592.4140625,
+ 21808.44921875,
+ 46117.11328125
+ ],
+ "hidden_norms_avg": [
+ 97.33866882324219,
+ 9787.240234375,
+ 35216.66015625,
+ 64377.67578125,
+ 97116.8125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.637367475079373e-05,
+ 1.6794896851024532e-07,
+ 1.5954641696680483e-07,
+ 1.4061814113119908e-07,
+ 1.445507677999558e-07
+ ],
+ "bp_grad_F": [
+ 0.04642009362578392,
+ 2.128358573827427e-05,
+ 2.0123250578762963e-05,
+ 6.922710781509522e-06,
+ 6.6381039687257726e-06
+ ],
+ "gamma_dfa": 0.007922766148112714,
+ "gamma_dfa_per_layer": [
+ 0.016379408538341522,
+ 0.005931380204856396,
+ 0.007020577322691679,
+ 0.0023596985265612602
+ ],
+ "acc_eval": 0.205078125,
+ "loss_eval": 2.1287283897399902,
+ "epoch": 2
+ },
+ {
+ "hidden_norms_cls": [
+ 5.554904937744141,
+ 16081.3388671875,
+ 48028.96875,
+ 51717.93359375,
+ 100197.7265625
+ ],
+ "hidden_norms_avg": [
+ 147.4190216064453,
+ 22860.939453125,
+ 90670.5078125,
+ 172520.15625,
+ 247624.09375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.051399289688561e-05,
+ 9.248702070863146e-08,
+ 7.303499671706959e-08,
+ 6.487525183729304e-08,
+ 6.620962977876843e-08
+ ],
+ "bp_grad_F": [
+ 0.034720927476882935,
+ 1.6823112673591822e-05,
+ 1.1384844583517406e-05,
+ 3.0318508379423292e-06,
+ 2.624829903652426e-06
+ ],
+ "gamma_dfa": 0.0067759081866825,
+ "gamma_dfa_per_layer": [
+ 0.014651123434305191,
+ 0.004187515936791897,
+ 0.007594288792461157,
+ 0.0006707045831717551
+ ],
+ "acc_eval": 0.20703125,
+ "loss_eval": 2.107574462890625,
+ "epoch": 3
+ },
+ {
+ "hidden_norms_cls": [
+ 7.38655424118042,
+ 30113.763671875,
+ 92815.4375,
+ 102848.4453125,
+ 183389.40625
+ ],
+ "hidden_norms_avg": [
+ 194.20396423339844,
+ 39156.78515625,
+ 166144.453125,
+ 360300.25,
+ 500574.96875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.7757007046602666e-05,
+ 6.177719313882335e-08,
+ 4.3474216226968565e-08,
+ 3.8972562066419414e-08,
+ 3.9463689205376795e-08
+ ],
+ "bp_grad_F": [
+ 0.03289186581969261,
+ 5.563175363931805e-06,
+ 2.151713033526903e-06,
+ 1.463158696424216e-06,
+ 1.3795681752526434e-06
+ ],
+ "gamma_dfa": 0.006396490931365406,
+ "gamma_dfa_per_layer": [
+ 0.015158161520957947,
+ 0.0035972977057099342,
+ 0.006714952643960714,
+ 0.00011555185483302921
+ ],
+ "acc_eval": 0.203125,
+ "loss_eval": 2.1379737854003906,
+ "epoch": 4
+ },
+ {
+ "hidden_norms_cls": [
+ 9.15835189819336,
+ 53591.8984375,
+ 170615.734375,
+ 181427.171875,
+ 289063.5625
+ ],
+ "hidden_norms_avg": [
+ 238.28347778320312,
+ 61062.31640625,
+ 250187.6875,
+ 548101.3125,
+ 724058.1875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.960537312901579e-05,
+ 4.670241438020639e-08,
+ 3.080446120407032e-08,
+ 2.670985388419922e-08,
+ 2.6331489877406966e-08
+ ],
+ "bp_grad_F": [
+ 0.016260992735624313,
+ 4.766869551531272e-06,
+ 2.067620698653627e-06,
+ 9.787106591829797e-07,
+ 8.912123234949831e-07
+ ],
+ "gamma_dfa": 0.0068261599517427385,
+ "gamma_dfa_per_layer": [
+ 0.014116348698735237,
+ 0.003242844482883811,
+ 0.008411802351474762,
+ 0.0015336442738771439
+ ],
+ "acc_eval": 0.1962890625,
+ "loss_eval": 2.1309733390808105,
+ "epoch": 5
+ },
+ {
+ "hidden_norms_cls": [
+ 10.888343811035156,
+ 91755.1171875,
+ 249917.8125,
+ 274005.3125,
+ 444277.53125
+ ],
+ "hidden_norms_avg": [
+ 276.9202880859375,
+ 104021.7109375,
+ 349872.5,
+ 931915.875,
+ 1222273.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.7342781322658993e-05,
+ 3.6854661544794e-08,
+ 2.4993127567540796e-08,
+ 1.8662358769461207e-08,
+ 1.7811659702715588e-08
+ ],
+ "bp_grad_F": [
+ 0.022468894720077515,
+ 3.493201802484691e-06,
+ 1.1520894531713566e-06,
+ 7.113425795068906e-07,
+ 6.108040793151304e-07
+ ],
+ "gamma_dfa": 0.007193240569904447,
+ "gamma_dfa_per_layer": [
+ 0.017048656940460205,
+ 0.002665129955857992,
+ 0.007390158250927925,
+ 0.001669017132371664
+ ],
+ "acc_eval": 0.2109375,
+ "loss_eval": 2.1020355224609375,
+ "epoch": 6
+ },
+ {
+ "hidden_norms_cls": [
+ 12.623483657836914,
+ 158915.890625,
+ 360070.6875,
+ 406906.3125,
+ 630641.3125
+ ],
+ "hidden_norms_avg": [
+ 315.0859680175781,
+ 172244.328125,
+ 490065.59375,
+ 1510240.375,
+ 1952914.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.403881783015095e-05,
+ 2.7625405962794503e-08,
+ 1.651102543576144e-08,
+ 1.1742161909467086e-08,
+ 1.0927361238088906e-08
+ ],
+ "bp_grad_F": [
+ 0.024832597002387047,
+ 1.8080392010233481e-06,
+ 7.246239306368807e-07,
+ 4.936595132676302e-07,
+ 4.0145107504940825e-07
+ ],
+ "gamma_dfa": 0.006596001767320558,
+ "gamma_dfa_per_layer": [
+ 0.016851693391799927,
+ 0.001910479972139001,
+ 0.0058369822800159454,
+ 0.0017848514253273606
+ ],
+ "acc_eval": 0.2138671875,
+ "loss_eval": 2.1312928199768066,
+ "epoch": 7
+ },
+ {
+ "hidden_norms_cls": [
+ 14.368335723876953,
+ 243332.8125,
+ 525771.0,
+ 593291.75,
+ 875288.5
+ ],
+ "hidden_norms_avg": [
+ 351.16015625,
+ 247222.375,
+ 640658.75,
+ 1855662.75,
+ 2391194.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.87416060018586e-05,
+ 1.8018790015617014e-08,
+ 1.2651691250198382e-08,
+ 9.33115984480537e-09,
+ 8.563736386690834e-09
+ ],
+ "bp_grad_F": [
+ 0.017871394753456116,
+ 9.426115070709784e-07,
+ 4.7217255882969766e-07,
+ 3.564711050785263e-07,
+ 3.2240865266430774e-07
+ ],
+ "gamma_dfa": 0.006289168493822217,
+ "gamma_dfa_per_layer": [
+ 0.013373943977057934,
+ 0.0037157258484512568,
+ 0.00672483816742897,
+ 0.001342165982350707
+ ],
+ "acc_eval": 0.220703125,
+ "loss_eval": 2.0829837322235107,
+ "epoch": 8
+ },
+ {
+ "hidden_norms_cls": [
+ 16.041412353515625,
+ 385486.09375,
+ 776263.875,
+ 869037.0,
+ 1191002.25
+ ],
+ "hidden_norms_avg": [
+ 383.5213317871094,
+ 383708.40625,
+ 941498.0,
+ 2793651.25,
+ 3510556.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8917142117279582e-05,
+ 1.1363525231899985e-08,
+ 8.616331648170217e-09,
+ 5.602694308493028e-09,
+ 5.260086588521062e-09
+ ],
+ "bp_grad_F": [
+ 0.024791762232780457,
+ 6.833873840150773e-07,
+ 3.100701633229619e-07,
+ 2.26619619070334e-07,
+ 2.1342954426017968e-07
+ ],
+ "gamma_dfa": 0.00652129843365401,
+ "gamma_dfa_per_layer": [
+ 0.014406262896955013,
+ 0.004345592111349106,
+ 0.006529162637889385,
+ 0.0008041760884225368
+ ],
+ "acc_eval": 0.2197265625,
+ "loss_eval": 2.1437277793884277,
+ "epoch": 9
+ },
+ {
+ "hidden_norms_cls": [
+ 17.677919387817383,
+ 582942.5,
+ 1148260.75,
+ 1279834.25,
+ 1709270.625
+ ],
+ "hidden_norms_avg": [
+ 416.1814880371094,
+ 530246.375,
+ 1201761.5,
+ 2944394.0,
+ 3732565.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.369058686075732e-05,
+ 6.623859238885643e-09,
+ 4.513381224313662e-09,
+ 3.933114278709127e-09,
+ 3.794405678547719e-09
+ ],
+ "bp_grad_F": [
+ 0.01620429754257202,
+ 3.022730652446626e-07,
+ 1.9097409165169665e-07,
+ 1.773983058228623e-07,
+ 1.593236333974346e-07
+ ],
+ "gamma_dfa": 0.006082151841837913,
+ "gamma_dfa_per_layer": [
+ 0.01578153669834137,
+ 0.002655572956427932,
+ 0.005509376525878906,
+ 0.00038212118670344353
+ ],
+ "acc_eval": 0.197265625,
+ "loss_eval": 2.089698314666748,
+ "epoch": 10
+ },
+ {
+ "hidden_norms_cls": [
+ 19.31073760986328,
+ 843820.0625,
+ 1587423.25,
+ 1759006.0,
+ 2222149.5
+ ],
+ "hidden_norms_avg": [
+ 448.93133544921875,
+ 796172.1875,
+ 1678321.375,
+ 3888912.0,
+ 4810418.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 4.445635568117723e-05,
+ 3.5140981236025937e-09,
+ 2.8926525619255017e-09,
+ 2.65975419466713e-09,
+ 2.6499111793754082e-09
+ ],
+ "bp_grad_F": [
+ 0.020245229825377464,
+ 2.6993967594535206e-07,
+ 1.701987457636278e-07,
+ 1.3198047099649557e-07,
+ 1.2469256205349666e-07
+ ],
+ "gamma_dfa": 0.005559869911849091,
+ "gamma_dfa_per_layer": [
+ 0.015185668133199215,
+ 0.0025689376052469015,
+ 0.004468783736228943,
+ 1.6090172721305862e-05
+ ],
+ "acc_eval": 0.2314453125,
+ "loss_eval": 2.0838193893432617,
+ "epoch": 11
+ },
+ {
+ "hidden_norms_cls": [
+ 20.861183166503906,
+ 1157778.75,
+ 2054207.5,
+ 2289084.5,
+ 2841995.0
+ ],
+ "hidden_norms_avg": [
+ 479.8387145996094,
+ 981138.875,
+ 2112497.25,
+ 4439588.0,
+ 5517614.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.176981772412546e-05,
+ 3.1782512177613853e-09,
+ 2.5456772245746606e-09,
+ 2.4393245201537184e-09,
+ 2.414718425214346e-09
+ ],
+ "bp_grad_F": [
+ 0.09368129819631577,
+ 9.166008680949744e-07,
+ 2.675243706562469e-07,
+ 1.0984689424731187e-07,
+ 1.0444787079677553e-07
+ ],
+ "gamma_dfa": 0.004390636342577636,
+ "gamma_dfa_per_layer": [
+ 0.011994147673249245,
+ 0.001997251994907856,
+ 0.003865728620439768,
+ -0.00029458291828632355
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 2.0896079540252686,
+ "epoch": 12
+ },
+ {
+ "hidden_norms_cls": [
+ 22.362810134887695,
+ 1504072.375,
+ 2527410.75,
+ 2870361.25,
+ 3557771.0
+ ],
+ "hidden_norms_avg": [
+ 510.81561279296875,
+ 1188843.375,
+ 2574796.25,
+ 5296089.0,
+ 6640932.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8154454412288032e-05,
+ 3.057065711686846e-09,
+ 2.121731013104977e-09,
+ 2.0999049166192663e-09,
+ 2.0892536589656174e-09
+ ],
+ "bp_grad_F": [
+ 0.011068353429436684,
+ 1.3467251847032458e-06,
+ 1.0581060649883511e-07,
+ 9.427417069218791e-08,
+ 9.197237460512042e-08
+ ],
+ "gamma_dfa": 0.003989392673247494,
+ "gamma_dfa_per_layer": [
+ 0.011822337284684181,
+ 0.001384879695251584,
+ 0.00329465395770967,
+ -0.0005443002446554601
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.077056407928467,
+ "epoch": 13
+ },
+ {
+ "hidden_norms_cls": [
+ 23.812599182128906,
+ 1930070.0,
+ 2995981.75,
+ 3469627.0,
+ 4303896.0
+ ],
+ "hidden_norms_avg": [
+ 539.9255981445312,
+ 1589889.5,
+ 3066154.25,
+ 6015238.0,
+ 7540605.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.170168929500505e-05,
+ 2.518652619798445e-09,
+ 1.924201020742089e-09,
+ 1.8520206479522017e-09,
+ 1.8417810609960839e-09
+ ],
+ "bp_grad_F": [
+ 0.032089244574308395,
+ 1.0142422297576559e-06,
+ 1.6566445992793888e-07,
+ 8.33219857554468e-08,
+ 7.640721122470495e-08
+ ],
+ "gamma_dfa": 0.0029267592035466805,
+ "gamma_dfa_per_layer": [
+ 0.008105762302875519,
+ 0.001629034522920847,
+ 0.0022919299080967903,
+ -0.000319689919706434
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 2.0748229026794434,
+ "epoch": 14
+ },
+ {
+ "hidden_norms_cls": [
+ 25.248563766479492,
+ 2452306.5,
+ 3664022.75,
+ 4168536.0,
+ 5106242.5
+ ],
+ "hidden_norms_avg": [
+ 570.19384765625,
+ 1965615.5,
+ 3710471.5,
+ 7372995.0,
+ 9239893.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.4190969270421192e-05,
+ 1.8390389211475622e-09,
+ 1.5613663695290825e-09,
+ 1.5359991056840272e-09,
+ 1.5388512686342892e-09
+ ],
+ "bp_grad_F": [
+ 0.015056902542710304,
+ 6.693913292110665e-06,
+ 1.241161982079575e-07,
+ 7.622224984515924e-08,
+ 6.743793790064956e-08
+ ],
+ "gamma_dfa": 0.0022661721595795825,
+ "gamma_dfa_per_layer": [
+ 0.006208081729710102,
+ 0.001149914925917983,
+ 0.0020575951784849167,
+ -0.0003509031957946718
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 2.0835204124450684,
+ "epoch": 15
+ },
+ {
+ "hidden_norms_cls": [
+ 26.6426944732666,
+ 3107169.0,
+ 4381372.0,
+ 5027998.5,
+ 6065136.0
+ ],
+ "hidden_norms_avg": [
+ 596.7793579101562,
+ 2542559.0,
+ 4400625.5,
+ 8374831.5,
+ 10510773.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.787545781757217e-05,
+ 1.5701163702530607e-09,
+ 1.2841328000945396e-09,
+ 1.2669904014828148e-09,
+ 1.2700215323846464e-09
+ ],
+ "bp_grad_F": [
+ 0.006971500348299742,
+ 1.8619180991663598e-05,
+ 6.465826629664662e-08,
+ 5.84209978171657e-08,
+ 5.694714744208795e-08
+ ],
+ "gamma_dfa": 0.0030232197314035147,
+ "gamma_dfa_per_layer": [
+ 0.009539565071463585,
+ 0.0012945058988407254,
+ 0.0015697493217885494,
+ -0.0003109413664788008
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 2.058485507965088,
+ "epoch": 16
+ },
+ {
+ "hidden_norms_cls": [
+ 27.95879364013672,
+ 3613966.25,
+ 5044349.0,
+ 5874924.0,
+ 7080756.0
+ ],
+ "hidden_norms_avg": [
+ 623.2052612304688,
+ 2844551.5,
+ 4942977.0,
+ 8742455.0,
+ 11094594.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8442762413760647e-05,
+ 1.629689605486817e-09,
+ 1.115437520127216e-09,
+ 1.0797144289753646e-09,
+ 1.0779978021346892e-09
+ ],
+ "bp_grad_F": [
+ 0.0072508929297327995,
+ 1.4132167507341364e-06,
+ 6.271753250075562e-08,
+ 4.991998281411725e-08,
+ 4.950436149897541e-08
+ ],
+ "gamma_dfa": 0.001284227124415338,
+ "gamma_dfa_per_layer": [
+ 0.00256139412522316,
+ 0.0014944188296794891,
+ 0.0013982560485601425,
+ -0.0003171605058014393
+ ],
+ "acc_eval": 0.240234375,
+ "loss_eval": 2.0549392700195312,
+ "epoch": 17
+ },
+ {
+ "hidden_norms_cls": [
+ 29.22184181213379,
+ 4211867.5,
+ 5636704.5,
+ 6891397.5,
+ 8559809.0
+ ],
+ "hidden_norms_avg": [
+ 647.4288330078125,
+ 3423908.25,
+ 5695376.5,
+ 10367815.0,
+ 13188250.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8086895326850936e-05,
+ 1.1501447572115353e-09,
+ 8.738501033889179e-10,
+ 8.528160400089746e-10,
+ 8.584906674435899e-10
+ ],
+ "bp_grad_F": [
+ 0.012267161160707474,
+ 1.591232035025314e-06,
+ 4.697067268466526e-08,
+ 4.271150899626264e-08,
+ 4.017679700041299e-08
+ ],
+ "gamma_dfa": 0.0022953646985115483,
+ "gamma_dfa_per_layer": [
+ 0.007007642649114132,
+ 0.0012370320037007332,
+ 0.0011846421984955668,
+ -0.0002478580572642386
+ ],
+ "acc_eval": 0.228515625,
+ "loss_eval": 2.053128242492676,
+ "epoch": 18
+ },
+ {
+ "hidden_norms_cls": [
+ 30.412078857421875,
+ 4986411.0,
+ 6504586.0,
+ 7889628.0,
+ 9783147.0
+ ],
+ "hidden_norms_avg": [
+ 670.3391723632812,
+ 3921667.0,
+ 6270645.0,
+ 10589857.0,
+ 13580617.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.768085505522322e-05,
+ 1.3132780418700918e-09,
+ 7.742924079678914e-10,
+ 7.418777814294231e-10,
+ 7.448673344789825e-10
+ ],
+ "bp_grad_F": [
+ 0.007575999945402145,
+ 1.7771724287740653e-06,
+ 5.529824420591467e-08,
+ 3.790939828718365e-08,
+ 3.6307092443621514e-08
+ ],
+ "gamma_dfa": 0.0009071348831639625,
+ "gamma_dfa_per_layer": [
+ 0.001273356145247817,
+ 0.001484773471020162,
+ 0.0010661636479198933,
+ -0.00019575373153202236
+ ],
+ "acc_eval": 0.25390625,
+ "loss_eval": 2.0479414463043213,
+ "epoch": 19
+ },
+ {
+ "hidden_norms_cls": [
+ 31.54771614074707,
+ 5502896.5,
+ 7070197.5,
+ 8994800.0,
+ 11604998.0
+ ],
+ "hidden_norms_avg": [
+ 692.4578247070312,
+ 4249610.0,
+ 6837255.0,
+ 11617683.0,
+ 15223152.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0367684303200804e-05,
+ 1.325711207478264e-09,
+ 6.525959217462685e-10,
+ 6.324714640904006e-10,
+ 6.32227936669949e-10
+ ],
+ "bp_grad_F": [
+ 0.0062190573662519455,
+ 1.129235442931531e-06,
+ 3.317861896334762e-08,
+ 3.131979653403505e-08,
+ 3.109861168582029e-08
+ ],
+ "gamma_dfa": 0.0011510169642861001,
+ "gamma_dfa_per_layer": [
+ 0.002568549243733287,
+ 0.0013005147920921445,
+ 0.0009535959688946605,
+ -0.00021859214757569134
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.0359444618225098,
+ "epoch": 20
+ },
+ {
+ "hidden_norms_cls": [
+ 32.638641357421875,
+ 6320697.0,
+ 7897073.5,
+ 10165307.0,
+ 13313912.0
+ ],
+ "hidden_norms_avg": [
+ 713.3525390625,
+ 4812640.5,
+ 7533297.5,
+ 12847435.0,
+ 16993420.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.871564695145935e-05,
+ 1.2221273992807369e-09,
+ 6.080098646776833e-10,
+ 5.917044632042234e-10,
+ 5.89539916884263e-10
+ ],
+ "bp_grad_F": [
+ 0.011915000155568123,
+ 6.25122083874885e-06,
+ 3.6603957198622084e-08,
+ 2.876341298474472e-08,
+ 2.8581927935533713e-08
+ ],
+ "gamma_dfa": 0.0002986440376844257,
+ "gamma_dfa_per_layer": [
+ -0.0004627959569916129,
+ 0.0009951044339686632,
+ 0.0008257199660874903,
+ -0.00016345229232683778
+ ],
+ "acc_eval": 0.2626953125,
+ "loss_eval": 2.059875965118408,
+ "epoch": 21
+ },
+ {
+ "hidden_norms_cls": [
+ 33.6330451965332,
+ 7264995.5,
+ 8758988.0,
+ 11785280.0,
+ 15874132.0
+ ],
+ "hidden_norms_avg": [
+ 732.8869018554688,
+ 5982206.0,
+ 8454064.0,
+ 14846262.0,
+ 19834080.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.5420635211048648e-05,
+ 7.56205986718328e-10,
+ 5.169706884800007e-10,
+ 5.026724592127607e-10,
+ 5.024383686880185e-10
+ ],
+ "bp_grad_F": [
+ 0.014803220517933369,
+ 4.478873961488716e-06,
+ 4.4555019229619575e-08,
+ 2.4910459472948787e-08,
+ 2.4745437698925343e-08
+ ],
+ "gamma_dfa": 0.001046390665578656,
+ "gamma_dfa_per_layer": [
+ 0.0027164756320416927,
+ 0.0009058329742401838,
+ 0.0007253356743603945,
+ -0.00016208161832764745
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.0538365840911865,
+ "epoch": 22
+ },
+ {
+ "hidden_norms_cls": [
+ 34.621524810791016,
+ 8089090.5,
+ 9671455.0,
+ 13086530.0,
+ 17616980.0
+ ],
+ "hidden_norms_avg": [
+ 751.2442016601562,
+ 6699752.5,
+ 9159771.0,
+ 15622865.0,
+ 21214146.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.7939373467233963e-05,
+ 7.656756340068682e-10,
+ 5.061054908495066e-10,
+ 4.837483191799663e-10,
+ 4.820439047925618e-10
+ ],
+ "bp_grad_F": [
+ 0.008210284635424614,
+ 3.91981393477181e-06,
+ 2.727725245676993e-08,
+ 2.349457695061119e-08,
+ 2.2768137597495297e-08
+ ],
+ "gamma_dfa": 0.0013028495595790446,
+ "gamma_dfa_per_layer": [
+ 0.0034610098227858543,
+ 0.0012297509238123894,
+ 0.0006837932160124183,
+ -0.00016315572429448366
+ ],
+ "acc_eval": 0.2646484375,
+ "loss_eval": 2.0430214405059814,
+ "epoch": 23
+ },
+ {
+ "hidden_norms_cls": [
+ 35.54478454589844,
+ 9145767.0,
+ 10558942.0,
+ 14636200.0,
+ 19721632.0
+ ],
+ "hidden_norms_avg": [
+ 768.5211791992188,
+ 7473006.0,
+ 10093548.0,
+ 17775052.0,
+ 24159262.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.364618532941677e-05,
+ 8.066202705769854e-10,
+ 4.5619852340195166e-10,
+ 4.4121445386124947e-10,
+ 4.323804370098827e-10
+ ],
+ "bp_grad_F": [
+ 0.09167197346687317,
+ 4.855019597016508e-06,
+ 2.689265521382822e-08,
+ 2.1627007740221416e-08,
+ 2.0867716443717654e-08
+ ],
+ "gamma_dfa": 0.0001647558601689525,
+ "gamma_dfa_per_layer": [
+ -0.0005364040262065828,
+ 0.0007433416321873665,
+ 0.0005910456529818475,
+ -0.00013895981828682125
+ ],
+ "acc_eval": 0.23046875,
+ "loss_eval": 2.0427517890930176,
+ "epoch": 24
+ },
+ {
+ "hidden_norms_cls": [
+ 36.43881607055664,
+ 10216266.0,
+ 11478190.0,
+ 16476424.0,
+ 22393992.0
+ ],
+ "hidden_norms_avg": [
+ 785.1990966796875,
+ 8300483.0,
+ 10872433.0,
+ 18667924.0,
+ 25447926.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0938736017560586e-05,
+ 7.561202219896757e-10,
+ 4.2832748459176173e-10,
+ 4.0923736621678586e-10,
+ 4.0218126051705383e-10
+ ],
+ "bp_grad_F": [
+ 0.013463743962347507,
+ 1.9222785340389237e-05,
+ 2.2825457079989064e-08,
+ 1.9977358434175585e-08,
+ 1.9259800865256693e-08
+ ],
+ "gamma_dfa": 0.0005702937960450072,
+ "gamma_dfa_per_layer": [
+ 0.0011116554960608482,
+ 0.0007594762137159705,
+ 0.0005430461023934186,
+ -0.00013300262799020857
+ ],
+ "acc_eval": 0.2568359375,
+ "loss_eval": 2.0594615936279297,
+ "epoch": 25
+ },
+ {
+ "hidden_norms_cls": [
+ 37.30263137817383,
+ 11623684.0,
+ 12776919.0,
+ 18306868.0,
+ 24740858.0
+ ],
+ "hidden_norms_avg": [
+ 800.9972534179688,
+ 9603253.0,
+ 12104963.0,
+ 20835068.0,
+ 28405318.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.261065648985095e-05,
+ 6.65525801135658e-10,
+ 3.838940831890625e-10,
+ 3.742672838313865e-10,
+ 3.7395189722566613e-10
+ ],
+ "bp_grad_F": [
+ 0.007853930816054344,
+ 1.2899076864414383e-06,
+ 1.9278010299217385e-08,
+ 1.8154999281705386e-08,
+ 1.7368931182204506e-08
+ ],
+ "gamma_dfa": 0.00021361159815569408,
+ "gamma_dfa_per_layer": [
+ -0.00034064118517562747,
+ 0.0008438127697445452,
+ 0.0004718025156762451,
+ -0.00012052770762238652
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.0433781147003174,
+ "epoch": 26
+ },
+ {
+ "hidden_norms_cls": [
+ 38.06776428222656,
+ 12599130.0,
+ 13703165.0,
+ 19834172.0,
+ 26867468.0
+ ],
+ "hidden_norms_avg": [
+ 816.2463989257812,
+ 10421772.0,
+ 12873138.0,
+ 21321398.0,
+ 29452538.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.774638414848596e-05,
+ 6.227232618449818e-10,
+ 3.566741624272396e-10,
+ 3.4781866276034634e-10,
+ 3.45437983773067e-10
+ ],
+ "bp_grad_F": [
+ 0.013920681551098824,
+ 3.4208371744171018e-06,
+ 2.1883508338760294e-08,
+ 1.7128741092165e-08,
+ 1.6603545205384762e-08
+ ],
+ "gamma_dfa": 0.0008690126524015795,
+ "gamma_dfa_per_layer": [
+ 0.0021882583387196064,
+ 0.0009064457844942808,
+ 0.0004841286572627723,
+ -0.00010278217087034136
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.0433974266052246,
+ "epoch": 27
+ },
+ {
+ "hidden_norms_cls": [
+ 38.7847785949707,
+ 14429584.0,
+ 15438086.0,
+ 21566880.0,
+ 29267340.0
+ ],
+ "hidden_norms_avg": [
+ 830.9344482421875,
+ 11436777.0,
+ 13832175.0,
+ 22913616.0,
+ 32026754.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8682481570285745e-05,
+ 5.758302168423768e-10,
+ 3.3607527871737375e-10,
+ 3.304233830991876e-10,
+ 3.2846284026000205e-10
+ ],
+ "bp_grad_F": [
+ 0.012251574546098709,
+ 2.996052717207931e-05,
+ 2.7452134787608884e-08,
+ 1.577506480998636e-08,
+ 1.5141546683139495e-08
+ ],
+ "gamma_dfa": 0.0004505918041104451,
+ "gamma_dfa_per_layer": [
+ 0.00026967719895765185,
+ 0.001212525530718267,
+ 0.0004131481982767582,
+ -9.298371151089668e-05
+ ],
+ "acc_eval": 0.2607421875,
+ "loss_eval": 2.039923667907715,
+ "epoch": 28
+ },
+ {
+ "hidden_norms_cls": [
+ 39.49647521972656,
+ 15523604.0,
+ 16504434.0,
+ 23236370.0,
+ 31306890.0
+ ],
+ "hidden_norms_avg": [
+ 844.8562622070312,
+ 12856661.0,
+ 15124535.0,
+ 23633704.0,
+ 32995118.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.6219468054478057e-05,
+ 5.519696366640403e-10,
+ 3.2825916984613457e-10,
+ 3.235848811122821e-10,
+ 3.2190172749579915e-10
+ ],
+ "bp_grad_F": [
+ 0.012884745374321938,
+ 1.8329246813664213e-05,
+ 1.8323355277516384e-08,
+ 1.5584015855552025e-08,
+ 1.4755748622974352e-08
+ ],
+ "gamma_dfa": 0.0006857650478195865,
+ "gamma_dfa_per_layer": [
+ 0.0016966589028015733,
+ 0.0007126724813133478,
+ 0.0003994358121417463,
+ -6.570700497832149e-05
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 2.0533735752105713,
+ "epoch": 29
+ },
+ {
+ "hidden_norms_cls": [
+ 40.16881561279297,
+ 16141660.0,
+ 17137856.0,
+ 24286464.0,
+ 32903152.0
+ ],
+ "hidden_norms_avg": [
+ 857.8116455078125,
+ 12895693.0,
+ 15492559.0,
+ 23745768.0,
+ 33843860.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.2289473892888054e-05,
+ 6.340856728570543e-10,
+ 3.264067627295475e-10,
+ 3.149370209065694e-10,
+ 3.097411216401724e-10
+ ],
+ "bp_grad_F": [
+ 0.006337009835988283,
+ 1.7065680367522873e-05,
+ 5.785592804841144e-08,
+ 1.519365788738014e-08,
+ 1.464850551968766e-08
+ ],
+ "gamma_dfa": 0.0005419648223323748,
+ "gamma_dfa_per_layer": [
+ 0.00038546844734810293,
+ 0.0014093497302383184,
+ 0.0004054713645018637,
+ -3.243025275878608e-05
+ ],
+ "acc_eval": 0.265625,
+ "loss_eval": 2.0390102863311768,
+ "epoch": 30
+ },
+ {
+ "hidden_norms_cls": [
+ 40.790164947509766,
+ 18768648.0,
+ 19610716.0,
+ 26926266.0,
+ 36060360.0
+ ],
+ "hidden_norms_avg": [
+ 869.6182861328125,
+ 15248417.0,
+ 17480158.0,
+ 26928640.0,
+ 37555876.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.939497062470764e-05,
+ 5.127394064885493e-10,
+ 3.1137872835707014e-10,
+ 3.074558663218596e-10,
+ 3.04990144250894e-10
+ ],
+ "bp_grad_F": [
+ 0.03832927718758583,
+ 8.881174835551064e-06,
+ 2.5206949416656244e-08,
+ 1.4185034480362901e-08,
+ 1.3504863893842867e-08
+ ],
+ "gamma_dfa": 0.0005767397606177838,
+ "gamma_dfa_per_layer": [
+ 0.00058704090770334,
+ 0.0013887862442061305,
+ 0.0003486467176117003,
+ -1.751482705003582e-05
+ ],
+ "acc_eval": 0.232421875,
+ "loss_eval": 2.055915117263794,
+ "epoch": 31
+ },
+ {
+ "hidden_norms_cls": [
+ 41.36415481567383,
+ 20590018.0,
+ 21418164.0,
+ 28674892.0,
+ 38102536.0
+ ],
+ "hidden_norms_avg": [
+ 880.8012084960938,
+ 15857472.0,
+ 18200580.0,
+ 27607590.0,
+ 38905496.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.6930878448183648e-05,
+ 5.041319584009329e-10,
+ 3.0716035270828e-10,
+ 2.9963459491355593e-10,
+ 2.9755845010193127e-10
+ ],
+ "bp_grad_F": [
+ 0.01052916795015335,
+ 1.7662874597590417e-05,
+ 1.8223250464188823e-08,
+ 1.4229329714510186e-08,
+ 1.2928855319671584e-08
+ ],
+ "gamma_dfa": 0.0005623552362976625,
+ "gamma_dfa_per_layer": [
+ 0.0005056762602180243,
+ 0.00140343327075243,
+ 0.0003372218052390963,
+ 3.0896089810994454e-06
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 2.054579734802246,
+ "epoch": 32
+ },
+ {
+ "hidden_norms_cls": [
+ 41.9267578125,
+ 21995458.0,
+ 22701258.0,
+ 30227660.0,
+ 40381468.0
+ ],
+ "hidden_norms_avg": [
+ 891.6727294921875,
+ 17925388.0,
+ 19924592.0,
+ 29375846.0,
+ 41265952.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.4433691325830296e-05,
+ 4.786913088139499e-10,
+ 3.083476807219654e-10,
+ 3.030005690796145e-10,
+ 3.0202479406327143e-10
+ ],
+ "bp_grad_F": [
+ 0.006410651374608278,
+ 9.426087672181893e-06,
+ 1.748733602369157e-08,
+ 1.330249954634155e-08,
+ 1.2548162509062877e-08
+ ],
+ "gamma_dfa": 0.0005204869294175296,
+ "gamma_dfa_per_layer": [
+ 0.0004088875139132142,
+ 0.001322226831689477,
+ 0.00032363145146518946,
+ 2.7201920602237806e-05
+ ],
+ "acc_eval": 0.2568359375,
+ "loss_eval": 2.0504493713378906,
+ "epoch": 33
+ },
+ {
+ "hidden_norms_cls": [
+ 42.43289566040039,
+ 23788478.0,
+ 24547006.0,
+ 32122702.0,
+ 42524392.0
+ ],
+ "hidden_norms_avg": [
+ 902.5420532226562,
+ 19126440.0,
+ 21210522.0,
+ 30872922.0,
+ 43207040.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8793765523005277e-05,
+ 4.69506655775831e-10,
+ 2.9882180063722785e-10,
+ 2.9027436010409247e-10,
+ 2.88086998700976e-10
+ ],
+ "bp_grad_F": [
+ 0.02046363614499569,
+ 1.535968840471469e-05,
+ 1.9181511490273806e-08,
+ 1.3211375105015577e-08,
+ 1.2052867148781843e-08
+ ],
+ "gamma_dfa": 0.0005800028211524477,
+ "gamma_dfa_per_layer": [
+ 0.0005789051647298038,
+ 0.001365642063319683,
+ 0.0003222030645702034,
+ 5.326099199010059e-05
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 2.056929349899292,
+ "epoch": 34
+ },
+ {
+ "hidden_norms_cls": [
+ 42.88957595825195,
+ 24876160.0,
+ 25665632.0,
+ 33698024.0,
+ 44433192.0
+ ],
+ "hidden_norms_avg": [
+ 912.5694580078125,
+ 20388924.0,
+ 22492538.0,
+ 32293406.0,
+ 44758584.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.043079595954623e-05,
+ 4.6556239419182077e-10,
+ 3.0177585430557485e-10,
+ 2.9259758504984745e-10,
+ 2.8850585809259144e-10
+ ],
+ "bp_grad_F": [
+ 0.018651673570275307,
+ 8.0938043538481e-06,
+ 2.600621051840335e-08,
+ 1.3419185762586494e-08,
+ 1.200509913701353e-08
+ ],
+ "gamma_dfa": 0.0008372370848519495,
+ "gamma_dfa_per_layer": [
+ 0.001413366524502635,
+ 0.0015261531807482243,
+ 0.0003260627272538841,
+ 8.336590690305457e-05
+ ],
+ "acc_eval": 0.2353515625,
+ "loss_eval": 2.060340404510498,
+ "epoch": 35
+ },
+ {
+ "hidden_norms_cls": [
+ 43.32978057861328,
+ 25917158.0,
+ 26720118.0,
+ 34948196.0,
+ 46313048.0
+ ],
+ "hidden_norms_avg": [
+ 921.58642578125,
+ 21474648.0,
+ 23549474.0,
+ 33572188.0,
+ 46615396.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.262757672928274e-05,
+ 4.5062673037499223e-10,
+ 2.984587021970242e-10,
+ 2.923088993078693e-10,
+ 2.888300987269332e-10
+ ],
+ "bp_grad_F": [
+ 0.01846941001713276,
+ 2.4291131921927445e-05,
+ 2.994345393858566e-08,
+ 1.4564162320596097e-08,
+ 1.1765412644137996e-08
+ ],
+ "gamma_dfa": 0.0007057133989292197,
+ "gamma_dfa_per_layer": [
+ 0.0011925556464120746,
+ 0.0012432597577571869,
+ 0.0002897845406550914,
+ 9.725365089252591e-05
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 2.0591180324554443,
+ "epoch": 36
+ },
+ {
+ "hidden_norms_cls": [
+ 43.74128341674805,
+ 27200966.0,
+ 27911578.0,
+ 36161972.0,
+ 47854788.0
+ ],
+ "hidden_norms_avg": [
+ 930.2008666992188,
+ 22529414.0,
+ 24601434.0,
+ 34829948.0,
+ 48238220.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.328157981741242e-05,
+ 4.659617691693541e-10,
+ 2.8960928100119077e-10,
+ 2.8687860420539835e-10,
+ 2.800103759970085e-10
+ ],
+ "bp_grad_F": [
+ 0.004556785803288221,
+ 9.644008059694897e-06,
+ 1.5685751364458156e-08,
+ 1.2929571191477862e-08,
+ 1.1707988356590704e-08
+ ],
+ "gamma_dfa": 0.0005315981106832623,
+ "gamma_dfa_per_layer": [
+ 0.0004304055473767221,
+ 0.0012520912569016218,
+ 0.0003118191962130368,
+ 0.0001320764422416687
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.049736738204956,
+ "epoch": 37
+ },
+ {
+ "hidden_norms_cls": [
+ 44.10750198364258,
+ 28860724.0,
+ 29566448.0,
+ 37605440.0,
+ 49767188.0
+ ],
+ "hidden_norms_avg": [
+ 938.7098999023438,
+ 24297102.0,
+ 26192510.0,
+ 36561148.0,
+ 49957968.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.900460640375968e-05,
+ 4.445998014190877e-10,
+ 2.888302930159625e-10,
+ 2.855987946137617e-10,
+ 2.818917876901139e-10
+ ],
+ "bp_grad_F": [
+ 0.013354518450796604,
+ 6.135221156000625e-06,
+ 1.780158420672251e-08,
+ 1.3947193622243503e-08,
+ 1.161484952660885e-08
+ ],
+ "gamma_dfa": 0.0005519518890650943,
+ "gamma_dfa_per_layer": [
+ 0.0005505518638528883,
+ 0.001156628131866455,
+ 0.00033354441984556615,
+ 0.0001670831406954676
+ ],
+ "acc_eval": 0.2412109375,
+ "loss_eval": 2.0527162551879883,
+ "epoch": 38
+ },
+ {
+ "hidden_norms_cls": [
+ 44.42500305175781,
+ 30085758.0,
+ 30793664.0,
+ 39317268.0,
+ 51773680.0
+ ],
+ "hidden_norms_avg": [
+ 946.3699340820312,
+ 24723960.0,
+ 26763662.0,
+ 37607688.0,
+ 51575988.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.9910466764704324e-05,
+ 4.753269444712771e-10,
+ 2.936461906966059e-10,
+ 2.873846438600225e-10,
+ 2.8520716344182517e-10
+ ],
+ "bp_grad_F": [
+ 0.00976789090782404,
+ 1.76885150722228e-05,
+ 1.7970489096796882e-08,
+ 1.3952313970833075e-08,
+ 1.130456972475713e-08
+ ],
+ "gamma_dfa": 0.0009108289959840477,
+ "gamma_dfa_per_layer": [
+ 0.0019160081865265965,
+ 0.0012680008076131344,
+ 0.00030145354685373604,
+ 0.00015785344294272363
+ ],
+ "acc_eval": 0.2412109375,
+ "loss_eval": 2.0550765991210938,
+ "epoch": 39
+ },
+ {
+ "hidden_norms_cls": [
+ 44.73127746582031,
+ 30730856.0,
+ 31431762.0,
+ 40187116.0,
+ 53148352.0
+ ],
+ "hidden_norms_avg": [
+ 953.6856079101562,
+ 24778752.0,
+ 27014248.0,
+ 38275640.0,
+ 52795456.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8919872420374304e-05,
+ 4.755910110176842e-10,
+ 2.84101492331601e-10,
+ 2.7933383384137755e-10,
+ 2.7627339305169585e-10
+ ],
+ "bp_grad_F": [
+ 0.009574169293045998,
+ 4.757252463605255e-05,
+ 1.5709005651842745e-08,
+ 1.3778580054690792e-08,
+ 1.1154800638735196e-08
+ ],
+ "gamma_dfa": 0.0003838329284917563,
+ "gamma_dfa_per_layer": [
+ -0.0004134870832785964,
+ 0.001480170525610447,
+ 0.0002943193248938769,
+ 0.00017432894674129784
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.0383803844451904,
+ "epoch": 40
+ },
+ {
+ "hidden_norms_cls": [
+ 44.999107360839844,
+ 32617970.0,
+ 33381886.0,
+ 41663220.0,
+ 54853168.0
+ ],
+ "hidden_norms_avg": [
+ 960.5386962890625,
+ 27910628.0,
+ 29647900.0,
+ 40418716.0,
+ 54716684.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.9992028430569917e-05,
+ 4.221052118946744e-10,
+ 2.9753777219809763e-10,
+ 2.8370578109004896e-10,
+ 2.813366484222257e-10
+ ],
+ "bp_grad_F": [
+ 0.015446176752448082,
+ 3.8060017686802894e-05,
+ 5.211516906911129e-08,
+ 1.3235438522940512e-08,
+ 1.116207481999254e-08
+ ],
+ "gamma_dfa": 0.0005705733274226077,
+ "gamma_dfa_per_layer": [
+ 0.0006168894469738007,
+ 0.0011725829681381583,
+ 0.00029753358103334904,
+ 0.00019528731354512274
+ ],
+ "acc_eval": 0.240234375,
+ "loss_eval": 2.0557656288146973,
+ "epoch": 41
+ },
+ {
+ "hidden_norms_cls": [
+ 45.25053024291992,
+ 33936992.0,
+ 34621240.0,
+ 42946580.0,
+ 56031144.0
+ ],
+ "hidden_norms_avg": [
+ 966.2922973632812,
+ 28239400.0,
+ 30055502.0,
+ 41338012.0,
+ 56048388.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0256345780799165e-05,
+ 4.424338395647709e-10,
+ 2.9891861208497517e-10,
+ 2.8403482343897224e-10,
+ 2.798661857816853e-10
+ ],
+ "bp_grad_F": [
+ 0.006179355084896088,
+ 8.527667887392454e-06,
+ 2.116273023489157e-08,
+ 1.2261468285146293e-08,
+ 1.1058569171495947e-08
+ ],
+ "gamma_dfa": 0.0009438929373573046,
+ "gamma_dfa_per_layer": [
+ 0.00216879416257143,
+ 0.0010916339233517647,
+ 0.0003159396001137793,
+ 0.00019920406339224428
+ ],
+ "acc_eval": 0.2470703125,
+ "loss_eval": 2.0517942905426025,
+ "epoch": 42
+ },
+ {
+ "hidden_norms_cls": [
+ 45.481727600097656,
+ 34746476.0,
+ 35397348.0,
+ 43639664.0,
+ 57119836.0
+ ],
+ "hidden_norms_avg": [
+ 971.5364379882812,
+ 28891962.0,
+ 30705540.0,
+ 42078288.0,
+ 57065612.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.9764614737359807e-05,
+ 4.5060349895820195e-10,
+ 3.0148228358228835e-10,
+ 2.912529661891483e-10,
+ 2.8715479993834947e-10
+ ],
+ "bp_grad_F": [
+ 0.02291245572268963,
+ 1.3926567589805927e-05,
+ 3.118159241921603e-08,
+ 2.1897225366274142e-08,
+ 1.1063916893760961e-08
+ ],
+ "gamma_dfa": 0.00046937728620832786,
+ "gamma_dfa_per_layer": [
+ -0.00010078266495838761,
+ 0.0014219002332538366,
+ 0.0003067174111492932,
+ 0.00024967416538856924
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 2.054462432861328,
+ "epoch": 43
+ },
+ {
+ "hidden_norms_cls": [
+ 45.68215560913086,
+ 35169816.0,
+ 35827116.0,
+ 44266788.0,
+ 58219984.0
+ ],
+ "hidden_norms_avg": [
+ 976.61279296875,
+ 29302304.0,
+ 31207594.0,
+ 42541932.0,
+ 57918596.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.18697166221682e-05,
+ 4.4465031656670817e-10,
+ 3.0559865749069104e-10,
+ 2.891223926937414e-10,
+ 2.8127278284273416e-10
+ ],
+ "bp_grad_F": [
+ 0.02285478264093399,
+ 5.0576767534948885e-05,
+ 2.966898726697309e-08,
+ 1.374073210769211e-08,
+ 1.1011787037773502e-08
+ ],
+ "gamma_dfa": 0.0006015256294631399,
+ "gamma_dfa_per_layer": [
+ 0.0005435256171040237,
+ 0.0013653798960149288,
+ 0.000284912355709821,
+ 0.0002122846490237862
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.0539493560791016,
+ "epoch": 44
+ },
+ {
+ "hidden_norms_cls": [
+ 45.86240005493164,
+ 36071220.0,
+ 36702996.0,
+ 45105948.0,
+ 59117940.0
+ ],
+ "hidden_norms_avg": [
+ 980.9766845703125,
+ 29250424.0,
+ 31315982.0,
+ 42895240.0,
+ 58632240.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0838917155051604e-05,
+ 4.517226037670241e-10,
+ 3.037594897836726e-10,
+ 2.95300450758873e-10,
+ 2.8246391337027887e-10
+ ],
+ "bp_grad_F": [
+ 0.009441024623811245,
+ 2.5670700779301114e-05,
+ 2.221704953342396e-08,
+ 1.750507294673298e-08,
+ 1.1021731971538884e-08
+ ],
+ "gamma_dfa": 0.00038505904376506805,
+ "gamma_dfa_per_layer": [
+ -0.0006303560803644359,
+ 0.0016098625492304564,
+ 0.00032150247716344893,
+ 0.00023922722903080285
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.0488905906677246,
+ "epoch": 45
+ },
+ {
+ "hidden_norms_cls": [
+ 46.00979995727539,
+ 36876176.0,
+ 37547776.0,
+ 45586304.0,
+ 59641656.0
+ ],
+ "hidden_norms_avg": [
+ 984.9158935546875,
+ 29720264.0,
+ 31840778.0,
+ 43341952.0,
+ 59202960.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8270042093936354e-05,
+ 4.981586254615422e-10,
+ 3.011032534416813e-10,
+ 2.830454204350019e-10,
+ 2.763113071679868e-10
+ ],
+ "bp_grad_F": [
+ 0.01947774738073349,
+ 4.3539188482100144e-05,
+ 2.1426325602647012e-08,
+ 1.4225844502391283e-08,
+ 1.0958768115187922e-08
+ ],
+ "gamma_dfa": 0.0003295415808679536,
+ "gamma_dfa_per_layer": [
+ -0.0008024196140468121,
+ 0.0015490652294829488,
+ 0.0003235205076634884,
+ 0.0002480002003721893
+ ],
+ "acc_eval": 0.2568359375,
+ "loss_eval": 2.0367085933685303,
+ "epoch": 46
+ },
+ {
+ "hidden_norms_cls": [
+ 46.14581298828125,
+ 37542628.0,
+ 38211032.0,
+ 46396536.0,
+ 60543468.0
+ ],
+ "hidden_norms_avg": [
+ 988.5308837890625,
+ 31589698.0,
+ 33421126.0,
+ 44806960.0,
+ 60355708.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.7766556740971282e-05,
+ 4.28473617697378e-10,
+ 3.07322972625812e-10,
+ 2.9381372335102185e-10,
+ 2.797302944834712e-10
+ ],
+ "bp_grad_F": [
+ 0.06864868849515915,
+ 3.788271715166047e-05,
+ 2.1370066605186366e-08,
+ 1.4025233419090455e-08,
+ 1.1044066994259083e-08
+ ],
+ "gamma_dfa": 9.462468733545393e-05,
+ "gamma_dfa_per_layer": [
+ -0.0015880623832345009,
+ 0.0014036648208275437,
+ 0.0003099621389992535,
+ 0.00025293417274951935
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.0631895065307617,
+ "epoch": 47
+ },
+ {
+ "hidden_norms_cls": [
+ 46.26278305053711,
+ 38372568.0,
+ 39046204.0,
+ 47148944.0,
+ 61308416.0
+ ],
+ "hidden_norms_avg": [
+ 991.4658813476562,
+ 31279712.0,
+ 33238512.0,
+ 44902484.0,
+ 60826544.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.812536695273593e-05,
+ 4.3919237691092405e-10,
+ 3.053821084897379e-10,
+ 2.9203767182295337e-10,
+ 2.833127066281804e-10
+ ],
+ "bp_grad_F": [
+ 0.011117708869278431,
+ 2.0018645955133252e-05,
+ 1.9244726701117543e-08,
+ 1.4165241424279884e-08,
+ 1.090406964721069e-08
+ ],
+ "gamma_dfa": 0.00016991631855489686,
+ "gamma_dfa_per_layer": [
+ -0.0015358870150521398,
+ 0.0016542371595278382,
+ 0.0003059905138798058,
+ 0.00025532461586408317
+ ],
+ "acc_eval": 0.2548828125,
+ "loss_eval": 2.0491740703582764,
+ "epoch": 48
+ },
+ {
+ "hidden_norms_cls": [
+ 46.36857223510742,
+ 38788812.0,
+ 39461172.0,
+ 47582644.0,
+ 61831224.0
+ ],
+ "hidden_norms_avg": [
+ 994.04541015625,
+ 32215950.0,
+ 34096260.0,
+ 45599356.0,
+ 61425516.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0041363061172888e-05,
+ 4.480187609789965e-10,
+ 3.0562316566395964e-10,
+ 2.9085803210371353e-10,
+ 2.820148004012424e-10
+ ],
+ "bp_grad_F": [
+ 0.03149434179067612,
+ 6.209969433257356e-05,
+ 2.1469357847081483e-08,
+ 1.3228349970972886e-08,
+ 1.092844392758252e-08
+ ],
+ "gamma_dfa": 0.00010758559074020013,
+ "gamma_dfa_per_layer": [
+ -0.0014505982398986816,
+ 0.001327117788605392,
+ 0.0002981229918077588,
+ 0.0002556998224463314
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.0554656982421875,
+ "epoch": 49
+ },
+ {
+ "hidden_norms_cls": [
+ 46.4505729675293,
+ 38845108.0,
+ 39504860.0,
+ 47660992.0,
+ 62097052.0
+ ],
+ "hidden_norms_avg": [
+ 996.2877807617188,
+ 32178676.0,
+ 34106748.0,
+ 45494312.0,
+ 61553340.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0276962206698954e-05,
+ 4.5564105266571175e-10,
+ 3.0059965627771135e-10,
+ 2.8785077099691136e-10,
+ 2.794499076586021e-10
+ ],
+ "bp_grad_F": [
+ 0.011724308133125305,
+ 1.9755616449401714e-05,
+ 2.1592299503936374e-08,
+ 1.3796129572085647e-08,
+ 1.0886693324607677e-08
+ ],
+ "gamma_dfa": 0.0002330350544070825,
+ "gamma_dfa_per_layer": [
+ -0.0009828422917053103,
+ 0.0013922813814133406,
+ 0.00027237151516601443,
+ 0.00025032961275428534
+ ],
+ "acc_eval": 0.2578125,
+ "loss_eval": 2.0504729747772217,
+ "epoch": 50
+ },
+ {
+ "hidden_norms_cls": [
+ 46.521934509277344,
+ 39260604.0,
+ 39906660.0,
+ 48073644.0,
+ 62524844.0
+ ],
+ "hidden_norms_avg": [
+ 998.1359252929688,
+ 32138106.0,
+ 34129788.0,
+ 45757544.0,
+ 61958428.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.9659293431905098e-05,
+ 4.597033309572396e-10,
+ 3.0463259692581346e-10,
+ 2.893623118893629e-10,
+ 2.780784769118583e-10
+ ],
+ "bp_grad_F": [
+ 0.009033501148223877,
+ 1.7998809198616073e-05,
+ 2.5067617315244206e-08,
+ 1.8738653295713448e-08,
+ 1.087139978039886e-08
+ ],
+ "gamma_dfa": 0.00016801172751002014,
+ "gamma_dfa_per_layer": [
+ -0.0013465819647535682,
+ 0.0014174225507304072,
+ 0.00031502131605520844,
+ 0.00028618500800803304
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.0473151206970215,
+ "epoch": 51
+ },
+ {
+ "hidden_norms_cls": [
+ 46.57882308959961,
+ 39427768.0,
+ 40090548.0,
+ 48369740.0,
+ 62859588.0
+ ],
+ "hidden_norms_avg": [
+ 999.5881958007812,
+ 32546802.0,
+ 34502940.0,
+ 46179212.0,
+ 62426560.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0221139240893535e-05,
+ 4.495410987903625e-10,
+ 3.065779852207129e-10,
+ 2.9148336522233365e-10,
+ 2.8107866034687845e-10
+ ],
+ "bp_grad_F": [
+ 0.016372976824641228,
+ 2.868929186661262e-05,
+ 2.4158071099122935e-08,
+ 2.1377838166358742e-08,
+ 1.0851396226030374e-08
+ ],
+ "gamma_dfa": 0.00012949823576491326,
+ "gamma_dfa_per_layer": [
+ -0.0014246907085180283,
+ 0.0013606694992631674,
+ 0.0003105594660155475,
+ 0.0002714546862989664
+ ],
+ "acc_eval": 0.2568359375,
+ "loss_eval": 2.0468568801879883,
+ "epoch": 52
+ },
+ {
+ "hidden_norms_cls": [
+ 46.621891021728516,
+ 39709320.0,
+ 40367452.0,
+ 48619224.0,
+ 63258040.0
+ ],
+ "hidden_norms_avg": [
+ 1000.7721557617188,
+ 33325650.0,
+ 35170832.0,
+ 47006208.0,
+ 63117408.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.0193185011739843e-05,
+ 4.388156504830931e-10,
+ 3.137757831339627e-10,
+ 2.8996427481331466e-10,
+ 2.7836044580453745e-10
+ ],
+ "bp_grad_F": [
+ 0.020163528621196747,
+ 3.054905027966015e-05,
+ 2.3064796295102497e-08,
+ 1.4526934322134366e-08,
+ 1.0852998499899513e-08
+ ],
+ "gamma_dfa": 0.00017183857562486082,
+ "gamma_dfa_per_layer": [
+ -0.0013185564894229174,
+ 0.0014156483812257648,
+ 0.00031098624458536506,
+ 0.00027927616611123085
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.054586410522461,
+ "epoch": 53
+ },
+ {
+ "hidden_norms_cls": [
+ 46.65864562988281,
+ 39798476.0,
+ 40463920.0,
+ 48764504.0,
+ 63346472.0
+ ],
+ "hidden_norms_avg": [
+ 1001.6641845703125,
+ 33379128.0,
+ 35239452.0,
+ 46955488.0,
+ 63122060.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.965362000395544e-05,
+ 4.4001230437018535e-10,
+ 3.0546970508638083e-10,
+ 2.8820767994375274e-10,
+ 2.777780505613947e-10
+ ],
+ "bp_grad_F": [
+ 0.048469845205545425,
+ 4.790218736161478e-05,
+ 2.6222814142329298e-08,
+ 2.4079582772174035e-08,
+ 1.0861339383438917e-08
+ ],
+ "gamma_dfa": -6.432890222640708e-05,
+ "gamma_dfa_per_layer": [
+ -0.002126228529959917,
+ 0.0012497524730861187,
+ 0.00034036440774798393,
+ 0.0002787960402201861
+ ],
+ "acc_eval": 0.2509765625,
+ "loss_eval": 2.0531256198883057,
+ "epoch": 54
+ },
+ {
+ "hidden_norms_cls": [
+ 46.683528900146484,
+ 39922192.0,
+ 40544356.0,
+ 48855360.0,
+ 63435588.0
+ ],
+ "hidden_norms_avg": [
+ 1002.31494140625,
+ 33437468.0,
+ 35316604.0,
+ 47039952.0,
+ 63236136.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.79724281426752e-05,
+ 4.357196548010478e-10,
+ 3.0789479299464517e-10,
+ 2.8999944112761966e-10,
+ 2.7672003577450255e-10
+ ],
+ "bp_grad_F": [
+ 0.009082098491489887,
+ 6.448025487770792e-06,
+ 2.3372145108169207e-08,
+ 1.58603672417712e-08,
+ 1.0855457865943663e-08
+ ],
+ "gamma_dfa": 8.819025242701173e-05,
+ "gamma_dfa_per_layer": [
+ -0.0015805144794285297,
+ 0.0013432127889245749,
+ 0.000321696512401104,
+ 0.00026836618781089783
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.0517051219940186,
+ "epoch": 55
+ },
+ {
+ "hidden_norms_cls": [
+ 46.70249938964844,
+ 40094040.0,
+ 40695052.0,
+ 48969004.0,
+ 63542232.0
+ ],
+ "hidden_norms_avg": [
+ 1002.7830810546875,
+ 33826664.0,
+ 35653116.0,
+ 47279168.0,
+ 63409756.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8208709409227595e-05,
+ 4.3868975119210063e-10,
+ 3.102354484418868e-10,
+ 2.8893865078316594e-10,
+ 2.794520170823489e-10
+ ],
+ "bp_grad_F": [
+ 0.012775770388543606,
+ 3.5907680285163224e-05,
+ 3.276610627267473e-08,
+ 1.9733393585852355e-08,
+ 1.0837335473468102e-08
+ ],
+ "gamma_dfa": -7.604052370879799e-06,
+ "gamma_dfa_per_layer": [
+ -0.0020841513760387897,
+ 0.001464233035221696,
+ 0.0003138828033115715,
+ 0.0002756193280220032
+ ],
+ "acc_eval": 0.2509765625,
+ "loss_eval": 2.053762912750244,
+ "epoch": 56
+ },
+ {
+ "hidden_norms_cls": [
+ 46.71390914916992,
+ 39990840.0,
+ 40613704.0,
+ 48947088.0,
+ 63626668.0
+ ],
+ "hidden_norms_avg": [
+ 1003.0780639648438,
+ 33512400.0,
+ 35398544.0,
+ 47052320.0,
+ 63319172.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.8852005925728008e-05,
+ 4.408986231663192e-10,
+ 3.0767774439333095e-10,
+ 2.8811911190196327e-10,
+ 2.780060626150771e-10
+ ],
+ "bp_grad_F": [
+ 0.017775027081370354,
+ 2.9518716473830864e-05,
+ 1.6785485001946654e-08,
+ 1.3991450664718741e-08,
+ 1.082214762249123e-08
+ ],
+ "gamma_dfa": 0.0001292051310883835,
+ "gamma_dfa_per_layer": [
+ -0.001528067048639059,
+ 0.0014583747833967209,
+ 0.0003044582554139197,
+ 0.0002820545341819525
+ ],
+ "acc_eval": 0.2548828125,
+ "loss_eval": 2.0512585639953613,
+ "epoch": 57
+ },
+ {
+ "hidden_norms_cls": [
+ 46.72029495239258,
+ 40048976.0,
+ 40673908.0,
+ 49005780.0,
+ 63650516.0
+ ],
+ "hidden_norms_avg": [
+ 1003.2393188476562,
+ 33518072.0,
+ 35408260.0,
+ 47059300.0,
+ 63337588.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 3.040391493414063e-05,
+ 4.422071042675668e-10,
+ 3.0922153726464785e-10,
+ 2.885988392709038e-10,
+ 2.7767882437856883e-10
+ ],
+ "bp_grad_F": [
+ 0.05996337905526161,
+ 4.702213846030645e-05,
+ 2.0060964445178797e-08,
+ 1.6814832193290385e-08,
+ 1.0825355722943186e-08
+ ],
+ "gamma_dfa": 6.977042357902974e-05,
+ "gamma_dfa_per_layer": [
+ -0.0016858375165611506,
+ 0.001342209754511714,
+ 0.00032920570811256766,
+ 0.00029350374825298786
+ ],
+ "acc_eval": 0.25390625,
+ "loss_eval": 2.0525753498077393,
+ "epoch": 58
+ },
+ {
+ "hidden_norms_cls": [
+ 46.723426818847656,
+ 40078224.0,
+ 40696452.0,
+ 49005116.0,
+ 63676392.0
+ ],
+ "hidden_norms_avg": [
+ 1003.3213500976562,
+ 33528454.0,
+ 35420932.0,
+ 47084140.0,
+ 63362884.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.9969949537189677e-05,
+ 4.438247824811725e-10,
+ 3.0574925924398144e-10,
+ 2.876155424935689e-10,
+ 2.772651552795935e-10
+ ],
+ "bp_grad_F": [
+ 0.015555496327579021,
+ 1.9468383470666595e-05,
+ 2.2645199493354085e-08,
+ 2.0153352764396004e-08,
+ 1.082723954937137e-08
+ ],
+ "gamma_dfa": -2.766123361652717e-05,
+ "gamma_dfa_per_layer": [
+ -0.0021022262517362833,
+ 0.0013793597463518381,
+ 0.0003187692491337657,
+ 0.0002934523217845708
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.05129337310791,
+ "epoch": 59
+ },
+ {
+ "hidden_norms_cls": [
+ 46.72323226928711,
+ 40073516.0,
+ 40694276.0,
+ 48970848.0,
+ 63674696.0
+ ],
+ "hidden_norms_avg": [
+ 1003.3206176757812,
+ 33517796.0,
+ 35411552.0,
+ 47074216.0,
+ 63356572.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 2.986433173646219e-05,
+ 4.4209438887499175e-10,
+ 3.069269838285038e-10,
+ 2.8717661582078335e-10,
+ 2.7721389073143143e-10
+ ],
+ "bp_grad_F": [
+ 0.011835500597953796,
+ 1.2977254300494678e-05,
+ 2.7325663509714104e-08,
+ 2.23609397664859e-08,
+ 1.0828303587118171e-08
+ ],
+ "gamma_dfa": 4.879416519543156e-05,
+ "gamma_dfa_per_layer": [
+ -0.0018596879672259092,
+ 0.0014319919282570481,
+ 0.0003201703366357833,
+ 0.00030270236311480403
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.051326274871826,
+ "epoch": 60
+ }
+ ]
+} \ No newline at end of file