diff options
Diffstat (limited to 'results/snapshot_vit_v1/snapshot_vit_s456.json')
| -rw-r--r-- | results/snapshot_vit_v1/snapshot_vit_s456.json | 4594 |
1 files changed, 4594 insertions, 0 deletions
diff --git a/results/snapshot_vit_v1/snapshot_vit_s456.json b/results/snapshot_vit_v1/snapshot_vit_s456.json new file mode 100644 index 0000000..1b43b92 --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_vit_s456.json @@ -0,0 +1,4594 @@ +{ + "config": { + "output_dir": "results/snapshot_vit_v1", + "epochs": 60, + "lr": 0.001, + "wd": 0.05, + "seed": 456, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.3042769432067871, + 3.2273340225219727, + 4.6926493644714355, + 6.003997802734375, + 6.652705669403076 + ], + "hidden_norms_avg": [ + 6.027750492095947, + 7.1044697761535645, + 7.910475730895996, + 8.79189682006836, + 9.458833694458008 + ], + "bp_grad_per_sample_l2_med": [ + 0.005248428788036108, + 0.0012287507997825742, + 0.0010387187357991934, + 0.0009678652859292924, + 0.0009174557635560632 + ], + "bp_grad_F": [ + 0.248850479722023, + 0.0424945093691349, + 0.0348997563123703, + 0.03202275559306145, + 0.030239813029766083 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.0791015625, + "loss_eval": 2.544933319091797, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.47296053171157837, + 11.65749454498291, + 18.3483943939209, + 24.296405792236328, + 29.94684410095215 + ], + "hidden_norms_avg": [ + 4.04442834854126, + 9.927255630493164, + 14.762720108032227, + 19.817049026489258, + 24.69188690185547 + ], + "bp_grad_per_sample_l2_med": [ + 0.0025219416711479425, + 0.00024655580637045205, + 0.00017099862452596426, + 0.0001493149611633271, + 0.00015047143097035587 + ], + "bp_grad_F": [ + 0.11354690045118332, + 0.00995445717126131, + 0.006139951758086681, + 0.005140931811183691, + 0.005088545847684145 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.458984375, + "loss_eval": 1.4817876815795898, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.6174129843711853, + 12.388140678405762, + 20.656904220581055, + 27.073535919189453, + 32.43647003173828 + ], + "hidden_norms_avg": [ + 3.8196825981140137, + 10.982677459716797, + 17.020437240600586, + 22.471168518066406, + 27.064218521118164 + ], + "bp_grad_per_sample_l2_med": [ + 0.0020673249382525682, + 0.0002501676499377936, + 0.00015905944746918976, + 0.00013718422269448638, + 0.0001328626531176269 + ], + "bp_grad_F": [ + 0.09556808322668076, + 0.01051106583327055, + 0.005822391714900732, + 0.004766201134771109, + 0.004577947780489922 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.498046875, + "loss_eval": 1.356250286102295, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.7216586470603943, + 12.527997016906738, + 19.815393447875977, + 26.452791213989258, + 30.71564483642578 + ], + "hidden_norms_avg": [ + 3.8907485008239746, + 11.261369705200195, + 16.61492156982422, + 21.57110023498535, + 24.978900909423828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0021546317730098963, + 0.00030062923906371, + 0.00018509272194933146, + 0.00013865686196368188, + 0.00012920796871185303 + ], + "bp_grad_F": [ + 0.10040326416492462, + 0.012564396485686302, + 0.007171053439378738, + 0.005316051654517651, + 0.004880763124674559 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5263671875, + "loss_eval": 1.2655537128448486, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.8026084899902344, + 12.023736953735352, + 20.35123062133789, + 26.937381744384766, + 31.122047424316406 + ], + "hidden_norms_avg": [ + 3.9065797328948975, + 11.544925689697266, + 17.131011962890625, + 22.292007446289062, + 25.61225128173828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019258656539022923, + 0.00027825392317026854, + 0.00017385024693794549, + 0.0001323536125710234, + 0.00012172113929409534 + ], + "bp_grad_F": [ + 0.09238748997449875, + 0.01207020040601492, + 0.007036368828266859, + 0.005208354443311691, + 0.0047498126514256 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5673828125, + "loss_eval": 1.1375834941864014, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.8784403204917908, + 11.689644813537598, + 20.318578720092773, + 27.47210121154785, + 30.616111755371094 + ], + "hidden_norms_avg": [ + 3.991969585418701, + 11.499222755432129, + 17.010013580322266, + 21.869060516357422, + 24.784456253051758 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017466156277805567, + 0.00030884172883816063, + 0.00018451173673383892, + 0.00013519970525521785, + 0.00011779358464991674 + ], + "bp_grad_F": [ + 0.0881652981042862, + 0.014197942800819874, + 0.008167672902345657, + 0.00570154283195734, + 0.0048713223077356815 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.611328125, + "loss_eval": 1.078152060508728, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.9501535892486572, + 12.59860610961914, + 20.491111755371094, + 27.280519485473633, + 30.350204467773438 + ], + "hidden_norms_avg": [ + 4.104201793670654, + 12.098063468933105, + 17.173715591430664, + 21.416263580322266, + 24.0885066986084 + ], + "bp_grad_per_sample_l2_med": [ + 0.001603498705662787, + 0.0003018827992491424, + 0.00017963100981432945, + 0.00013513887824956328, + 0.00010907831892836839 + ], + "bp_grad_F": [ + 0.08621370792388916, + 0.01517424639314413, + 0.008794959634542465, + 0.006117440760135651, + 0.0050094337202608585 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6337890625, + "loss_eval": 1.0198562145233154, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 1.000899076461792, + 12.766633987426758, + 21.096908569335938, + 28.377235412597656, + 31.630756378173828 + ], + "hidden_norms_avg": [ + 4.143934726715088, + 13.046825408935547, + 18.295841217041016, + 23.147098541259766, + 25.70033836364746 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015043691964820027, + 0.00027919537387788296, + 0.0001850408734753728, + 0.0001339056616416201, + 0.00011227549111936241 + ], + "bp_grad_F": [ + 0.07296615093946457, + 0.012746848165988922, + 0.00809843186289072, + 0.005660817492753267, + 0.00492064468562603 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6357421875, + "loss_eval": 1.0125277042388916, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 1.0544841289520264, + 10.223775863647461, + 18.59557342529297, + 26.47129249572754, + 29.77008819580078 + ], + "hidden_norms_avg": [ + 4.213057994842529, + 13.021050453186035, + 18.172080993652344, + 22.743032455444336, + 25.225244522094727 + ], + "bp_grad_per_sample_l2_med": [ + 0.001364147407002747, + 0.0002890345931518823, + 0.00017917664081323892, + 0.000133156034280546, + 0.00011372177687007934 + ], + "bp_grad_F": [ + 0.07409710437059402, + 0.015113108791410923, + 0.00921319704502821, + 0.006366679444909096, + 0.005320113617926836 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6376953125, + "loss_eval": 0.9630928039550781, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 1.1071640253067017, + 12.073644638061523, + 19.524917602539062, + 26.858781814575195, + 30.318849563598633 + ], + "hidden_norms_avg": [ + 4.280055522918701, + 13.520170211791992, + 18.620624542236328, + 22.658164978027344, + 25.25646209716797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012990576215088367, + 0.00027366873109713197, + 0.00016998387582134455, + 0.00012336595682427287, + 9.77109739324078e-05 + ], + "bp_grad_F": [ + 0.07662060856819153, + 0.015166237019002438, + 0.0096206646412611, + 0.006477049086242914, + 0.005294579081237316 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.654296875, + "loss_eval": 0.9390516877174377, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 1.1426520347595215, + 12.005794525146484, + 20.33642578125, + 27.80829429626465, + 31.22698974609375 + ], + "hidden_norms_avg": [ + 4.328567981719971, + 13.725446701049805, + 19.644866943359375, + 23.91346549987793, + 26.409910202026367 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012125002685934305, + 0.00027867915923707187, + 0.00017298922466579825, + 0.0001231397909577936, + 0.00010014672443503514 + ], + "bp_grad_F": [ + 0.06728038191795349, + 0.014830472879111767, + 0.008772061206400394, + 0.006222804542630911, + 0.00518346531316638 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6708984375, + "loss_eval": 0.8987849950790405, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 1.182861089706421, + 11.343650817871094, + 19.158103942871094, + 26.537256240844727, + 29.248126983642578 + ], + "hidden_norms_avg": [ + 4.343320846557617, + 13.940053939819336, + 19.19382667541504, + 23.443157196044922, + 25.7342529296875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012841055868193507, + 0.00029811219428665936, + 0.00019176788919139653, + 0.0001351374085061252, + 0.00010611475590849295 + ], + "bp_grad_F": [ + 0.07373103499412537, + 0.015750709921121597, + 0.010071114636957645, + 0.007257349323481321, + 0.00578929902985692 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6708984375, + "loss_eval": 0.9137783646583557, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 1.2363859415054321, + 11.583894729614258, + 18.828346252441406, + 26.30917739868164, + 29.363861083984375 + ], + "hidden_norms_avg": [ + 4.441896915435791, + 13.568662643432617, + 18.774181365966797, + 22.73027801513672, + 24.84675407409668 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011289563262835145, + 0.00029387036920525134, + 0.0001886928512249142, + 0.00013024669897276908, + 9.712533210404217e-05 + ], + "bp_grad_F": [ + 0.06850193440914154, + 0.016727343201637268, + 0.010432050563395023, + 0.00744031835347414, + 0.0057919141836464405 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6865234375, + "loss_eval": 0.8655319809913635, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 1.276246428489685, + 11.161674499511719, + 18.18111801147461, + 24.498512268066406, + 28.472366333007812 + ], + "hidden_norms_avg": [ + 4.438092231750488, + 13.71449089050293, + 18.358896255493164, + 21.998794555664062, + 24.44672966003418 + ], + "bp_grad_per_sample_l2_med": [ + 0.001100392546504736, + 0.0002873367629945278, + 0.00018384194117970765, + 0.0001337265275651589, + 9.951705578714609e-05 + ], + "bp_grad_F": [ + 0.06749056279659271, + 0.01716373674571514, + 0.010762249119579792, + 0.007881316356360912, + 0.005892573855817318 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6982421875, + "loss_eval": 0.8163608908653259, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 1.3131792545318604, + 11.034884452819824, + 17.936412811279297, + 24.541194915771484, + 28.02472496032715 + ], + "hidden_norms_avg": [ + 4.504117012023926, + 13.86273193359375, + 18.456012725830078, + 22.296085357666016, + 24.57513427734375 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010489820269867778, + 0.0002784461830742657, + 0.00018129698582924902, + 0.00013628850865643471, + 0.00010334269609302282 + ], + "bp_grad_F": [ + 0.06553377211093903, + 0.016712775453925133, + 0.010981550440192223, + 0.007675213273614645, + 0.006061363499611616 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.69921875, + "loss_eval": 0.8088906407356262, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 1.3631325960159302, + 10.72367000579834, + 17.147600173950195, + 23.750171661376953, + 26.97018051147461 + ], + "hidden_norms_avg": [ + 4.5338335037231445, + 13.55031967163086, + 17.503305435180664, + 21.003847122192383, + 23.168630599975586 + ], + "bp_grad_per_sample_l2_med": [ + 0.0010022176429629326, + 0.0002914569922722876, + 0.00018890199135057628, + 0.00013593978655990213, + 0.00010251985804643482 + ], + "bp_grad_F": [ + 0.06372744590044022, + 0.017576243728399277, + 0.011715950444340706, + 0.008481587283313274, + 0.006441249046474695 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.701171875, + "loss_eval": 0.815929651260376, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 1.3926054239273071, + 10.609240531921387, + 17.234729766845703, + 23.659292221069336, + 27.24931526184082 + ], + "hidden_norms_avg": [ + 4.513574600219727, + 13.48448371887207, + 17.66766929626465, + 21.098644256591797, + 23.213909149169922 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008784966776147485, + 0.0002452125190757215, + 0.0001629967155167833, + 0.00012193062138976529, + 8.820713992463425e-05 + ], + "bp_grad_F": [ + 0.06515656411647797, + 0.017664309591054916, + 0.011493389494717121, + 0.008405888453125954, + 0.006338838487863541 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.71875, + "loss_eval": 0.7755489349365234, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 1.4288005828857422, + 9.991934776306152, + 16.30902671813965, + 22.53181266784668, + 25.98328971862793 + ], + "hidden_norms_avg": [ + 4.606818199157715, + 13.761014938354492, + 18.061887741088867, + 21.805465698242188, + 23.856918334960938 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008885160204954445, + 0.00026409278507344425, + 0.0001749310758896172, + 0.00012756467913277447, + 8.965048618847504e-05 + ], + "bp_grad_F": [ + 0.07283030450344086, + 0.01973560079932213, + 0.013354410417377949, + 0.009586230851709843, + 0.006897584535181522 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.693359375, + "loss_eval": 0.8082709908485413, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 1.4623849391937256, + 9.794211387634277, + 16.102649688720703, + 21.62982940673828, + 25.186201095581055 + ], + "hidden_norms_avg": [ + 4.6317901611328125, + 13.527764320373535, + 17.6087589263916, + 21.295202255249023, + 23.361501693725586 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008634055848233402, + 0.0002727442770265043, + 0.00018466924666427076, + 0.00013278424739837646, + 8.995016105473042e-05 + ], + "bp_grad_F": [ + 0.06913765519857407, + 0.02126000076532364, + 0.014007972553372383, + 0.010056250728666782, + 0.00732502993196249 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.720703125, + "loss_eval": 0.7786685824394226, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 1.4771180152893066, + 9.776408195495605, + 15.485087394714355, + 21.054513931274414, + 25.07387351989746 + ], + "hidden_norms_avg": [ + 4.570744514465332, + 13.13935375213623, + 16.70624351501465, + 20.002471923828125, + 22.400487899780273 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008809147984720767, + 0.00026235057157464325, + 0.0001801249454729259, + 0.0001285924663534388, + 8.227767830248922e-05 + ], + "bp_grad_F": [ + 0.07356031239032745, + 0.02142982743680477, + 0.014684871770441532, + 0.010477974079549313, + 0.007170504424721003 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7412109375, + "loss_eval": 0.7548146843910217, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 1.4932866096496582, + 9.586905479431152, + 15.190006256103516, + 20.53044891357422, + 23.871917724609375 + ], + "hidden_norms_avg": [ + 4.640237808227539, + 13.333914756774902, + 16.603134155273438, + 19.70735740661621, + 21.712968826293945 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008201555465348065, + 0.00025074987206608057, + 0.00018013773660641164, + 0.0001373633131152019, + 8.871335012372583e-05 + ], + "bp_grad_F": [ + 0.07453557848930359, + 0.02180560864508152, + 0.015117364004254341, + 0.010920760221779346, + 0.007648298051208258 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7294921875, + "loss_eval": 0.7338082790374756, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 1.5380369424819946, + 8.941458702087402, + 14.383026123046875, + 19.64396858215332, + 23.333805084228516 + ], + "hidden_norms_avg": [ + 4.57804012298584, + 12.777068138122559, + 15.852535247802734, + 19.008466720581055, + 21.123043060302734 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007403296767733991, + 0.00023140048142522573, + 0.0001578826195327565, + 0.00011260491737630218, + 7.754044054308906e-05 + ], + "bp_grad_F": [ + 0.07555028051137924, + 0.024111615493893623, + 0.01656532846391201, + 0.01178746297955513, + 0.007888367399573326 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.744140625, + "loss_eval": 0.7344021201133728, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 1.5561290979385376, + 9.454068183898926, + 14.400370597839355, + 19.253843307495117, + 22.27718734741211 + ], + "hidden_norms_avg": [ + 4.687749862670898, + 12.994861602783203, + 15.969095230102539, + 18.976381301879883, + 20.873851776123047 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008383935783058405, + 0.0002680755569599569, + 0.000193025975022465, + 0.00013935549941379577, + 9.83258432825096e-05 + ], + "bp_grad_F": [ + 0.06634547561407089, + 0.021603766828775406, + 0.01579204760491848, + 0.011702721007168293, + 0.008362310007214546 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.734375, + "loss_eval": 0.7299590110778809, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 1.5774884223937988, + 8.741745948791504, + 13.803518295288086, + 18.90570831298828, + 22.218149185180664 + ], + "hidden_norms_avg": [ + 4.594933032989502, + 12.66419506072998, + 15.714310646057129, + 19.085254669189453, + 21.135629653930664 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006682098028250039, + 0.00022848948719911277, + 0.00016414522542618215, + 0.0001115989507525228, + 7.056116737658158e-05 + ], + "bp_grad_F": [ + 0.07456765323877335, + 0.024261610582470894, + 0.01710386760532856, + 0.012147205881774426, + 0.008177526295185089 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.699420154094696, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 1.576693058013916, + 8.762345314025879, + 13.443113327026367, + 18.230920791625977, + 22.07720375061035 + ], + "hidden_norms_avg": [ + 4.667433738708496, + 12.606098175048828, + 15.544108390808105, + 18.674053192138672, + 20.65712547302246 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006520473980344832, + 0.00022687950695399195, + 0.0001629517209948972, + 0.00011739470210159197, + 7.377319707302377e-05 + ], + "bp_grad_F": [ + 0.08037886768579483, + 0.026545122265815735, + 0.0190938338637352, + 0.013439938426017761, + 0.00869175884872675 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7353515625, + "loss_eval": 0.733207106590271, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 1.5915056467056274, + 8.431538581848145, + 13.075739860534668, + 17.782840728759766, + 20.799991607666016 + ], + "hidden_norms_avg": [ + 4.626980304718018, + 12.152971267700195, + 14.936114311218262, + 18.13477325439453, + 19.853097915649414 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007118558278307319, + 0.00024262107035610825, + 0.0001753592659952119, + 0.00012127246736781672, + 7.87421886343509e-05 + ], + "bp_grad_F": [ + 0.0734892264008522, + 0.025602566078305244, + 0.018658706918358803, + 0.013666817918419838, + 0.009108936414122581 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7578125, + "loss_eval": 0.6893049478530884, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 1.589570164680481, + 8.064777374267578, + 12.609880447387695, + 17.195837020874023, + 20.27288818359375 + ], + "hidden_norms_avg": [ + 4.651576995849609, + 12.02392578125, + 14.5856351852417, + 17.578563690185547, + 19.327190399169922 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006660808576270938, + 0.0002373493480263278, + 0.0001695255923550576, + 0.00012064678594470024, + 7.89113255450502e-05 + ], + "bp_grad_F": [ + 0.08072065562009811, + 0.02827218733727932, + 0.020335549488663673, + 0.014427169226109982, + 0.009556911885738373 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.755859375, + "loss_eval": 0.7047942876815796, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 1.6077263355255127, + 7.734760284423828, + 11.882841110229492, + 15.991426467895508, + 19.111549377441406 + ], + "hidden_norms_avg": [ + 4.672310829162598, + 11.994673728942871, + 14.48837661743164, + 16.922487258911133, + 18.498437881469727 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005716760642826557, + 0.00020494087948463857, + 0.0001548439176985994, + 0.00011144367454107851, + 6.537805165862665e-05 + ], + "bp_grad_F": [ + 0.08237622678279877, + 0.03036416694521904, + 0.022357620298862457, + 0.01651921682059765, + 0.010484294034540653 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7548828125, + "loss_eval": 0.6863161325454712, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 1.6167913675308228, + 7.661223411560059, + 11.857555389404297, + 16.11384391784668, + 19.207155227661133 + ], + "hidden_norms_avg": [ + 4.6568603515625, + 11.916447639465332, + 14.127670288085938, + 16.765464782714844, + 18.548715591430664 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006015675025992095, + 0.00022187062131706625, + 0.00015665855607949197, + 0.00011372221342753619, + 6.673130701528862e-05 + ], + "bp_grad_F": [ + 0.08522997796535492, + 0.03222256526350975, + 0.023626696318387985, + 0.01693013124167919, + 0.010611210018396378 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.75390625, + "loss_eval": 0.6998279094696045, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 1.6032800674438477, + 7.3315229415893555, + 11.458590507507324, + 15.827820777893066, + 19.03597640991211 + ], + "hidden_norms_avg": [ + 4.592748641967773, + 11.431793212890625, + 13.694733619689941, + 16.380725860595703, + 17.913341522216797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006015695980750024, + 0.00023376141325570643, + 0.00015724304830655456, + 0.00010976113844662905, + 6.412796210497618e-05 + ], + "bp_grad_F": [ + 0.09064542502164841, + 0.03456525132060051, + 0.02491987682878971, + 0.01721413992345333, + 0.010797572322189808 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7734375, + "loss_eval": 0.6845672130584717, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 1.6067036390304565, + 7.343894004821777, + 11.072548866271973, + 15.027584075927734, + 17.731834411621094 + ], + "hidden_norms_avg": [ + 4.656601428985596, + 11.393535614013672, + 13.465471267700195, + 15.975980758666992, + 17.53518295288086 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005384382093325257, + 0.00021189975086599588, + 0.0001552984758745879, + 0.00010658086830517277, + 6.326750008156523e-05 + ], + "bp_grad_F": [ + 0.08886278420686722, + 0.03500310331583023, + 0.025932280346751213, + 0.018638672307133675, + 0.011571940965950489 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7666015625, + "loss_eval": 0.6816176772117615, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 1.6034201383590698, + 7.28795051574707, + 10.777915000915527, + 14.885525703430176, + 17.61635398864746 + ], + "hidden_norms_avg": [ + 4.614856719970703, + 11.156272888183594, + 13.103291511535645, + 15.514464378356934, + 16.799636840820312 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005928887985646725, + 0.0002398774668108672, + 0.00018353872292209417, + 0.00012629387492779642, + 8.196983981179073e-05 + ], + "bp_grad_F": [ + 0.09026212245225906, + 0.03624382242560387, + 0.027555860579013824, + 0.019604889675974846, + 0.012266743928194046 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7578125, + "loss_eval": 0.6996170878410339, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 1.611714243888855, + 7.183743953704834, + 10.724074363708496, + 14.5570650100708, + 17.022544860839844 + ], + "hidden_norms_avg": [ + 4.623075485229492, + 11.19589614868164, + 13.009132385253906, + 15.365489959716797, + 16.62962532043457 + ], + "bp_grad_per_sample_l2_med": [ + 0.00036223753704689443, + 0.00014417112106457353, + 0.00010984936670865864, + 8.023829286685213e-05, + 4.624977009370923e-05 + ], + "bp_grad_F": [ + 0.09605100005865097, + 0.03848516568541527, + 0.029046298936009407, + 0.021008647978305817, + 0.012804670259356499 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7666015625, + "loss_eval": 0.6707476377487183, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 1.6100214719772339, + 6.872183322906494, + 10.294036865234375, + 14.205705642700195, + 17.145418167114258 + ], + "hidden_norms_avg": [ + 4.6112518310546875, + 11.086106300354004, + 12.928976058959961, + 15.350056648254395, + 16.69057846069336 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041789902024902403, + 0.00017518684035167098, + 0.0001297849084949121, + 8.867425640346482e-05, + 4.886053648078814e-05 + ], + "bp_grad_F": [ + 0.10439282655715942, + 0.04290134832262993, + 0.03223341330885887, + 0.02269606664776802, + 0.013486144132912159 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.759765625, + "loss_eval": 0.7303465604782104, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 1.5996708869934082, + 6.756699085235596, + 9.930717468261719, + 13.55428695678711, + 16.25560188293457 + ], + "hidden_norms_avg": [ + 4.561036109924316, + 10.72261905670166, + 12.331817626953125, + 14.622406005859375, + 16.10407829284668 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004882134380750358, + 0.0002138838026439771, + 0.00016901774506550282, + 0.0001125320850405842, + 6.579834007425234e-05 + ], + "bp_grad_F": [ + 0.10555483400821686, + 0.043922487646341324, + 0.03336327522993088, + 0.02399253286421299, + 0.013897648081183434 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7744140625, + "loss_eval": 0.71100252866745, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 1.5904232263565063, + 6.662050247192383, + 9.66409683227539, + 13.113885879516602, + 15.527644157409668 + ], + "hidden_norms_avg": [ + 4.5454936027526855, + 10.621905326843262, + 12.306397438049316, + 14.576898574829102, + 15.954529762268066 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004819612659048289, + 0.00020982844580430537, + 0.00015760491078253835, + 0.00010895934246946126, + 5.958566543995403e-05 + ], + "bp_grad_F": [ + 0.10991083830595016, + 0.047212228178977966, + 0.03634340688586235, + 0.02575613744556904, + 0.014786512590944767 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7705078125, + "loss_eval": 0.7015272378921509, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 1.5926766395568848, + 6.752022743225098, + 9.809683799743652, + 13.14870548248291, + 15.66618537902832 + ], + "hidden_norms_avg": [ + 4.554390907287598, + 10.59433650970459, + 12.38070011138916, + 14.597192764282227, + 15.870081901550293 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043442551395855844, + 0.0001767174544511363, + 0.0001353291590930894, + 9.88640749710612e-05, + 5.115106250741519e-05 + ], + "bp_grad_F": [ + 0.11412353813648224, + 0.04936130344867706, + 0.03786878660321236, + 0.027230119332671165, + 0.015144454315304756 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7734375, + "loss_eval": 0.7246569395065308, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 1.5873360633850098, + 6.424077987670898, + 9.43139934539795, + 12.677597999572754, + 15.172491073608398 + ], + "hidden_norms_avg": [ + 4.4964070320129395, + 10.287262916564941, + 11.751147270202637, + 13.867583274841309, + 15.24795150756836 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004166838189121336, + 0.0001985515555134043, + 0.00014922211994417012, + 0.0001073441599146463, + 5.765057721873745e-05 + ], + "bp_grad_F": [ + 0.11522030830383301, + 0.05126715078949928, + 0.039791759103536606, + 0.028239542618393898, + 0.015849631279706955 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.76953125, + "loss_eval": 0.7268451452255249, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 1.5890607833862305, + 6.295929431915283, + 9.119135856628418, + 12.20608901977539, + 14.642122268676758 + ], + "hidden_norms_avg": [ + 4.5021796226501465, + 10.095436096191406, + 11.7933988571167, + 13.924290657043457, + 15.25149917602539 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004105751868337393, + 0.00017681249300949275, + 0.00014306302182376385, + 9.77686358965002e-05, + 5.147796036908403e-05 + ], + "bp_grad_F": [ + 0.12662801146507263, + 0.057947222143411636, + 0.044759348034858704, + 0.03212600201368332, + 0.017064588144421577 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7587890625, + "loss_eval": 0.7464388012886047, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 1.5761758089065552, + 6.18004846572876, + 9.069403648376465, + 12.180702209472656, + 14.516327857971191 + ], + "hidden_norms_avg": [ + 4.492326736450195, + 9.971968650817871, + 11.50478744506836, + 13.5086669921875, + 14.760706901550293 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003273288893979043, + 0.00015071693633217365, + 0.00011665018246276304, + 8.30927092465572e-05, + 4.371673639980145e-05 + ], + "bp_grad_F": [ + 0.1212363913655281, + 0.055609479546546936, + 0.04309426248073578, + 0.0311796423047781, + 0.016882745549082756 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.7176246643066406, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 1.5679142475128174, + 6.109372615814209, + 8.818140029907227, + 11.853668212890625, + 14.200343132019043 + ], + "hidden_norms_avg": [ + 4.478363037109375, + 9.777668952941895, + 11.217857360839844, + 13.170299530029297, + 14.35566520690918 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003435175749473274, + 0.00015563883061986417, + 0.00011927648301934823, + 8.298752072732896e-05, + 4.157157673034817e-05 + ], + "bp_grad_F": [ + 0.13136376440525055, + 0.06076597049832344, + 0.046719472855329514, + 0.033368490636348724, + 0.01777712069451809 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78125, + "loss_eval": 0.7149413228034973, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 1.5576080083847046, + 6.149768829345703, + 8.711091041564941, + 11.498035430908203, + 13.903903007507324 + ], + "hidden_norms_avg": [ + 4.435859680175781, + 9.742182731628418, + 10.966800689697266, + 12.826833724975586, + 13.987249374389648 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002820935333147645, + 0.00013546310947276652, + 0.00010691316856537014, + 7.935341272968799e-05, + 4.027710747322999e-05 + ], + "bp_grad_F": [ + 0.1424364149570465, + 0.0660286620259285, + 0.05190045386552811, + 0.037452246993780136, + 0.019488148391246796 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.759765625, + "loss_eval": 0.7794969081878662, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 1.55929696559906, + 6.027406215667725, + 8.56254768371582, + 11.315313339233398, + 13.816405296325684 + ], + "hidden_norms_avg": [ + 4.444095611572266, + 9.598461151123047, + 11.017721176147461, + 12.939472198486328, + 14.150469779968262 + ], + "bp_grad_per_sample_l2_med": [ + 0.00028881963226012886, + 0.00014081982953939587, + 0.00010864014620892704, + 7.903494406491518e-05, + 3.460505831753835e-05 + ], + "bp_grad_F": [ + 0.14435029029846191, + 0.06792720407247543, + 0.05288391932845116, + 0.03809889778494835, + 0.0192741546779871 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.7500836253166199, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 1.5569288730621338, + 5.83992338180542, + 8.285759925842285, + 11.15902328491211, + 13.44404125213623 + ], + "hidden_norms_avg": [ + 4.416918754577637, + 9.525116920471191, + 10.900503158569336, + 12.753186225891113, + 13.810358047485352 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003584402147680521, + 0.00016757070261519402, + 0.000135006892378442, + 8.858168439473957e-05, + 4.690655987360515e-05 + ], + "bp_grad_F": [ + 0.14751866459846497, + 0.07057010382413864, + 0.05518123507499695, + 0.039941366761922836, + 0.019994540140032768 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.783203125, + "loss_eval": 0.7740926146507263, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 1.5507482290267944, + 5.7182297706604, + 8.143424034118652, + 10.900334358215332, + 13.179159164428711 + ], + "hidden_norms_avg": [ + 4.415921688079834, + 9.42380142211914, + 10.672327995300293, + 12.439417839050293, + 13.481410026550293 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002743537479545921, + 0.00013802653120364994, + 0.00010440178448334336, + 7.395831926260144e-05, + 3.546295192791149e-05 + ], + "bp_grad_F": [ + 0.15799099206924438, + 0.0763181671500206, + 0.060047682374715805, + 0.043460771441459656, + 0.02125636488199234 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78125, + "loss_eval": 0.7693630456924438, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 1.5424573421478271, + 5.688177585601807, + 7.995815753936768, + 10.642090797424316, + 12.71364688873291 + ], + "hidden_norms_avg": [ + 4.399099349975586, + 9.228434562683105, + 10.541167259216309, + 12.30521297454834, + 13.311983108520508 + ], + "bp_grad_per_sample_l2_med": [ + 0.00024789522285573184, + 0.0001290303043788299, + 9.614775626687333e-05, + 6.680067599518225e-05, + 3.041914533241652e-05 + ], + "bp_grad_F": [ + 0.16617916524410248, + 0.08274275809526443, + 0.06457101553678513, + 0.04608331620693207, + 0.02214660868048668 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.77734375, + "loss_eval": 0.7963705062866211, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 1.5373201370239258, + 5.651702880859375, + 7.870075702667236, + 10.383352279663086, + 12.742950439453125 + ], + "hidden_norms_avg": [ + 4.359274387359619, + 9.120989799499512, + 10.328361511230469, + 11.979691505432129, + 13.047332763671875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020789829432033002, + 0.00010236673551844433, + 8.31241559353657e-05, + 5.5589163821423426e-05, + 2.5046059818123467e-05 + ], + "bp_grad_F": [ + 0.1711728274822235, + 0.08452030271291733, + 0.06641850620508194, + 0.048034753650426865, + 0.022233933210372925 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.796875, + "loss_eval": 0.787158727645874, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 1.534119725227356, + 5.64213752746582, + 7.87826681137085, + 10.351583480834961, + 12.802285194396973 + ], + "hidden_norms_avg": [ + 4.381091594696045, + 9.210761070251465, + 10.374320030212402, + 12.017292976379395, + 13.094472885131836 + ], + "bp_grad_per_sample_l2_med": [ + 0.00020434240286704153, + 9.69645261648111e-05, + 7.39863608032465e-05, + 5.592328670900315e-05, + 2.489626240276266e-05 + ], + "bp_grad_F": [ + 0.17339713871479034, + 0.08632633090019226, + 0.06861955672502518, + 0.05006933584809303, + 0.022428762167692184 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7919921875, + "loss_eval": 0.7851632833480835, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 1.5289297103881836, + 5.52672004699707, + 7.675796985626221, + 10.204718589782715, + 12.873387336730957 + ], + "hidden_norms_avg": [ + 4.3382954597473145, + 8.994754791259766, + 10.112909317016602, + 11.741432189941406, + 12.863862037658691 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001689869095571339, + 8.723067730898038e-05, + 6.962454062886536e-05, + 4.9918842705665156e-05, + 2.0077559383935295e-05 + ], + "bp_grad_F": [ + 0.1893138736486435, + 0.09529414772987366, + 0.07472710311412811, + 0.053626082837581635, + 0.023708311840891838 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7802734375, + "loss_eval": 0.8306612968444824, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 1.5282790660858154, + 5.412533760070801, + 7.559310436248779, + 10.040712356567383, + 12.344849586486816 + ], + "hidden_norms_avg": [ + 4.344850063323975, + 8.943357467651367, + 10.036619186401367, + 11.63318157196045, + 12.690427780151367 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015994974819477648, + 8.589095523348078e-05, + 6.632162694586441e-05, + 4.7776728024473414e-05, + 1.923311901919078e-05 + ], + "bp_grad_F": [ + 0.19004860520362854, + 0.09673094749450684, + 0.07585947215557098, + 0.05484768748283386, + 0.02464146539568901 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7880859375, + "loss_eval": 0.8193543553352356, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 1.5247719287872314, + 5.414742469787598, + 7.496610164642334, + 9.884673118591309, + 12.301740646362305 + ], + "hidden_norms_avg": [ + 4.334397792816162, + 8.873777389526367, + 9.937097549438477, + 11.524014472961426, + 12.564128875732422 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016137116472236812, + 8.459146192763001e-05, + 7.113611354725435e-05, + 4.750298467115499e-05, + 1.9900418919860385e-05 + ], + "bp_grad_F": [ + 0.1871533840894699, + 0.09687218815088272, + 0.0768747329711914, + 0.05509059876203537, + 0.024593451991677284 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.80078125, + "loss_eval": 0.810278058052063, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 1.5175530910491943, + 5.423762798309326, + 7.493518352508545, + 9.848480224609375, + 12.152653694152832 + ], + "hidden_norms_avg": [ + 4.333771228790283, + 8.846830368041992, + 9.895172119140625, + 11.470880508422852, + 12.51230239868164 + ], + "bp_grad_per_sample_l2_med": [ + 0.00018688049749471247, + 9.502686589257792e-05, + 7.833576091798022e-05, + 5.505367516889237e-05, + 2.1109613953740336e-05 + ], + "bp_grad_F": [ + 0.19925038516521454, + 0.10273440927267075, + 0.08146088570356369, + 0.05800405889749527, + 0.025326546281576157 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.79296875, + "loss_eval": 0.8315975069999695, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 1.5154390335083008, + 5.332769870758057, + 7.351593971252441, + 9.726226806640625, + 12.217824935913086 + ], + "hidden_norms_avg": [ + 4.312089443206787, + 8.77189826965332, + 9.80828857421875, + 11.376079559326172, + 12.424320220947266 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001625730947125703, + 8.300685294670984e-05, + 6.064521585358307e-05, + 4.498598718782887e-05, + 1.878884904726874e-05 + ], + "bp_grad_F": [ + 0.20003639161586761, + 0.10495735704898834, + 0.08297032862901688, + 0.059033025056123734, + 0.02547283098101616 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8281288146972656, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 1.5136713981628418, + 5.367674827575684, + 7.355134963989258, + 9.682082176208496, + 12.047696113586426 + ], + "hidden_norms_avg": [ + 4.316784381866455, + 8.783827781677246, + 9.812792778015137, + 11.395760536193848, + 12.420063018798828 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016071743448264897, + 7.887884567026049e-05, + 6.097723598941229e-05, + 4.243743751430884e-05, + 1.8102018657373264e-05 + ], + "bp_grad_F": [ + 0.20199808478355408, + 0.10541712492704391, + 0.0835103914141655, + 0.05967256799340248, + 0.025771932676434517 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8389135599136353, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 1.5129119157791138, + 5.326069355010986, + 7.275172233581543, + 9.633310317993164, + 12.064473152160645 + ], + "hidden_norms_avg": [ + 4.308472633361816, + 8.717856407165527, + 9.717677116394043, + 11.28734016418457, + 12.3176851272583 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015608215471729636, + 8.108095789793879e-05, + 6.294465129030868e-05, + 4.2116138502024114e-05, + 1.7733293134369887e-05 + ], + "bp_grad_F": [ + 0.20727074146270752, + 0.10958535224199295, + 0.08667060732841492, + 0.06113011762499809, + 0.026037005707621574 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.787109375, + "loss_eval": 0.8504288792610168, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 1.5120813846588135, + 5.313214302062988, + 7.253427982330322, + 9.583664894104004, + 12.01283073425293 + ], + "hidden_norms_avg": [ + 4.303354263305664, + 8.709893226623535, + 9.714727401733398, + 11.287162780761719, + 12.301621437072754 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014261712203733623, + 8.006545249372721e-05, + 6.104232306824997e-05, + 4.1361305193277076e-05, + 1.670202073000837e-05 + ], + "bp_grad_F": [ + 0.20587928593158722, + 0.10970292240381241, + 0.0869779959321022, + 0.06163511052727699, + 0.02630491554737091 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7919921875, + "loss_eval": 0.8500803709030151, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 1.5113301277160645, + 5.33270263671875, + 7.255039215087891, + 9.560588836669922, + 11.935233116149902 + ], + "hidden_norms_avg": [ + 4.311485767364502, + 8.737537384033203, + 9.710383415222168, + 11.27385425567627, + 12.309149742126465 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014448253205046058, + 7.629570609424263e-05, + 6.040706284693442e-05, + 4.236707536620088e-05, + 1.7641770682530478e-05 + ], + "bp_grad_F": [ + 0.20638784766197205, + 0.10957971960306168, + 0.08719436824321747, + 0.06181200593709946, + 0.026369713246822357 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7900390625, + "loss_eval": 0.8525989055633545, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 1.5115892887115479, + 5.313480377197266, + 7.247244834899902, + 9.550230979919434, + 11.989883422851562 + ], + "hidden_norms_avg": [ + 4.3022141456604, + 8.688987731933594, + 9.685582160949707, + 11.234566688537598, + 12.270132064819336 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001483379164710641, + 7.948598067741841e-05, + 6.1946535424795e-05, + 4.4680935388896614e-05, + 1.6852744010975584e-05 + ], + "bp_grad_F": [ + 0.21088635921478271, + 0.11181779950857162, + 0.08855349570512772, + 0.06269123405218124, + 0.026410162448883057 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7890625, + "loss_eval": 0.8474454879760742, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 1.5110703706741333, + 5.306856632232666, + 7.230412483215332, + 9.542105674743652, + 11.942556381225586 + ], + "hidden_norms_avg": [ + 4.305404186248779, + 8.697504997253418, + 9.679413795471191, + 11.226194381713867, + 12.25047492980957 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014003549586050212, + 7.460260530933738e-05, + 6.204132660059258e-05, + 3.912465035682544e-05, + 1.6441039406345226e-05 + ], + "bp_grad_F": [ + 0.20991134643554688, + 0.11143218725919724, + 0.08832813799381256, + 0.06269684433937073, + 0.026480402797460556 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.8496487140655518, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 1.5111491680145264, + 5.304075717926025, + 7.234795093536377, + 9.53318977355957, + 11.964473724365234 + ], + "hidden_norms_avg": [ + 4.304405689239502, + 8.697833061218262, + 9.683843612670898, + 11.22890853881836, + 12.259684562683105 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014237761206459254, + 7.472094148397446e-05, + 5.683211929863319e-05, + 4.049929339089431e-05, + 1.4964447473175824e-05 + ], + "bp_grad_F": [ + 0.21009324491024017, + 0.11155029386281967, + 0.08846566081047058, + 0.06290413439273834, + 0.026488499715924263 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.8498167395591736, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 1.5111573934555054, + 5.304897785186768, + 7.23397970199585, + 9.53254508972168, + 11.969621658325195 + ], + "hidden_norms_avg": [ + 4.304327964782715, + 8.696623802185059, + 9.681411743164062, + 11.225934982299805, + 12.255182266235352 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001376860454911366, + 7.4876043072436e-05, + 5.8659916248871014e-05, + 4.048796836286783e-05, + 1.5446972611243837e-05 + ], + "bp_grad_F": [ + 0.210032656788826, + 0.11159469932317734, + 0.08847951143980026, + 0.06288634985685349, + 0.02649829164147377 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.791015625, + "loss_eval": 0.8496516942977905, + "epoch": 60 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.3042769432067871, + 3.2273340225219727, + 4.6926493644714355, + 6.003997802734375, + 6.652705669403076 + ], + "hidden_norms_avg": [ + 6.027750492095947, + 7.1044697761535645, + 7.910475730895996, + 8.79189682006836, + 9.458833694458008 + ], + "bp_grad_per_sample_l2_med": [ + 0.005248428788036108, + 0.0012287507997825742, + 0.0010387187357991934, + 0.0009678652859292924, + 0.0009174557635560632 + ], + "bp_grad_F": [ + 0.248850479722023, + 0.0424945093691349, + 0.0348997563123703, + 0.03202275559306145, + 0.030239813029766083 + ], + "gamma_dfa": -0.0027123973850393668, + "gamma_dfa_per_layer": [ + -0.0010305923642590642, + -0.01111956313252449, + 0.0014823779929429293, + -0.00018181203631684184 + ], + "acc_eval": 0.0791015625, + "loss_eval": 2.544933319091797, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.8898234367370605, + 1755.5985107421875, + 3812.865966796875, + 4063.967529296875, + 6749.62646484375 + ], + "hidden_norms_avg": [ + 48.02373504638672, + 2610.970458984375, + 7442.5693359375, + 13001.9443359375, + 19569.59765625 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006367825553752482, + 1.061867237694969e-06, + 9.113553005590802e-07, + 8.042399599617056e-07, + 7.901451226643985e-07 + ], + "bp_grad_F": [ + 0.11358296871185303, + 5.570299981627613e-05, + 4.605366484611295e-05, + 3.752685370272957e-05, + 3.027659113286063e-05 + ], + "gamma_dfa": 0.007312511210329831, + "gamma_dfa_per_layer": [ + 0.01007317565381527, + 0.008024577051401138, + 0.008248038589954376, + 0.0029042535461485386 + ], + "acc_eval": 0.2333984375, + "loss_eval": 2.0879125595092773, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 3.704786777496338, + 7219.806640625, + 19592.4140625, + 21808.44921875, + 46117.11328125 + ], + "hidden_norms_avg": [ + 97.33866882324219, + 9787.240234375, + 35216.66015625, + 64377.67578125, + 97116.8125 + ], + "bp_grad_per_sample_l2_med": [ + 9.637367475079373e-05, + 1.6794896851024532e-07, + 1.5954641696680483e-07, + 1.4061814113119908e-07, + 1.445507677999558e-07 + ], + "bp_grad_F": [ + 0.04642009362578392, + 2.128358573827427e-05, + 2.0123250578762963e-05, + 6.922710781509522e-06, + 6.6381039687257726e-06 + ], + "gamma_dfa": 0.007922766148112714, + "gamma_dfa_per_layer": [ + 0.016379408538341522, + 0.005931380204856396, + 0.007020577322691679, + 0.0023596985265612602 + ], + "acc_eval": 0.205078125, + "loss_eval": 2.1287283897399902, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 5.554904937744141, + 16081.3388671875, + 48028.96875, + 51717.93359375, + 100197.7265625 + ], + "hidden_norms_avg": [ + 147.4190216064453, + 22860.939453125, + 90670.5078125, + 172520.15625, + 247624.09375 + ], + "bp_grad_per_sample_l2_med": [ + 3.051399289688561e-05, + 9.248702070863146e-08, + 7.303499671706959e-08, + 6.487525183729304e-08, + 6.620962977876843e-08 + ], + "bp_grad_F": [ + 0.034720927476882935, + 1.6823112673591822e-05, + 1.1384844583517406e-05, + 3.0318508379423292e-06, + 2.624829903652426e-06 + ], + "gamma_dfa": 0.0067759081866825, + "gamma_dfa_per_layer": [ + 0.014651123434305191, + 0.004187515936791897, + 0.007594288792461157, + 0.0006707045831717551 + ], + "acc_eval": 0.20703125, + "loss_eval": 2.107574462890625, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 7.38655424118042, + 30113.763671875, + 92815.4375, + 102848.4453125, + 183389.40625 + ], + "hidden_norms_avg": [ + 194.20396423339844, + 39156.78515625, + 166144.453125, + 360300.25, + 500574.96875 + ], + "bp_grad_per_sample_l2_med": [ + 2.7757007046602666e-05, + 6.177719313882335e-08, + 4.3474216226968565e-08, + 3.8972562066419414e-08, + 3.9463689205376795e-08 + ], + "bp_grad_F": [ + 0.03289186581969261, + 5.563175363931805e-06, + 2.151713033526903e-06, + 1.463158696424216e-06, + 1.3795681752526434e-06 + ], + "gamma_dfa": 0.006396490931365406, + "gamma_dfa_per_layer": [ + 0.015158161520957947, + 0.0035972977057099342, + 0.006714952643960714, + 0.00011555185483302921 + ], + "acc_eval": 0.203125, + "loss_eval": 2.1379737854003906, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 9.15835189819336, + 53591.8984375, + 170615.734375, + 181427.171875, + 289063.5625 + ], + "hidden_norms_avg": [ + 238.28347778320312, + 61062.31640625, + 250187.6875, + 548101.3125, + 724058.1875 + ], + "bp_grad_per_sample_l2_med": [ + 2.960537312901579e-05, + 4.670241438020639e-08, + 3.080446120407032e-08, + 2.670985388419922e-08, + 2.6331489877406966e-08 + ], + "bp_grad_F": [ + 0.016260992735624313, + 4.766869551531272e-06, + 2.067620698653627e-06, + 9.787106591829797e-07, + 8.912123234949831e-07 + ], + "gamma_dfa": 0.0068261599517427385, + "gamma_dfa_per_layer": [ + 0.014116348698735237, + 0.003242844482883811, + 0.008411802351474762, + 0.0015336442738771439 + ], + "acc_eval": 0.1962890625, + "loss_eval": 2.1309733390808105, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 10.888343811035156, + 91755.1171875, + 249917.8125, + 274005.3125, + 444277.53125 + ], + "hidden_norms_avg": [ + 276.9202880859375, + 104021.7109375, + 349872.5, + 931915.875, + 1222273.75 + ], + "bp_grad_per_sample_l2_med": [ + 2.7342781322658993e-05, + 3.6854661544794e-08, + 2.4993127567540796e-08, + 1.8662358769461207e-08, + 1.7811659702715588e-08 + ], + "bp_grad_F": [ + 0.022468894720077515, + 3.493201802484691e-06, + 1.1520894531713566e-06, + 7.113425795068906e-07, + 6.108040793151304e-07 + ], + "gamma_dfa": 0.007193240569904447, + "gamma_dfa_per_layer": [ + 0.017048656940460205, + 0.002665129955857992, + 0.007390158250927925, + 0.001669017132371664 + ], + "acc_eval": 0.2109375, + "loss_eval": 2.1020355224609375, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 12.623483657836914, + 158915.890625, + 360070.6875, + 406906.3125, + 630641.3125 + ], + "hidden_norms_avg": [ + 315.0859680175781, + 172244.328125, + 490065.59375, + 1510240.375, + 1952914.5 + ], + "bp_grad_per_sample_l2_med": [ + 3.403881783015095e-05, + 2.7625405962794503e-08, + 1.651102543576144e-08, + 1.1742161909467086e-08, + 1.0927361238088906e-08 + ], + "bp_grad_F": [ + 0.024832597002387047, + 1.8080392010233481e-06, + 7.246239306368807e-07, + 4.936595132676302e-07, + 4.0145107504940825e-07 + ], + "gamma_dfa": 0.006596001767320558, + "gamma_dfa_per_layer": [ + 0.016851693391799927, + 0.001910479972139001, + 0.0058369822800159454, + 0.0017848514253273606 + ], + "acc_eval": 0.2138671875, + "loss_eval": 2.1312928199768066, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 14.368335723876953, + 243332.8125, + 525771.0, + 593291.75, + 875288.5 + ], + "hidden_norms_avg": [ + 351.16015625, + 247222.375, + 640658.75, + 1855662.75, + 2391194.25 + ], + "bp_grad_per_sample_l2_med": [ + 2.87416060018586e-05, + 1.8018790015617014e-08, + 1.2651691250198382e-08, + 9.33115984480537e-09, + 8.563736386690834e-09 + ], + "bp_grad_F": [ + 0.017871394753456116, + 9.426115070709784e-07, + 4.7217255882969766e-07, + 3.564711050785263e-07, + 3.2240865266430774e-07 + ], + "gamma_dfa": 0.006289168493822217, + "gamma_dfa_per_layer": [ + 0.013373943977057934, + 0.0037157258484512568, + 0.00672483816742897, + 0.001342165982350707 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.0829837322235107, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 16.041412353515625, + 385486.09375, + 776263.875, + 869037.0, + 1191002.25 + ], + "hidden_norms_avg": [ + 383.5213317871094, + 383708.40625, + 941498.0, + 2793651.25, + 3510556.5 + ], + "bp_grad_per_sample_l2_med": [ + 2.8917142117279582e-05, + 1.1363525231899985e-08, + 8.616331648170217e-09, + 5.602694308493028e-09, + 5.260086588521062e-09 + ], + "bp_grad_F": [ + 0.024791762232780457, + 6.833873840150773e-07, + 3.100701633229619e-07, + 2.26619619070334e-07, + 2.1342954426017968e-07 + ], + "gamma_dfa": 0.00652129843365401, + "gamma_dfa_per_layer": [ + 0.014406262896955013, + 0.004345592111349106, + 0.006529162637889385, + 0.0008041760884225368 + ], + "acc_eval": 0.2197265625, + "loss_eval": 2.1437277793884277, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 17.677919387817383, + 582942.5, + 1148260.75, + 1279834.25, + 1709270.625 + ], + "hidden_norms_avg": [ + 416.1814880371094, + 530246.375, + 1201761.5, + 2944394.0, + 3732565.75 + ], + "bp_grad_per_sample_l2_med": [ + 3.369058686075732e-05, + 6.623859238885643e-09, + 4.513381224313662e-09, + 3.933114278709127e-09, + 3.794405678547719e-09 + ], + "bp_grad_F": [ + 0.01620429754257202, + 3.022730652446626e-07, + 1.9097409165169665e-07, + 1.773983058228623e-07, + 1.593236333974346e-07 + ], + "gamma_dfa": 0.006082151841837913, + "gamma_dfa_per_layer": [ + 0.01578153669834137, + 0.002655572956427932, + 0.005509376525878906, + 0.00038212118670344353 + ], + "acc_eval": 0.197265625, + "loss_eval": 2.089698314666748, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 19.31073760986328, + 843820.0625, + 1587423.25, + 1759006.0, + 2222149.5 + ], + "hidden_norms_avg": [ + 448.93133544921875, + 796172.1875, + 1678321.375, + 3888912.0, + 4810418.0 + ], + "bp_grad_per_sample_l2_med": [ + 4.445635568117723e-05, + 3.5140981236025937e-09, + 2.8926525619255017e-09, + 2.65975419466713e-09, + 2.6499111793754082e-09 + ], + "bp_grad_F": [ + 0.020245229825377464, + 2.6993967594535206e-07, + 1.701987457636278e-07, + 1.3198047099649557e-07, + 1.2469256205349666e-07 + ], + "gamma_dfa": 0.005559869911849091, + "gamma_dfa_per_layer": [ + 0.015185668133199215, + 0.0025689376052469015, + 0.004468783736228943, + 1.6090172721305862e-05 + ], + "acc_eval": 0.2314453125, + "loss_eval": 2.0838193893432617, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 20.861183166503906, + 1157778.75, + 2054207.5, + 2289084.5, + 2841995.0 + ], + "hidden_norms_avg": [ + 479.8387145996094, + 981138.875, + 2112497.25, + 4439588.0, + 5517614.5 + ], + "bp_grad_per_sample_l2_med": [ + 3.176981772412546e-05, + 3.1782512177613853e-09, + 2.5456772245746606e-09, + 2.4393245201537184e-09, + 2.414718425214346e-09 + ], + "bp_grad_F": [ + 0.09368129819631577, + 9.166008680949744e-07, + 2.675243706562469e-07, + 1.0984689424731187e-07, + 1.0444787079677553e-07 + ], + "gamma_dfa": 0.004390636342577636, + "gamma_dfa_per_layer": [ + 0.011994147673249245, + 0.001997251994907856, + 0.003865728620439768, + -0.00029458291828632355 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0896079540252686, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 22.362810134887695, + 1504072.375, + 2527410.75, + 2870361.25, + 3557771.0 + ], + "hidden_norms_avg": [ + 510.81561279296875, + 1188843.375, + 2574796.25, + 5296089.0, + 6640932.5 + ], + "bp_grad_per_sample_l2_med": [ + 2.8154454412288032e-05, + 3.057065711686846e-09, + 2.121731013104977e-09, + 2.0999049166192663e-09, + 2.0892536589656174e-09 + ], + "bp_grad_F": [ + 0.011068353429436684, + 1.3467251847032458e-06, + 1.0581060649883511e-07, + 9.427417069218791e-08, + 9.197237460512042e-08 + ], + "gamma_dfa": 0.003989392673247494, + "gamma_dfa_per_layer": [ + 0.011822337284684181, + 0.001384879695251584, + 0.00329465395770967, + -0.0005443002446554601 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.077056407928467, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 23.812599182128906, + 1930070.0, + 2995981.75, + 3469627.0, + 4303896.0 + ], + "hidden_norms_avg": [ + 539.9255981445312, + 1589889.5, + 3066154.25, + 6015238.0, + 7540605.5 + ], + "bp_grad_per_sample_l2_med": [ + 3.170168929500505e-05, + 2.518652619798445e-09, + 1.924201020742089e-09, + 1.8520206479522017e-09, + 1.8417810609960839e-09 + ], + "bp_grad_F": [ + 0.032089244574308395, + 1.0142422297576559e-06, + 1.6566445992793888e-07, + 8.33219857554468e-08, + 7.640721122470495e-08 + ], + "gamma_dfa": 0.0029267592035466805, + "gamma_dfa_per_layer": [ + 0.008105762302875519, + 0.001629034522920847, + 0.0022919299080967903, + -0.000319689919706434 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0748229026794434, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 25.248563766479492, + 2452306.5, + 3664022.75, + 4168536.0, + 5106242.5 + ], + "hidden_norms_avg": [ + 570.19384765625, + 1965615.5, + 3710471.5, + 7372995.0, + 9239893.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.4190969270421192e-05, + 1.8390389211475622e-09, + 1.5613663695290825e-09, + 1.5359991056840272e-09, + 1.5388512686342892e-09 + ], + "bp_grad_F": [ + 0.015056902542710304, + 6.693913292110665e-06, + 1.241161982079575e-07, + 7.622224984515924e-08, + 6.743793790064956e-08 + ], + "gamma_dfa": 0.0022661721595795825, + "gamma_dfa_per_layer": [ + 0.006208081729710102, + 0.001149914925917983, + 0.0020575951784849167, + -0.0003509031957946718 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.0835204124450684, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 26.6426944732666, + 3107169.0, + 4381372.0, + 5027998.5, + 6065136.0 + ], + "hidden_norms_avg": [ + 596.7793579101562, + 2542559.0, + 4400625.5, + 8374831.5, + 10510773.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.787545781757217e-05, + 1.5701163702530607e-09, + 1.2841328000945396e-09, + 1.2669904014828148e-09, + 1.2700215323846464e-09 + ], + "bp_grad_F": [ + 0.006971500348299742, + 1.8619180991663598e-05, + 6.465826629664662e-08, + 5.84209978171657e-08, + 5.694714744208795e-08 + ], + "gamma_dfa": 0.0030232197314035147, + "gamma_dfa_per_layer": [ + 0.009539565071463585, + 0.0012945058988407254, + 0.0015697493217885494, + -0.0003109413664788008 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.058485507965088, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 27.95879364013672, + 3613966.25, + 5044349.0, + 5874924.0, + 7080756.0 + ], + "hidden_norms_avg": [ + 623.2052612304688, + 2844551.5, + 4942977.0, + 8742455.0, + 11094594.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8442762413760647e-05, + 1.629689605486817e-09, + 1.115437520127216e-09, + 1.0797144289753646e-09, + 1.0779978021346892e-09 + ], + "bp_grad_F": [ + 0.0072508929297327995, + 1.4132167507341364e-06, + 6.271753250075562e-08, + 4.991998281411725e-08, + 4.950436149897541e-08 + ], + "gamma_dfa": 0.001284227124415338, + "gamma_dfa_per_layer": [ + 0.00256139412522316, + 0.0014944188296794891, + 0.0013982560485601425, + -0.0003171605058014393 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0549392700195312, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 29.22184181213379, + 4211867.5, + 5636704.5, + 6891397.5, + 8559809.0 + ], + "hidden_norms_avg": [ + 647.4288330078125, + 3423908.25, + 5695376.5, + 10367815.0, + 13188250.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8086895326850936e-05, + 1.1501447572115353e-09, + 8.738501033889179e-10, + 8.528160400089746e-10, + 8.584906674435899e-10 + ], + "bp_grad_F": [ + 0.012267161160707474, + 1.591232035025314e-06, + 4.697067268466526e-08, + 4.271150899626264e-08, + 4.017679700041299e-08 + ], + "gamma_dfa": 0.0022953646985115483, + "gamma_dfa_per_layer": [ + 0.007007642649114132, + 0.0012370320037007332, + 0.0011846421984955668, + -0.0002478580572642386 + ], + "acc_eval": 0.228515625, + "loss_eval": 2.053128242492676, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 30.412078857421875, + 4986411.0, + 6504586.0, + 7889628.0, + 9783147.0 + ], + "hidden_norms_avg": [ + 670.3391723632812, + 3921667.0, + 6270645.0, + 10589857.0, + 13580617.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.768085505522322e-05, + 1.3132780418700918e-09, + 7.742924079678914e-10, + 7.418777814294231e-10, + 7.448673344789825e-10 + ], + "bp_grad_F": [ + 0.007575999945402145, + 1.7771724287740653e-06, + 5.529824420591467e-08, + 3.790939828718365e-08, + 3.6307092443621514e-08 + ], + "gamma_dfa": 0.0009071348831639625, + "gamma_dfa_per_layer": [ + 0.001273356145247817, + 0.001484773471020162, + 0.0010661636479198933, + -0.00019575373153202236 + ], + "acc_eval": 0.25390625, + "loss_eval": 2.0479414463043213, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 31.54771614074707, + 5502896.5, + 7070197.5, + 8994800.0, + 11604998.0 + ], + "hidden_norms_avg": [ + 692.4578247070312, + 4249610.0, + 6837255.0, + 11617683.0, + 15223152.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0367684303200804e-05, + 1.325711207478264e-09, + 6.525959217462685e-10, + 6.324714640904006e-10, + 6.32227936669949e-10 + ], + "bp_grad_F": [ + 0.0062190573662519455, + 1.129235442931531e-06, + 3.317861896334762e-08, + 3.131979653403505e-08, + 3.109861168582029e-08 + ], + "gamma_dfa": 0.0011510169642861001, + "gamma_dfa_per_layer": [ + 0.002568549243733287, + 0.0013005147920921445, + 0.0009535959688946605, + -0.00021859214757569134 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0359444618225098, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 32.638641357421875, + 6320697.0, + 7897073.5, + 10165307.0, + 13313912.0 + ], + "hidden_norms_avg": [ + 713.3525390625, + 4812640.5, + 7533297.5, + 12847435.0, + 16993420.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.871564695145935e-05, + 1.2221273992807369e-09, + 6.080098646776833e-10, + 5.917044632042234e-10, + 5.89539916884263e-10 + ], + "bp_grad_F": [ + 0.011915000155568123, + 6.25122083874885e-06, + 3.6603957198622084e-08, + 2.876341298474472e-08, + 2.8581927935533713e-08 + ], + "gamma_dfa": 0.0002986440376844257, + "gamma_dfa_per_layer": [ + -0.0004627959569916129, + 0.0009951044339686632, + 0.0008257199660874903, + -0.00016345229232683778 + ], + "acc_eval": 0.2626953125, + "loss_eval": 2.059875965118408, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 33.6330451965332, + 7264995.5, + 8758988.0, + 11785280.0, + 15874132.0 + ], + "hidden_norms_avg": [ + 732.8869018554688, + 5982206.0, + 8454064.0, + 14846262.0, + 19834080.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.5420635211048648e-05, + 7.56205986718328e-10, + 5.169706884800007e-10, + 5.026724592127607e-10, + 5.024383686880185e-10 + ], + "bp_grad_F": [ + 0.014803220517933369, + 4.478873961488716e-06, + 4.4555019229619575e-08, + 2.4910459472948787e-08, + 2.4745437698925343e-08 + ], + "gamma_dfa": 0.001046390665578656, + "gamma_dfa_per_layer": [ + 0.0027164756320416927, + 0.0009058329742401838, + 0.0007253356743603945, + -0.00016208161832764745 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0538365840911865, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 34.621524810791016, + 8089090.5, + 9671455.0, + 13086530.0, + 17616980.0 + ], + "hidden_norms_avg": [ + 751.2442016601562, + 6699752.5, + 9159771.0, + 15622865.0, + 21214146.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.7939373467233963e-05, + 7.656756340068682e-10, + 5.061054908495066e-10, + 4.837483191799663e-10, + 4.820439047925618e-10 + ], + "bp_grad_F": [ + 0.008210284635424614, + 3.91981393477181e-06, + 2.727725245676993e-08, + 2.349457695061119e-08, + 2.2768137597495297e-08 + ], + "gamma_dfa": 0.0013028495595790446, + "gamma_dfa_per_layer": [ + 0.0034610098227858543, + 0.0012297509238123894, + 0.0006837932160124183, + -0.00016315572429448366 + ], + "acc_eval": 0.2646484375, + "loss_eval": 2.0430214405059814, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 35.54478454589844, + 9145767.0, + 10558942.0, + 14636200.0, + 19721632.0 + ], + "hidden_norms_avg": [ + 768.5211791992188, + 7473006.0, + 10093548.0, + 17775052.0, + 24159262.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.364618532941677e-05, + 8.066202705769854e-10, + 4.5619852340195166e-10, + 4.4121445386124947e-10, + 4.323804370098827e-10 + ], + "bp_grad_F": [ + 0.09167197346687317, + 4.855019597016508e-06, + 2.689265521382822e-08, + 2.1627007740221416e-08, + 2.0867716443717654e-08 + ], + "gamma_dfa": 0.0001647558601689525, + "gamma_dfa_per_layer": [ + -0.0005364040262065828, + 0.0007433416321873665, + 0.0005910456529818475, + -0.00013895981828682125 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.0427517890930176, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 36.43881607055664, + 10216266.0, + 11478190.0, + 16476424.0, + 22393992.0 + ], + "hidden_norms_avg": [ + 785.1990966796875, + 8300483.0, + 10872433.0, + 18667924.0, + 25447926.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0938736017560586e-05, + 7.561202219896757e-10, + 4.2832748459176173e-10, + 4.0923736621678586e-10, + 4.0218126051705383e-10 + ], + "bp_grad_F": [ + 0.013463743962347507, + 1.9222785340389237e-05, + 2.2825457079989064e-08, + 1.9977358434175585e-08, + 1.9259800865256693e-08 + ], + "gamma_dfa": 0.0005702937960450072, + "gamma_dfa_per_layer": [ + 0.0011116554960608482, + 0.0007594762137159705, + 0.0005430461023934186, + -0.00013300262799020857 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0594615936279297, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 37.30263137817383, + 11623684.0, + 12776919.0, + 18306868.0, + 24740858.0 + ], + "hidden_norms_avg": [ + 800.9972534179688, + 9603253.0, + 12104963.0, + 20835068.0, + 28405318.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.261065648985095e-05, + 6.65525801135658e-10, + 3.838940831890625e-10, + 3.742672838313865e-10, + 3.7395189722566613e-10 + ], + "bp_grad_F": [ + 0.007853930816054344, + 1.2899076864414383e-06, + 1.9278010299217385e-08, + 1.8154999281705386e-08, + 1.7368931182204506e-08 + ], + "gamma_dfa": 0.00021361159815569408, + "gamma_dfa_per_layer": [ + -0.00034064118517562747, + 0.0008438127697445452, + 0.0004718025156762451, + -0.00012052770762238652 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0433781147003174, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 38.06776428222656, + 12599130.0, + 13703165.0, + 19834172.0, + 26867468.0 + ], + "hidden_norms_avg": [ + 816.2463989257812, + 10421772.0, + 12873138.0, + 21321398.0, + 29452538.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.774638414848596e-05, + 6.227232618449818e-10, + 3.566741624272396e-10, + 3.4781866276034634e-10, + 3.45437983773067e-10 + ], + "bp_grad_F": [ + 0.013920681551098824, + 3.4208371744171018e-06, + 2.1883508338760294e-08, + 1.7128741092165e-08, + 1.6603545205384762e-08 + ], + "gamma_dfa": 0.0008690126524015795, + "gamma_dfa_per_layer": [ + 0.0021882583387196064, + 0.0009064457844942808, + 0.0004841286572627723, + -0.00010278217087034136 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.0433974266052246, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 38.7847785949707, + 14429584.0, + 15438086.0, + 21566880.0, + 29267340.0 + ], + "hidden_norms_avg": [ + 830.9344482421875, + 11436777.0, + 13832175.0, + 22913616.0, + 32026754.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8682481570285745e-05, + 5.758302168423768e-10, + 3.3607527871737375e-10, + 3.304233830991876e-10, + 3.2846284026000205e-10 + ], + "bp_grad_F": [ + 0.012251574546098709, + 2.996052717207931e-05, + 2.7452134787608884e-08, + 1.577506480998636e-08, + 1.5141546683139495e-08 + ], + "gamma_dfa": 0.0004505918041104451, + "gamma_dfa_per_layer": [ + 0.00026967719895765185, + 0.001212525530718267, + 0.0004131481982767582, + -9.298371151089668e-05 + ], + "acc_eval": 0.2607421875, + "loss_eval": 2.039923667907715, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 39.49647521972656, + 15523604.0, + 16504434.0, + 23236370.0, + 31306890.0 + ], + "hidden_norms_avg": [ + 844.8562622070312, + 12856661.0, + 15124535.0, + 23633704.0, + 32995118.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.6219468054478057e-05, + 5.519696366640403e-10, + 3.2825916984613457e-10, + 3.235848811122821e-10, + 3.2190172749579915e-10 + ], + "bp_grad_F": [ + 0.012884745374321938, + 1.8329246813664213e-05, + 1.8323355277516384e-08, + 1.5584015855552025e-08, + 1.4755748622974352e-08 + ], + "gamma_dfa": 0.0006857650478195865, + "gamma_dfa_per_layer": [ + 0.0016966589028015733, + 0.0007126724813133478, + 0.0003994358121417463, + -6.570700497832149e-05 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.0533735752105713, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 40.16881561279297, + 16141660.0, + 17137856.0, + 24286464.0, + 32903152.0 + ], + "hidden_norms_avg": [ + 857.8116455078125, + 12895693.0, + 15492559.0, + 23745768.0, + 33843860.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.2289473892888054e-05, + 6.340856728570543e-10, + 3.264067627295475e-10, + 3.149370209065694e-10, + 3.097411216401724e-10 + ], + "bp_grad_F": [ + 0.006337009835988283, + 1.7065680367522873e-05, + 5.785592804841144e-08, + 1.519365788738014e-08, + 1.464850551968766e-08 + ], + "gamma_dfa": 0.0005419648223323748, + "gamma_dfa_per_layer": [ + 0.00038546844734810293, + 0.0014093497302383184, + 0.0004054713645018637, + -3.243025275878608e-05 + ], + "acc_eval": 0.265625, + "loss_eval": 2.0390102863311768, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 40.790164947509766, + 18768648.0, + 19610716.0, + 26926266.0, + 36060360.0 + ], + "hidden_norms_avg": [ + 869.6182861328125, + 15248417.0, + 17480158.0, + 26928640.0, + 37555876.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.939497062470764e-05, + 5.127394064885493e-10, + 3.1137872835707014e-10, + 3.074558663218596e-10, + 3.04990144250894e-10 + ], + "bp_grad_F": [ + 0.03832927718758583, + 8.881174835551064e-06, + 2.5206949416656244e-08, + 1.4185034480362901e-08, + 1.3504863893842867e-08 + ], + "gamma_dfa": 0.0005767397606177838, + "gamma_dfa_per_layer": [ + 0.00058704090770334, + 0.0013887862442061305, + 0.0003486467176117003, + -1.751482705003582e-05 + ], + "acc_eval": 0.232421875, + "loss_eval": 2.055915117263794, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 41.36415481567383, + 20590018.0, + 21418164.0, + 28674892.0, + 38102536.0 + ], + "hidden_norms_avg": [ + 880.8012084960938, + 15857472.0, + 18200580.0, + 27607590.0, + 38905496.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.6930878448183648e-05, + 5.041319584009329e-10, + 3.0716035270828e-10, + 2.9963459491355593e-10, + 2.9755845010193127e-10 + ], + "bp_grad_F": [ + 0.01052916795015335, + 1.7662874597590417e-05, + 1.8223250464188823e-08, + 1.4229329714510186e-08, + 1.2928855319671584e-08 + ], + "gamma_dfa": 0.0005623552362976625, + "gamma_dfa_per_layer": [ + 0.0005056762602180243, + 0.00140343327075243, + 0.0003372218052390963, + 3.0896089810994454e-06 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.054579734802246, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 41.9267578125, + 21995458.0, + 22701258.0, + 30227660.0, + 40381468.0 + ], + "hidden_norms_avg": [ + 891.6727294921875, + 17925388.0, + 19924592.0, + 29375846.0, + 41265952.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.4433691325830296e-05, + 4.786913088139499e-10, + 3.083476807219654e-10, + 3.030005690796145e-10, + 3.0202479406327143e-10 + ], + "bp_grad_F": [ + 0.006410651374608278, + 9.426087672181893e-06, + 1.748733602369157e-08, + 1.330249954634155e-08, + 1.2548162509062877e-08 + ], + "gamma_dfa": 0.0005204869294175296, + "gamma_dfa_per_layer": [ + 0.0004088875139132142, + 0.001322226831689477, + 0.00032363145146518946, + 2.7201920602237806e-05 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0504493713378906, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 42.43289566040039, + 23788478.0, + 24547006.0, + 32122702.0, + 42524392.0 + ], + "hidden_norms_avg": [ + 902.5420532226562, + 19126440.0, + 21210522.0, + 30872922.0, + 43207040.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8793765523005277e-05, + 4.69506655775831e-10, + 2.9882180063722785e-10, + 2.9027436010409247e-10, + 2.88086998700976e-10 + ], + "bp_grad_F": [ + 0.02046363614499569, + 1.535968840471469e-05, + 1.9181511490273806e-08, + 1.3211375105015577e-08, + 1.2052867148781843e-08 + ], + "gamma_dfa": 0.0005800028211524477, + "gamma_dfa_per_layer": [ + 0.0005789051647298038, + 0.001365642063319683, + 0.0003222030645702034, + 5.326099199010059e-05 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.056929349899292, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 42.88957595825195, + 24876160.0, + 25665632.0, + 33698024.0, + 44433192.0 + ], + "hidden_norms_avg": [ + 912.5694580078125, + 20388924.0, + 22492538.0, + 32293406.0, + 44758584.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.043079595954623e-05, + 4.6556239419182077e-10, + 3.0177585430557485e-10, + 2.9259758504984745e-10, + 2.8850585809259144e-10 + ], + "bp_grad_F": [ + 0.018651673570275307, + 8.0938043538481e-06, + 2.600621051840335e-08, + 1.3419185762586494e-08, + 1.200509913701353e-08 + ], + "gamma_dfa": 0.0008372370848519495, + "gamma_dfa_per_layer": [ + 0.001413366524502635, + 0.0015261531807482243, + 0.0003260627272538841, + 8.336590690305457e-05 + ], + "acc_eval": 0.2353515625, + "loss_eval": 2.060340404510498, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 43.32978057861328, + 25917158.0, + 26720118.0, + 34948196.0, + 46313048.0 + ], + "hidden_norms_avg": [ + 921.58642578125, + 21474648.0, + 23549474.0, + 33572188.0, + 46615396.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.262757672928274e-05, + 4.5062673037499223e-10, + 2.984587021970242e-10, + 2.923088993078693e-10, + 2.888300987269332e-10 + ], + "bp_grad_F": [ + 0.01846941001713276, + 2.4291131921927445e-05, + 2.994345393858566e-08, + 1.4564162320596097e-08, + 1.1765412644137996e-08 + ], + "gamma_dfa": 0.0007057133989292197, + "gamma_dfa_per_layer": [ + 0.0011925556464120746, + 0.0012432597577571869, + 0.0002897845406550914, + 9.725365089252591e-05 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.0591180324554443, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 43.74128341674805, + 27200966.0, + 27911578.0, + 36161972.0, + 47854788.0 + ], + "hidden_norms_avg": [ + 930.2008666992188, + 22529414.0, + 24601434.0, + 34829948.0, + 48238220.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.328157981741242e-05, + 4.659617691693541e-10, + 2.8960928100119077e-10, + 2.8687860420539835e-10, + 2.800103759970085e-10 + ], + "bp_grad_F": [ + 0.004556785803288221, + 9.644008059694897e-06, + 1.5685751364458156e-08, + 1.2929571191477862e-08, + 1.1707988356590704e-08 + ], + "gamma_dfa": 0.0005315981106832623, + "gamma_dfa_per_layer": [ + 0.0004304055473767221, + 0.0012520912569016218, + 0.0003118191962130368, + 0.0001320764422416687 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.049736738204956, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 44.10750198364258, + 28860724.0, + 29566448.0, + 37605440.0, + 49767188.0 + ], + "hidden_norms_avg": [ + 938.7098999023438, + 24297102.0, + 26192510.0, + 36561148.0, + 49957968.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.900460640375968e-05, + 4.445998014190877e-10, + 2.888302930159625e-10, + 2.855987946137617e-10, + 2.818917876901139e-10 + ], + "bp_grad_F": [ + 0.013354518450796604, + 6.135221156000625e-06, + 1.780158420672251e-08, + 1.3947193622243503e-08, + 1.161484952660885e-08 + ], + "gamma_dfa": 0.0005519518890650943, + "gamma_dfa_per_layer": [ + 0.0005505518638528883, + 0.001156628131866455, + 0.00033354441984556615, + 0.0001670831406954676 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.0527162551879883, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 44.42500305175781, + 30085758.0, + 30793664.0, + 39317268.0, + 51773680.0 + ], + "hidden_norms_avg": [ + 946.3699340820312, + 24723960.0, + 26763662.0, + 37607688.0, + 51575988.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9910466764704324e-05, + 4.753269444712771e-10, + 2.936461906966059e-10, + 2.873846438600225e-10, + 2.8520716344182517e-10 + ], + "bp_grad_F": [ + 0.00976789090782404, + 1.76885150722228e-05, + 1.7970489096796882e-08, + 1.3952313970833075e-08, + 1.130456972475713e-08 + ], + "gamma_dfa": 0.0009108289959840477, + "gamma_dfa_per_layer": [ + 0.0019160081865265965, + 0.0012680008076131344, + 0.00030145354685373604, + 0.00015785344294272363 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.0550765991210938, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 44.73127746582031, + 30730856.0, + 31431762.0, + 40187116.0, + 53148352.0 + ], + "hidden_norms_avg": [ + 953.6856079101562, + 24778752.0, + 27014248.0, + 38275640.0, + 52795456.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8919872420374304e-05, + 4.755910110176842e-10, + 2.84101492331601e-10, + 2.7933383384137755e-10, + 2.7627339305169585e-10 + ], + "bp_grad_F": [ + 0.009574169293045998, + 4.757252463605255e-05, + 1.5709005651842745e-08, + 1.3778580054690792e-08, + 1.1154800638735196e-08 + ], + "gamma_dfa": 0.0003838329284917563, + "gamma_dfa_per_layer": [ + -0.0004134870832785964, + 0.001480170525610447, + 0.0002943193248938769, + 0.00017432894674129784 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0383803844451904, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 44.999107360839844, + 32617970.0, + 33381886.0, + 41663220.0, + 54853168.0 + ], + "hidden_norms_avg": [ + 960.5386962890625, + 27910628.0, + 29647900.0, + 40418716.0, + 54716684.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9992028430569917e-05, + 4.221052118946744e-10, + 2.9753777219809763e-10, + 2.8370578109004896e-10, + 2.813366484222257e-10 + ], + "bp_grad_F": [ + 0.015446176752448082, + 3.8060017686802894e-05, + 5.211516906911129e-08, + 1.3235438522940512e-08, + 1.116207481999254e-08 + ], + "gamma_dfa": 0.0005705733274226077, + "gamma_dfa_per_layer": [ + 0.0006168894469738007, + 0.0011725829681381583, + 0.00029753358103334904, + 0.00019528731354512274 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0557656288146973, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 45.25053024291992, + 33936992.0, + 34621240.0, + 42946580.0, + 56031144.0 + ], + "hidden_norms_avg": [ + 966.2922973632812, + 28239400.0, + 30055502.0, + 41338012.0, + 56048388.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0256345780799165e-05, + 4.424338395647709e-10, + 2.9891861208497517e-10, + 2.8403482343897224e-10, + 2.798661857816853e-10 + ], + "bp_grad_F": [ + 0.006179355084896088, + 8.527667887392454e-06, + 2.116273023489157e-08, + 1.2261468285146293e-08, + 1.1058569171495947e-08 + ], + "gamma_dfa": 0.0009438929373573046, + "gamma_dfa_per_layer": [ + 0.00216879416257143, + 0.0010916339233517647, + 0.0003159396001137793, + 0.00019920406339224428 + ], + "acc_eval": 0.2470703125, + "loss_eval": 2.0517942905426025, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 45.481727600097656, + 34746476.0, + 35397348.0, + 43639664.0, + 57119836.0 + ], + "hidden_norms_avg": [ + 971.5364379882812, + 28891962.0, + 30705540.0, + 42078288.0, + 57065612.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9764614737359807e-05, + 4.5060349895820195e-10, + 3.0148228358228835e-10, + 2.912529661891483e-10, + 2.8715479993834947e-10 + ], + "bp_grad_F": [ + 0.02291245572268963, + 1.3926567589805927e-05, + 3.118159241921603e-08, + 2.1897225366274142e-08, + 1.1063916893760961e-08 + ], + "gamma_dfa": 0.00046937728620832786, + "gamma_dfa_per_layer": [ + -0.00010078266495838761, + 0.0014219002332538366, + 0.0003067174111492932, + 0.00024967416538856924 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.054462432861328, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 45.68215560913086, + 35169816.0, + 35827116.0, + 44266788.0, + 58219984.0 + ], + "hidden_norms_avg": [ + 976.61279296875, + 29302304.0, + 31207594.0, + 42541932.0, + 57918596.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.18697166221682e-05, + 4.4465031656670817e-10, + 3.0559865749069104e-10, + 2.891223926937414e-10, + 2.8127278284273416e-10 + ], + "bp_grad_F": [ + 0.02285478264093399, + 5.0576767534948885e-05, + 2.966898726697309e-08, + 1.374073210769211e-08, + 1.1011787037773502e-08 + ], + "gamma_dfa": 0.0006015256294631399, + "gamma_dfa_per_layer": [ + 0.0005435256171040237, + 0.0013653798960149288, + 0.000284912355709821, + 0.0002122846490237862 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0539493560791016, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 45.86240005493164, + 36071220.0, + 36702996.0, + 45105948.0, + 59117940.0 + ], + "hidden_norms_avg": [ + 980.9766845703125, + 29250424.0, + 31315982.0, + 42895240.0, + 58632240.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0838917155051604e-05, + 4.517226037670241e-10, + 3.037594897836726e-10, + 2.95300450758873e-10, + 2.8246391337027887e-10 + ], + "bp_grad_F": [ + 0.009441024623811245, + 2.5670700779301114e-05, + 2.221704953342396e-08, + 1.750507294673298e-08, + 1.1021731971538884e-08 + ], + "gamma_dfa": 0.00038505904376506805, + "gamma_dfa_per_layer": [ + -0.0006303560803644359, + 0.0016098625492304564, + 0.00032150247716344893, + 0.00023922722903080285 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0488905906677246, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 46.00979995727539, + 36876176.0, + 37547776.0, + 45586304.0, + 59641656.0 + ], + "hidden_norms_avg": [ + 984.9158935546875, + 29720264.0, + 31840778.0, + 43341952.0, + 59202960.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8270042093936354e-05, + 4.981586254615422e-10, + 3.011032534416813e-10, + 2.830454204350019e-10, + 2.763113071679868e-10 + ], + "bp_grad_F": [ + 0.01947774738073349, + 4.3539188482100144e-05, + 2.1426325602647012e-08, + 1.4225844502391283e-08, + 1.0958768115187922e-08 + ], + "gamma_dfa": 0.0003295415808679536, + "gamma_dfa_per_layer": [ + -0.0008024196140468121, + 0.0015490652294829488, + 0.0003235205076634884, + 0.0002480002003721893 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0367085933685303, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 46.14581298828125, + 37542628.0, + 38211032.0, + 46396536.0, + 60543468.0 + ], + "hidden_norms_avg": [ + 988.5308837890625, + 31589698.0, + 33421126.0, + 44806960.0, + 60355708.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.7766556740971282e-05, + 4.28473617697378e-10, + 3.07322972625812e-10, + 2.9381372335102185e-10, + 2.797302944834712e-10 + ], + "bp_grad_F": [ + 0.06864868849515915, + 3.788271715166047e-05, + 2.1370066605186366e-08, + 1.4025233419090455e-08, + 1.1044066994259083e-08 + ], + "gamma_dfa": 9.462468733545393e-05, + "gamma_dfa_per_layer": [ + -0.0015880623832345009, + 0.0014036648208275437, + 0.0003099621389992535, + 0.00025293417274951935 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0631895065307617, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 46.26278305053711, + 38372568.0, + 39046204.0, + 47148944.0, + 61308416.0 + ], + "hidden_norms_avg": [ + 991.4658813476562, + 31279712.0, + 33238512.0, + 44902484.0, + 60826544.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.812536695273593e-05, + 4.3919237691092405e-10, + 3.053821084897379e-10, + 2.9203767182295337e-10, + 2.833127066281804e-10 + ], + "bp_grad_F": [ + 0.011117708869278431, + 2.0018645955133252e-05, + 1.9244726701117543e-08, + 1.4165241424279884e-08, + 1.090406964721069e-08 + ], + "gamma_dfa": 0.00016991631855489686, + "gamma_dfa_per_layer": [ + -0.0015358870150521398, + 0.0016542371595278382, + 0.0003059905138798058, + 0.00025532461586408317 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0491740703582764, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 46.36857223510742, + 38788812.0, + 39461172.0, + 47582644.0, + 61831224.0 + ], + "hidden_norms_avg": [ + 994.04541015625, + 32215950.0, + 34096260.0, + 45599356.0, + 61425516.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0041363061172888e-05, + 4.480187609789965e-10, + 3.0562316566395964e-10, + 2.9085803210371353e-10, + 2.820148004012424e-10 + ], + "bp_grad_F": [ + 0.03149434179067612, + 6.209969433257356e-05, + 2.1469357847081483e-08, + 1.3228349970972886e-08, + 1.092844392758252e-08 + ], + "gamma_dfa": 0.00010758559074020013, + "gamma_dfa_per_layer": [ + -0.0014505982398986816, + 0.001327117788605392, + 0.0002981229918077588, + 0.0002556998224463314 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0554656982421875, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 46.4505729675293, + 38845108.0, + 39504860.0, + 47660992.0, + 62097052.0 + ], + "hidden_norms_avg": [ + 996.2877807617188, + 32178676.0, + 34106748.0, + 45494312.0, + 61553340.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0276962206698954e-05, + 4.5564105266571175e-10, + 3.0059965627771135e-10, + 2.8785077099691136e-10, + 2.794499076586021e-10 + ], + "bp_grad_F": [ + 0.011724308133125305, + 1.9755616449401714e-05, + 2.1592299503936374e-08, + 1.3796129572085647e-08, + 1.0886693324607677e-08 + ], + "gamma_dfa": 0.0002330350544070825, + "gamma_dfa_per_layer": [ + -0.0009828422917053103, + 0.0013922813814133406, + 0.00027237151516601443, + 0.00025032961275428534 + ], + "acc_eval": 0.2578125, + "loss_eval": 2.0504729747772217, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 46.521934509277344, + 39260604.0, + 39906660.0, + 48073644.0, + 62524844.0 + ], + "hidden_norms_avg": [ + 998.1359252929688, + 32138106.0, + 34129788.0, + 45757544.0, + 61958428.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9659293431905098e-05, + 4.597033309572396e-10, + 3.0463259692581346e-10, + 2.893623118893629e-10, + 2.780784769118583e-10 + ], + "bp_grad_F": [ + 0.009033501148223877, + 1.7998809198616073e-05, + 2.5067617315244206e-08, + 1.8738653295713448e-08, + 1.087139978039886e-08 + ], + "gamma_dfa": 0.00016801172751002014, + "gamma_dfa_per_layer": [ + -0.0013465819647535682, + 0.0014174225507304072, + 0.00031502131605520844, + 0.00028618500800803304 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0473151206970215, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 46.57882308959961, + 39427768.0, + 40090548.0, + 48369740.0, + 62859588.0 + ], + "hidden_norms_avg": [ + 999.5881958007812, + 32546802.0, + 34502940.0, + 46179212.0, + 62426560.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0221139240893535e-05, + 4.495410987903625e-10, + 3.065779852207129e-10, + 2.9148336522233365e-10, + 2.8107866034687845e-10 + ], + "bp_grad_F": [ + 0.016372976824641228, + 2.868929186661262e-05, + 2.4158071099122935e-08, + 2.1377838166358742e-08, + 1.0851396226030374e-08 + ], + "gamma_dfa": 0.00012949823576491326, + "gamma_dfa_per_layer": [ + -0.0014246907085180283, + 0.0013606694992631674, + 0.0003105594660155475, + 0.0002714546862989664 + ], + "acc_eval": 0.2568359375, + "loss_eval": 2.0468568801879883, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 46.621891021728516, + 39709320.0, + 40367452.0, + 48619224.0, + 63258040.0 + ], + "hidden_norms_avg": [ + 1000.7721557617188, + 33325650.0, + 35170832.0, + 47006208.0, + 63117408.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.0193185011739843e-05, + 4.388156504830931e-10, + 3.137757831339627e-10, + 2.8996427481331466e-10, + 2.7836044580453745e-10 + ], + "bp_grad_F": [ + 0.020163528621196747, + 3.054905027966015e-05, + 2.3064796295102497e-08, + 1.4526934322134366e-08, + 1.0852998499899513e-08 + ], + "gamma_dfa": 0.00017183857562486082, + "gamma_dfa_per_layer": [ + -0.0013185564894229174, + 0.0014156483812257648, + 0.00031098624458536506, + 0.00027927616611123085 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.054586410522461, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 46.65864562988281, + 39798476.0, + 40463920.0, + 48764504.0, + 63346472.0 + ], + "hidden_norms_avg": [ + 1001.6641845703125, + 33379128.0, + 35239452.0, + 46955488.0, + 63122060.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.965362000395544e-05, + 4.4001230437018535e-10, + 3.0546970508638083e-10, + 2.8820767994375274e-10, + 2.777780505613947e-10 + ], + "bp_grad_F": [ + 0.048469845205545425, + 4.790218736161478e-05, + 2.6222814142329298e-08, + 2.4079582772174035e-08, + 1.0861339383438917e-08 + ], + "gamma_dfa": -6.432890222640708e-05, + "gamma_dfa_per_layer": [ + -0.002126228529959917, + 0.0012497524730861187, + 0.00034036440774798393, + 0.0002787960402201861 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2.0531256198883057, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 46.683528900146484, + 39922192.0, + 40544356.0, + 48855360.0, + 63435588.0 + ], + "hidden_norms_avg": [ + 1002.31494140625, + 33437468.0, + 35316604.0, + 47039952.0, + 63236136.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.79724281426752e-05, + 4.357196548010478e-10, + 3.0789479299464517e-10, + 2.8999944112761966e-10, + 2.7672003577450255e-10 + ], + "bp_grad_F": [ + 0.009082098491489887, + 6.448025487770792e-06, + 2.3372145108169207e-08, + 1.58603672417712e-08, + 1.0855457865943663e-08 + ], + "gamma_dfa": 8.819025242701173e-05, + "gamma_dfa_per_layer": [ + -0.0015805144794285297, + 0.0013432127889245749, + 0.000321696512401104, + 0.00026836618781089783 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.0517051219940186, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 46.70249938964844, + 40094040.0, + 40695052.0, + 48969004.0, + 63542232.0 + ], + "hidden_norms_avg": [ + 1002.7830810546875, + 33826664.0, + 35653116.0, + 47279168.0, + 63409756.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8208709409227595e-05, + 4.3868975119210063e-10, + 3.102354484418868e-10, + 2.8893865078316594e-10, + 2.794520170823489e-10 + ], + "bp_grad_F": [ + 0.012775770388543606, + 3.5907680285163224e-05, + 3.276610627267473e-08, + 1.9733393585852355e-08, + 1.0837335473468102e-08 + ], + "gamma_dfa": -7.604052370879799e-06, + "gamma_dfa_per_layer": [ + -0.0020841513760387897, + 0.001464233035221696, + 0.0003138828033115715, + 0.0002756193280220032 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2.053762912750244, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 46.71390914916992, + 39990840.0, + 40613704.0, + 48947088.0, + 63626668.0 + ], + "hidden_norms_avg": [ + 1003.0780639648438, + 33512400.0, + 35398544.0, + 47052320.0, + 63319172.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.8852005925728008e-05, + 4.408986231663192e-10, + 3.0767774439333095e-10, + 2.8811911190196327e-10, + 2.780060626150771e-10 + ], + "bp_grad_F": [ + 0.017775027081370354, + 2.9518716473830864e-05, + 1.6785485001946654e-08, + 1.3991450664718741e-08, + 1.082214762249123e-08 + ], + "gamma_dfa": 0.0001292051310883835, + "gamma_dfa_per_layer": [ + -0.001528067048639059, + 0.0014583747833967209, + 0.0003044582554139197, + 0.0002820545341819525 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0512585639953613, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 46.72029495239258, + 40048976.0, + 40673908.0, + 49005780.0, + 63650516.0 + ], + "hidden_norms_avg": [ + 1003.2393188476562, + 33518072.0, + 35408260.0, + 47059300.0, + 63337588.0 + ], + "bp_grad_per_sample_l2_med": [ + 3.040391493414063e-05, + 4.422071042675668e-10, + 3.0922153726464785e-10, + 2.885988392709038e-10, + 2.7767882437856883e-10 + ], + "bp_grad_F": [ + 0.05996337905526161, + 4.702213846030645e-05, + 2.0060964445178797e-08, + 1.6814832193290385e-08, + 1.0825355722943186e-08 + ], + "gamma_dfa": 6.977042357902974e-05, + "gamma_dfa_per_layer": [ + -0.0016858375165611506, + 0.001342209754511714, + 0.00032920570811256766, + 0.00029350374825298786 + ], + "acc_eval": 0.25390625, + "loss_eval": 2.0525753498077393, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 46.723426818847656, + 40078224.0, + 40696452.0, + 49005116.0, + 63676392.0 + ], + "hidden_norms_avg": [ + 1003.3213500976562, + 33528454.0, + 35420932.0, + 47084140.0, + 63362884.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.9969949537189677e-05, + 4.438247824811725e-10, + 3.0574925924398144e-10, + 2.876155424935689e-10, + 2.772651552795935e-10 + ], + "bp_grad_F": [ + 0.015555496327579021, + 1.9468383470666595e-05, + 2.2645199493354085e-08, + 2.0153352764396004e-08, + 1.082723954937137e-08 + ], + "gamma_dfa": -2.766123361652717e-05, + "gamma_dfa_per_layer": [ + -0.0021022262517362833, + 0.0013793597463518381, + 0.0003187692491337657, + 0.0002934523217845708 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.05129337310791, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 46.72323226928711, + 40073516.0, + 40694276.0, + 48970848.0, + 63674696.0 + ], + "hidden_norms_avg": [ + 1003.3206176757812, + 33517796.0, + 35411552.0, + 47074216.0, + 63356572.0 + ], + "bp_grad_per_sample_l2_med": [ + 2.986433173646219e-05, + 4.4209438887499175e-10, + 3.069269838285038e-10, + 2.8717661582078335e-10, + 2.7721389073143143e-10 + ], + "bp_grad_F": [ + 0.011835500597953796, + 1.2977254300494678e-05, + 2.7325663509714104e-08, + 2.23609397664859e-08, + 1.0828303587118171e-08 + ], + "gamma_dfa": 4.879416519543156e-05, + "gamma_dfa_per_layer": [ + -0.0018596879672259092, + 0.0014319919282570481, + 0.0003201703366357833, + 0.00030270236311480403 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.051326274871826, + "epoch": 60 + } + ] +}
\ No newline at end of file |
