{ "config": { "output_dir": "results/snapshot_vit_v1", "epochs": 60, "lr": 0.001, "wd": 0.05, "seed": 456, "depth": 4, "d_model": 128, "n_heads": 4 }, "depth": 4, "d_model": 128, "architecture": "ViTMini", "bp_log": [ { "hidden_norms_cls": [ 0.3042769432067871, 3.2273340225219727, 4.6926493644714355, 6.003997802734375, 6.652705669403076 ], "hidden_norms_avg": [ 6.027750492095947, 7.1044697761535645, 7.910475730895996, 8.79189682006836, 9.458833694458008 ], "bp_grad_per_sample_l2_med": [ 0.005248428788036108, 0.0012287507997825742, 0.0010387187357991934, 0.0009678652859292924, 0.0009174557635560632 ], "bp_grad_F": [ 0.248850479722023, 0.0424945093691349, 0.0348997563123703, 0.03202275559306145, 0.030239813029766083 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.0791015625, "loss_eval": 2.544933319091797, "epoch": 0 }, { "hidden_norms_cls": [ 0.47296053171157837, 11.65749454498291, 18.3483943939209, 24.296405792236328, 29.94684410095215 ], "hidden_norms_avg": [ 4.04442834854126, 9.927255630493164, 14.762720108032227, 19.817049026489258, 24.69188690185547 ], "bp_grad_per_sample_l2_med": [ 0.0025219416711479425, 0.00024655580637045205, 0.00017099862452596426, 0.0001493149611633271, 0.00015047143097035587 ], "bp_grad_F": [ 0.11354690045118332, 0.00995445717126131, 0.006139951758086681, 0.005140931811183691, 0.005088545847684145 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.458984375, "loss_eval": 1.4817876815795898, "epoch": 1 }, { "hidden_norms_cls": [ 0.6174129843711853, 12.388140678405762, 20.656904220581055, 27.073535919189453, 32.43647003173828 ], "hidden_norms_avg": [ 3.8196825981140137, 10.982677459716797, 17.020437240600586, 22.471168518066406, 27.064218521118164 ], "bp_grad_per_sample_l2_med": [ 0.0020673249382525682, 0.0002501676499377936, 0.00015905944746918976, 0.00013718422269448638, 0.0001328626531176269 ], "bp_grad_F": [ 0.09556808322668076, 0.01051106583327055, 0.005822391714900732, 0.004766201134771109, 0.004577947780489922 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.498046875, "loss_eval": 1.356250286102295, "epoch": 2 }, { "hidden_norms_cls": [ 0.7216586470603943, 12.527997016906738, 19.815393447875977, 26.452791213989258, 30.71564483642578 ], "hidden_norms_avg": [ 3.8907485008239746, 11.261369705200195, 16.61492156982422, 21.57110023498535, 24.978900909423828 ], "bp_grad_per_sample_l2_med": [ 0.0021546317730098963, 0.00030062923906371, 0.00018509272194933146, 0.00013865686196368188, 0.00012920796871185303 ], "bp_grad_F": [ 0.10040326416492462, 0.012564396485686302, 0.007171053439378738, 0.005316051654517651, 0.004880763124674559 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5263671875, "loss_eval": 1.2655537128448486, "epoch": 3 }, { "hidden_norms_cls": [ 0.8026084899902344, 12.023736953735352, 20.35123062133789, 26.937381744384766, 31.122047424316406 ], "hidden_norms_avg": [ 3.9065797328948975, 11.544925689697266, 17.131011962890625, 22.292007446289062, 25.61225128173828 ], "bp_grad_per_sample_l2_med": [ 0.0019258656539022923, 0.00027825392317026854, 0.00017385024693794549, 0.0001323536125710234, 0.00012172113929409534 ], "bp_grad_F": [ 0.09238748997449875, 0.01207020040601492, 0.007036368828266859, 0.005208354443311691, 0.0047498126514256 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5673828125, "loss_eval": 1.1375834941864014, "epoch": 4 }, { "hidden_norms_cls": [ 0.8784403204917908, 11.689644813537598, 20.318578720092773, 27.47210121154785, 30.616111755371094 ], "hidden_norms_avg": [ 3.991969585418701, 11.499222755432129, 17.010013580322266, 21.869060516357422, 24.784456253051758 ], "bp_grad_per_sample_l2_med": [ 0.0017466156277805567, 0.00030884172883816063, 0.00018451173673383892, 0.00013519970525521785, 0.00011779358464991674 ], "bp_grad_F": [ 0.0881652981042862, 0.014197942800819874, 0.008167672902345657, 0.00570154283195734, 0.0048713223077356815 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.611328125, "loss_eval": 1.078152060508728, "epoch": 5 }, { "hidden_norms_cls": [ 0.9501535892486572, 12.59860610961914, 20.491111755371094, 27.280519485473633, 30.350204467773438 ], "hidden_norms_avg": [ 4.104201793670654, 12.098063468933105, 17.173715591430664, 21.416263580322266, 24.0885066986084 ], "bp_grad_per_sample_l2_med": [ 0.001603498705662787, 0.0003018827992491424, 0.00017963100981432945, 0.00013513887824956328, 0.00010907831892836839 ], "bp_grad_F": [ 0.08621370792388916, 0.01517424639314413, 0.008794959634542465, 0.006117440760135651, 0.0050094337202608585 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6337890625, "loss_eval": 1.0198562145233154, "epoch": 6 }, { "hidden_norms_cls": [ 1.000899076461792, 12.766633987426758, 21.096908569335938, 28.377235412597656, 31.630756378173828 ], "hidden_norms_avg": [ 4.143934726715088, 13.046825408935547, 18.295841217041016, 23.147098541259766, 25.70033836364746 ], "bp_grad_per_sample_l2_med": [ 0.0015043691964820027, 0.00027919537387788296, 0.0001850408734753728, 0.0001339056616416201, 0.00011227549111936241 ], "bp_grad_F": [ 0.07296615093946457, 0.012746848165988922, 0.00809843186289072, 0.005660817492753267, 0.00492064468562603 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6357421875, "loss_eval": 1.0125277042388916, "epoch": 7 }, { "hidden_norms_cls": [ 1.0544841289520264, 10.223775863647461, 18.59557342529297, 26.47129249572754, 29.77008819580078 ], "hidden_norms_avg": [ 4.213057994842529, 13.021050453186035, 18.172080993652344, 22.743032455444336, 25.225244522094727 ], "bp_grad_per_sample_l2_med": [ 0.001364147407002747, 0.0002890345931518823, 0.00017917664081323892, 0.000133156034280546, 0.00011372177687007934 ], "bp_grad_F": [ 0.07409710437059402, 0.015113108791410923, 0.00921319704502821, 0.006366679444909096, 0.005320113617926836 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6376953125, "loss_eval": 0.9630928039550781, "epoch": 8 }, { "hidden_norms_cls": [ 1.1071640253067017, 12.073644638061523, 19.524917602539062, 26.858781814575195, 30.318849563598633 ], "hidden_norms_avg": [ 4.280055522918701, 13.520170211791992, 18.620624542236328, 22.658164978027344, 25.25646209716797 ], "bp_grad_per_sample_l2_med": [ 0.0012990576215088367, 0.00027366873109713197, 0.00016998387582134455, 0.00012336595682427287, 9.77109739324078e-05 ], "bp_grad_F": [ 0.07662060856819153, 0.015166237019002438, 0.0096206646412611, 0.006477049086242914, 0.005294579081237316 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.654296875, "loss_eval": 0.9390516877174377, "epoch": 9 }, { "hidden_norms_cls": [ 1.1426520347595215, 12.005794525146484, 20.33642578125, 27.80829429626465, 31.22698974609375 ], "hidden_norms_avg": [ 4.328567981719971, 13.725446701049805, 19.644866943359375, 23.91346549987793, 26.409910202026367 ], "bp_grad_per_sample_l2_med": [ 0.0012125002685934305, 0.00027867915923707187, 0.00017298922466579825, 0.0001231397909577936, 0.00010014672443503514 ], "bp_grad_F": [ 0.06728038191795349, 0.014830472879111767, 0.008772061206400394, 0.006222804542630911, 0.00518346531316638 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6708984375, "loss_eval": 0.8987849950790405, "epoch": 10 }, { "hidden_norms_cls": [ 1.182861089706421, 11.343650817871094, 19.158103942871094, 26.537256240844727, 29.248126983642578 ], "hidden_norms_avg": [ 4.343320846557617, 13.940053939819336, 19.19382667541504, 23.443157196044922, 25.7342529296875 ], "bp_grad_per_sample_l2_med": [ 0.0012841055868193507, 0.00029811219428665936, 0.00019176788919139653, 0.0001351374085061252, 0.00010611475590849295 ], "bp_grad_F": [ 0.07373103499412537, 0.015750709921121597, 0.010071114636957645, 0.007257349323481321, 0.00578929902985692 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6708984375, "loss_eval": 0.9137783646583557, "epoch": 11 }, { "hidden_norms_cls": [ 1.2363859415054321, 11.583894729614258, 18.828346252441406, 26.30917739868164, 29.363861083984375 ], "hidden_norms_avg": [ 4.441896915435791, 13.568662643432617, 18.774181365966797, 22.73027801513672, 24.84675407409668 ], "bp_grad_per_sample_l2_med": [ 0.0011289563262835145, 0.00029387036920525134, 0.0001886928512249142, 0.00013024669897276908, 9.712533210404217e-05 ], "bp_grad_F": [ 0.06850193440914154, 0.016727343201637268, 0.010432050563395023, 0.00744031835347414, 0.0057919141836464405 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6865234375, "loss_eval": 0.8655319809913635, "epoch": 12 }, { "hidden_norms_cls": [ 1.276246428489685, 11.161674499511719, 18.18111801147461, 24.498512268066406, 28.472366333007812 ], "hidden_norms_avg": [ 4.438092231750488, 13.71449089050293, 18.358896255493164, 21.998794555664062, 24.44672966003418 ], "bp_grad_per_sample_l2_med": [ 0.001100392546504736, 0.0002873367629945278, 0.00018384194117970765, 0.0001337265275651589, 9.951705578714609e-05 ], "bp_grad_F": [ 0.06749056279659271, 0.01716373674571514, 0.010762249119579792, 0.007881316356360912, 0.005892573855817318 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6982421875, "loss_eval": 0.8163608908653259, "epoch": 13 }, { "hidden_norms_cls": [ 1.3131792545318604, 11.034884452819824, 17.936412811279297, 24.541194915771484, 28.02472496032715 ], "hidden_norms_avg": [ 4.504117012023926, 13.86273193359375, 18.456012725830078, 22.296085357666016, 24.57513427734375 ], "bp_grad_per_sample_l2_med": [ 0.0010489820269867778, 0.0002784461830742657, 0.00018129698582924902, 0.00013628850865643471, 0.00010334269609302282 ], "bp_grad_F": [ 0.06553377211093903, 0.016712775453925133, 0.010981550440192223, 0.007675213273614645, 0.006061363499611616 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.69921875, "loss_eval": 0.8088906407356262, "epoch": 14 }, { "hidden_norms_cls": [ 1.3631325960159302, 10.72367000579834, 17.147600173950195, 23.750171661376953, 26.97018051147461 ], "hidden_norms_avg": [ 4.5338335037231445, 13.55031967163086, 17.503305435180664, 21.003847122192383, 23.168630599975586 ], "bp_grad_per_sample_l2_med": [ 0.0010022176429629326, 0.0002914569922722876, 0.00018890199135057628, 0.00013593978655990213, 0.00010251985804643482 ], "bp_grad_F": [ 0.06372744590044022, 0.017576243728399277, 0.011715950444340706, 0.008481587283313274, 0.006441249046474695 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.701171875, "loss_eval": 0.815929651260376, "epoch": 15 }, { "hidden_norms_cls": [ 1.3926054239273071, 10.609240531921387, 17.234729766845703, 23.659292221069336, 27.24931526184082 ], "hidden_norms_avg": [ 4.513574600219727, 13.48448371887207, 17.66766929626465, 21.098644256591797, 23.213909149169922 ], "bp_grad_per_sample_l2_med": [ 0.0008784966776147485, 0.0002452125190757215, 0.0001629967155167833, 0.00012193062138976529, 8.820713992463425e-05 ], "bp_grad_F": [ 0.06515656411647797, 0.017664309591054916, 0.011493389494717121, 0.008405888453125954, 0.006338838487863541 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.71875, "loss_eval": 0.7755489349365234, "epoch": 16 }, { "hidden_norms_cls": [ 1.4288005828857422, 9.991934776306152, 16.30902671813965, 22.53181266784668, 25.98328971862793 ], "hidden_norms_avg": [ 4.606818199157715, 13.761014938354492, 18.061887741088867, 21.805465698242188, 23.856918334960938 ], "bp_grad_per_sample_l2_med": [ 0.0008885160204954445, 0.00026409278507344425, 0.0001749310758896172, 0.00012756467913277447, 8.965048618847504e-05 ], "bp_grad_F": [ 0.07283030450344086, 0.01973560079932213, 0.013354410417377949, 0.009586230851709843, 0.006897584535181522 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.693359375, "loss_eval": 0.8082709908485413, "epoch": 17 }, { "hidden_norms_cls": [ 1.4623849391937256, 9.794211387634277, 16.102649688720703, 21.62982940673828, 25.186201095581055 ], "hidden_norms_avg": [ 4.6317901611328125, 13.527764320373535, 17.6087589263916, 21.295202255249023, 23.361501693725586 ], "bp_grad_per_sample_l2_med": [ 0.0008634055848233402, 0.0002727442770265043, 0.00018466924666427076, 0.00013278424739837646, 8.995016105473042e-05 ], "bp_grad_F": [ 0.06913765519857407, 0.02126000076532364, 0.014007972553372383, 0.010056250728666782, 0.00732502993196249 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.720703125, "loss_eval": 0.7786685824394226, "epoch": 18 }, { "hidden_norms_cls": [ 1.4771180152893066, 9.776408195495605, 15.485087394714355, 21.054513931274414, 25.07387351989746 ], "hidden_norms_avg": [ 4.570744514465332, 13.13935375213623, 16.70624351501465, 20.002471923828125, 22.400487899780273 ], "bp_grad_per_sample_l2_med": [ 0.0008809147984720767, 0.00026235057157464325, 0.0001801249454729259, 0.0001285924663534388, 8.227767830248922e-05 ], "bp_grad_F": [ 0.07356031239032745, 0.02142982743680477, 0.014684871770441532, 0.010477974079549313, 0.007170504424721003 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7412109375, "loss_eval": 0.7548146843910217, "epoch": 19 }, { "hidden_norms_cls": [ 1.4932866096496582, 9.586905479431152, 15.190006256103516, 20.53044891357422, 23.871917724609375 ], "hidden_norms_avg": [ 4.640237808227539, 13.333914756774902, 16.603134155273438, 19.70735740661621, 21.712968826293945 ], "bp_grad_per_sample_l2_med": [ 0.0008201555465348065, 0.00025074987206608057, 0.00018013773660641164, 0.0001373633131152019, 8.871335012372583e-05 ], "bp_grad_F": [ 0.07453557848930359, 0.02180560864508152, 0.015117364004254341, 0.010920760221779346, 0.007648298051208258 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7294921875, "loss_eval": 0.7338082790374756, "epoch": 20 }, { "hidden_norms_cls": [ 1.5380369424819946, 8.941458702087402, 14.383026123046875, 19.64396858215332, 23.333805084228516 ], "hidden_norms_avg": [ 4.57804012298584, 12.777068138122559, 15.852535247802734, 19.008466720581055, 21.123043060302734 ], "bp_grad_per_sample_l2_med": [ 0.0007403296767733991, 0.00023140048142522573, 0.0001578826195327565, 0.00011260491737630218, 7.754044054308906e-05 ], "bp_grad_F": [ 0.07555028051137924, 0.024111615493893623, 0.01656532846391201, 0.01178746297955513, 0.007888367399573326 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.744140625, "loss_eval": 0.7344021201133728, "epoch": 21 }, { "hidden_norms_cls": [ 1.5561290979385376, 9.454068183898926, 14.400370597839355, 19.253843307495117, 22.27718734741211 ], "hidden_norms_avg": [ 4.687749862670898, 12.994861602783203, 15.969095230102539, 18.976381301879883, 20.873851776123047 ], "bp_grad_per_sample_l2_med": [ 0.0008383935783058405, 0.0002680755569599569, 0.000193025975022465, 0.00013935549941379577, 9.83258432825096e-05 ], "bp_grad_F": [ 0.06634547561407089, 0.021603766828775406, 0.01579204760491848, 0.011702721007168293, 0.008362310007214546 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.734375, "loss_eval": 0.7299590110778809, "epoch": 22 }, { "hidden_norms_cls": [ 1.5774884223937988, 8.741745948791504, 13.803518295288086, 18.90570831298828, 22.218149185180664 ], "hidden_norms_avg": [ 4.594933032989502, 12.66419506072998, 15.714310646057129, 19.085254669189453, 21.135629653930664 ], "bp_grad_per_sample_l2_med": [ 0.0006682098028250039, 0.00022848948719911277, 0.00016414522542618215, 0.0001115989507525228, 7.056116737658158e-05 ], "bp_grad_F": [ 0.07456765323877335, 0.024261610582470894, 0.01710386760532856, 0.012147205881774426, 0.008177526295185089 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7763671875, "loss_eval": 0.699420154094696, "epoch": 23 }, { "hidden_norms_cls": [ 1.576693058013916, 8.762345314025879, 13.443113327026367, 18.230920791625977, 22.07720375061035 ], "hidden_norms_avg": [ 4.667433738708496, 12.606098175048828, 15.544108390808105, 18.674053192138672, 20.65712547302246 ], "bp_grad_per_sample_l2_med": [ 0.0006520473980344832, 0.00022687950695399195, 0.0001629517209948972, 0.00011739470210159197, 7.377319707302377e-05 ], "bp_grad_F": [ 0.08037886768579483, 0.026545122265815735, 0.0190938338637352, 0.013439938426017761, 0.00869175884872675 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7353515625, "loss_eval": 0.733207106590271, "epoch": 24 }, { "hidden_norms_cls": [ 1.5915056467056274, 8.431538581848145, 13.075739860534668, 17.782840728759766, 20.799991607666016 ], "hidden_norms_avg": [ 4.626980304718018, 12.152971267700195, 14.936114311218262, 18.13477325439453, 19.853097915649414 ], "bp_grad_per_sample_l2_med": [ 0.0007118558278307319, 0.00024262107035610825, 0.0001753592659952119, 0.00012127246736781672, 7.87421886343509e-05 ], "bp_grad_F": [ 0.0734892264008522, 0.025602566078305244, 0.018658706918358803, 0.013666817918419838, 0.009108936414122581 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7578125, "loss_eval": 0.6893049478530884, "epoch": 25 }, { "hidden_norms_cls": [ 1.589570164680481, 8.064777374267578, 12.609880447387695, 17.195837020874023, 20.27288818359375 ], "hidden_norms_avg": [ 4.651576995849609, 12.02392578125, 14.5856351852417, 17.578563690185547, 19.327190399169922 ], "bp_grad_per_sample_l2_med": [ 0.0006660808576270938, 0.0002373493480263278, 0.0001695255923550576, 0.00012064678594470024, 7.89113255450502e-05 ], "bp_grad_F": [ 0.08072065562009811, 0.02827218733727932, 0.020335549488663673, 0.014427169226109982, 0.009556911885738373 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.755859375, "loss_eval": 0.7047942876815796, "epoch": 26 }, { "hidden_norms_cls": [ 1.6077263355255127, 7.734760284423828, 11.882841110229492, 15.991426467895508, 19.111549377441406 ], "hidden_norms_avg": [ 4.672310829162598, 11.994673728942871, 14.48837661743164, 16.922487258911133, 18.498437881469727 ], "bp_grad_per_sample_l2_med": [ 0.0005716760642826557, 0.00020494087948463857, 0.0001548439176985994, 0.00011144367454107851, 6.537805165862665e-05 ], "bp_grad_F": [ 0.08237622678279877, 0.03036416694521904, 0.022357620298862457, 0.01651921682059765, 0.010484294034540653 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7548828125, "loss_eval": 0.6863161325454712, "epoch": 27 }, { "hidden_norms_cls": [ 1.6167913675308228, 7.661223411560059, 11.857555389404297, 16.11384391784668, 19.207155227661133 ], "hidden_norms_avg": [ 4.6568603515625, 11.916447639465332, 14.127670288085938, 16.765464782714844, 18.548715591430664 ], "bp_grad_per_sample_l2_med": [ 0.0006015675025992095, 0.00022187062131706625, 0.00015665855607949197, 0.00011372221342753619, 6.673130701528862e-05 ], "bp_grad_F": [ 0.08522997796535492, 0.03222256526350975, 0.023626696318387985, 0.01693013124167919, 0.010611210018396378 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.75390625, "loss_eval": 0.6998279094696045, "epoch": 28 }, { "hidden_norms_cls": [ 1.6032800674438477, 7.3315229415893555, 11.458590507507324, 15.827820777893066, 19.03597640991211 ], "hidden_norms_avg": [ 4.592748641967773, 11.431793212890625, 13.694733619689941, 16.380725860595703, 17.913341522216797 ], "bp_grad_per_sample_l2_med": [ 0.0006015695980750024, 0.00023376141325570643, 0.00015724304830655456, 0.00010976113844662905, 6.412796210497618e-05 ], "bp_grad_F": [ 0.09064542502164841, 0.03456525132060051, 0.02491987682878971, 0.01721413992345333, 0.010797572322189808 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7734375, "loss_eval": 0.6845672130584717, "epoch": 29 }, { "hidden_norms_cls": [ 1.6067036390304565, 7.343894004821777, 11.072548866271973, 15.027584075927734, 17.731834411621094 ], "hidden_norms_avg": [ 4.656601428985596, 11.393535614013672, 13.465471267700195, 15.975980758666992, 17.53518295288086 ], "bp_grad_per_sample_l2_med": [ 0.0005384382093325257, 0.00021189975086599588, 0.0001552984758745879, 0.00010658086830517277, 6.326750008156523e-05 ], "bp_grad_F": [ 0.08886278420686722, 0.03500310331583023, 0.025932280346751213, 0.018638672307133675, 0.011571940965950489 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7666015625, "loss_eval": 0.6816176772117615, "epoch": 30 }, { "hidden_norms_cls": [ 1.6034201383590698, 7.28795051574707, 10.777915000915527, 14.885525703430176, 17.61635398864746 ], "hidden_norms_avg": [ 4.614856719970703, 11.156272888183594, 13.103291511535645, 15.514464378356934, 16.799636840820312 ], "bp_grad_per_sample_l2_med": [ 0.0005928887985646725, 0.0002398774668108672, 0.00018353872292209417, 0.00012629387492779642, 8.196983981179073e-05 ], "bp_grad_F": [ 0.09026212245225906, 0.03624382242560387, 0.027555860579013824, 0.019604889675974846, 0.012266743928194046 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7578125, "loss_eval": 0.6996170878410339, "epoch": 31 }, { "hidden_norms_cls": [ 1.611714243888855, 7.183743953704834, 10.724074363708496, 14.5570650100708, 17.022544860839844 ], "hidden_norms_avg": [ 4.623075485229492, 11.19589614868164, 13.009132385253906, 15.365489959716797, 16.62962532043457 ], "bp_grad_per_sample_l2_med": [ 0.00036223753704689443, 0.00014417112106457353, 0.00010984936670865864, 8.023829286685213e-05, 4.624977009370923e-05 ], "bp_grad_F": [ 0.09605100005865097, 0.03848516568541527, 0.029046298936009407, 0.021008647978305817, 0.012804670259356499 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7666015625, "loss_eval": 0.6707476377487183, "epoch": 32 }, { "hidden_norms_cls": [ 1.6100214719772339, 6.872183322906494, 10.294036865234375, 14.205705642700195, 17.145418167114258 ], "hidden_norms_avg": [ 4.6112518310546875, 11.086106300354004, 12.928976058959961, 15.350056648254395, 16.69057846069336 ], "bp_grad_per_sample_l2_med": [ 0.00041789902024902403, 0.00017518684035167098, 0.0001297849084949121, 8.867425640346482e-05, 4.886053648078814e-05 ], "bp_grad_F": [ 0.10439282655715942, 0.04290134832262993, 0.03223341330885887, 0.02269606664776802, 0.013486144132912159 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.759765625, "loss_eval": 0.7303465604782104, "epoch": 33 }, { "hidden_norms_cls": [ 1.5996708869934082, 6.756699085235596, 9.930717468261719, 13.55428695678711, 16.25560188293457 ], "hidden_norms_avg": [ 4.561036109924316, 10.72261905670166, 12.331817626953125, 14.622406005859375, 16.10407829284668 ], "bp_grad_per_sample_l2_med": [ 0.0004882134380750358, 0.0002138838026439771, 0.00016901774506550282, 0.0001125320850405842, 6.579834007425234e-05 ], "bp_grad_F": [ 0.10555483400821686, 0.043922487646341324, 0.03336327522993088, 0.02399253286421299, 0.013897648081183434 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7744140625, "loss_eval": 0.71100252866745, "epoch": 34 }, { "hidden_norms_cls": [ 1.5904232263565063, 6.662050247192383, 9.66409683227539, 13.113885879516602, 15.527644157409668 ], "hidden_norms_avg": [ 4.5454936027526855, 10.621905326843262, 12.306397438049316, 14.576898574829102, 15.954529762268066 ], "bp_grad_per_sample_l2_med": [ 0.0004819612659048289, 0.00020982844580430537, 0.00015760491078253835, 0.00010895934246946126, 5.958566543995403e-05 ], "bp_grad_F": [ 0.10991083830595016, 0.047212228178977966, 0.03634340688586235, 0.02575613744556904, 0.014786512590944767 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7705078125, "loss_eval": 0.7015272378921509, "epoch": 35 }, { "hidden_norms_cls": [ 1.5926766395568848, 6.752022743225098, 9.809683799743652, 13.14870548248291, 15.66618537902832 ], "hidden_norms_avg": [ 4.554390907287598, 10.59433650970459, 12.38070011138916, 14.597192764282227, 15.870081901550293 ], "bp_grad_per_sample_l2_med": [ 0.00043442551395855844, 0.0001767174544511363, 0.0001353291590930894, 9.88640749710612e-05, 5.115106250741519e-05 ], "bp_grad_F": [ 0.11412353813648224, 0.04936130344867706, 0.03786878660321236, 0.027230119332671165, 0.015144454315304756 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7734375, "loss_eval": 0.7246569395065308, "epoch": 36 }, { "hidden_norms_cls": [ 1.5873360633850098, 6.424077987670898, 9.43139934539795, 12.677597999572754, 15.172491073608398 ], "hidden_norms_avg": [ 4.4964070320129395, 10.287262916564941, 11.751147270202637, 13.867583274841309, 15.24795150756836 ], "bp_grad_per_sample_l2_med": [ 0.0004166838189121336, 0.0001985515555134043, 0.00014922211994417012, 0.0001073441599146463, 5.765057721873745e-05 ], "bp_grad_F": [ 0.11522030830383301, 0.05126715078949928, 0.039791759103536606, 0.028239542618393898, 0.015849631279706955 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.76953125, "loss_eval": 0.7268451452255249, "epoch": 37 }, { "hidden_norms_cls": [ 1.5890607833862305, 6.295929431915283, 9.119135856628418, 12.20608901977539, 14.642122268676758 ], "hidden_norms_avg": [ 4.5021796226501465, 10.095436096191406, 11.7933988571167, 13.924290657043457, 15.25149917602539 ], "bp_grad_per_sample_l2_med": [ 0.0004105751868337393, 0.00017681249300949275, 0.00014306302182376385, 9.77686358965002e-05, 5.147796036908403e-05 ], "bp_grad_F": [ 0.12662801146507263, 0.057947222143411636, 0.044759348034858704, 0.03212600201368332, 0.017064588144421577 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7587890625, "loss_eval": 0.7464388012886047, "epoch": 38 }, { "hidden_norms_cls": [ 1.5761758089065552, 6.18004846572876, 9.069403648376465, 12.180702209472656, 14.516327857971191 ], "hidden_norms_avg": [ 4.492326736450195, 9.971968650817871, 11.50478744506836, 13.5086669921875, 14.760706901550293 ], "bp_grad_per_sample_l2_med": [ 0.0003273288893979043, 0.00015071693633217365, 0.00011665018246276304, 8.30927092465572e-05, 4.371673639980145e-05 ], "bp_grad_F": [ 0.1212363913655281, 0.055609479546546936, 0.04309426248073578, 0.0311796423047781, 0.016882745549082756 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7783203125, "loss_eval": 0.7176246643066406, "epoch": 39 }, { "hidden_norms_cls": [ 1.5679142475128174, 6.109372615814209, 8.818140029907227, 11.853668212890625, 14.200343132019043 ], "hidden_norms_avg": [ 4.478363037109375, 9.777668952941895, 11.217857360839844, 13.170299530029297, 14.35566520690918 ], "bp_grad_per_sample_l2_med": [ 0.0003435175749473274, 0.00015563883061986417, 0.00011927648301934823, 8.298752072732896e-05, 4.157157673034817e-05 ], "bp_grad_F": [ 0.13136376440525055, 0.06076597049832344, 0.046719472855329514, 0.033368490636348724, 0.01777712069451809 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.78125, "loss_eval": 0.7149413228034973, "epoch": 40 }, { "hidden_norms_cls": [ 1.5576080083847046, 6.149768829345703, 8.711091041564941, 11.498035430908203, 13.903903007507324 ], "hidden_norms_avg": [ 4.435859680175781, 9.742182731628418, 10.966800689697266, 12.826833724975586, 13.987249374389648 ], "bp_grad_per_sample_l2_med": [ 0.0002820935333147645, 0.00013546310947276652, 0.00010691316856537014, 7.935341272968799e-05, 4.027710747322999e-05 ], "bp_grad_F": [ 0.1424364149570465, 0.0660286620259285, 0.05190045386552811, 0.037452246993780136, 0.019488148391246796 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.759765625, "loss_eval": 0.7794969081878662, "epoch": 41 }, { "hidden_norms_cls": [ 1.55929696559906, 6.027406215667725, 8.56254768371582, 11.315313339233398, 13.816405296325684 ], "hidden_norms_avg": [ 4.444095611572266, 9.598461151123047, 11.017721176147461, 12.939472198486328, 14.150469779968262 ], "bp_grad_per_sample_l2_med": [ 0.00028881963226012886, 0.00014081982953939587, 0.00010864014620892704, 7.903494406491518e-05, 3.460505831753835e-05 ], "bp_grad_F": [ 0.14435029029846191, 0.06792720407247543, 0.05288391932845116, 0.03809889778494835, 0.0192741546779871 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7783203125, "loss_eval": 0.7500836253166199, "epoch": 42 }, { "hidden_norms_cls": [ 1.5569288730621338, 5.83992338180542, 8.285759925842285, 11.15902328491211, 13.44404125213623 ], "hidden_norms_avg": [ 4.416918754577637, 9.525116920471191, 10.900503158569336, 12.753186225891113, 13.810358047485352 ], "bp_grad_per_sample_l2_med": [ 0.0003584402147680521, 0.00016757070261519402, 0.000135006892378442, 8.858168439473957e-05, 4.690655987360515e-05 ], "bp_grad_F": [ 0.14751866459846497, 0.07057010382413864, 0.05518123507499695, 0.039941366761922836, 0.019994540140032768 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.783203125, "loss_eval": 0.7740926146507263, "epoch": 43 }, { "hidden_norms_cls": [ 1.5507482290267944, 5.7182297706604, 8.143424034118652, 10.900334358215332, 13.179159164428711 ], "hidden_norms_avg": [ 4.415921688079834, 9.42380142211914, 10.672327995300293, 12.439417839050293, 13.481410026550293 ], "bp_grad_per_sample_l2_med": [ 0.0002743537479545921, 0.00013802653120364994, 0.00010440178448334336, 7.395831926260144e-05, 3.546295192791149e-05 ], "bp_grad_F": [ 0.15799099206924438, 0.0763181671500206, 0.060047682374715805, 0.043460771441459656, 0.02125636488199234 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.78125, "loss_eval": 0.7693630456924438, "epoch": 44 }, { "hidden_norms_cls": [ 1.5424573421478271, 5.688177585601807, 7.995815753936768, 10.642090797424316, 12.71364688873291 ], "hidden_norms_avg": [ 4.399099349975586, 9.228434562683105, 10.541167259216309, 12.30521297454834, 13.311983108520508 ], "bp_grad_per_sample_l2_med": [ 0.00024789522285573184, 0.0001290303043788299, 9.614775626687333e-05, 6.680067599518225e-05, 3.041914533241652e-05 ], "bp_grad_F": [ 0.16617916524410248, 0.08274275809526443, 0.06457101553678513, 0.04608331620693207, 0.02214660868048668 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.77734375, "loss_eval": 0.7963705062866211, "epoch": 45 }, { "hidden_norms_cls": [ 1.5373201370239258, 5.651702880859375, 7.870075702667236, 10.383352279663086, 12.742950439453125 ], "hidden_norms_avg": [ 4.359274387359619, 9.120989799499512, 10.328361511230469, 11.979691505432129, 13.047332763671875 ], "bp_grad_per_sample_l2_med": [ 0.00020789829432033002, 0.00010236673551844433, 8.31241559353657e-05, 5.5589163821423426e-05, 2.5046059818123467e-05 ], "bp_grad_F": [ 0.1711728274822235, 0.08452030271291733, 0.06641850620508194, 0.048034753650426865, 0.022233933210372925 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.796875, "loss_eval": 0.787158727645874, "epoch": 46 }, { "hidden_norms_cls": [ 1.534119725227356, 5.64213752746582, 7.87826681137085, 10.351583480834961, 12.802285194396973 ], "hidden_norms_avg": [ 4.381091594696045, 9.210761070251465, 10.374320030212402, 12.017292976379395, 13.094472885131836 ], "bp_grad_per_sample_l2_med": [ 0.00020434240286704153, 9.69645261648111e-05, 7.39863608032465e-05, 5.592328670900315e-05, 2.489626240276266e-05 ], "bp_grad_F": [ 0.17339713871479034, 0.08632633090019226, 0.06861955672502518, 0.05006933584809303, 0.022428762167692184 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7919921875, "loss_eval": 0.7851632833480835, "epoch": 47 }, { "hidden_norms_cls": [ 1.5289297103881836, 5.52672004699707, 7.675796985626221, 10.204718589782715, 12.873387336730957 ], "hidden_norms_avg": [ 4.3382954597473145, 8.994754791259766, 10.112909317016602, 11.741432189941406, 12.863862037658691 ], "bp_grad_per_sample_l2_med": [ 0.0001689869095571339, 8.723067730898038e-05, 6.962454062886536e-05, 4.9918842705665156e-05, 2.0077559383935295e-05 ], "bp_grad_F": [ 0.1893138736486435, 0.09529414772987366, 0.07472710311412811, 0.053626082837581635, 0.023708311840891838 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7802734375, "loss_eval": 0.8306612968444824, "epoch": 48 }, { "hidden_norms_cls": [ 1.5282790660858154, 5.412533760070801, 7.559310436248779, 10.040712356567383, 12.344849586486816 ], "hidden_norms_avg": [ 4.344850063323975, 8.943357467651367, 10.036619186401367, 11.63318157196045, 12.690427780151367 ], "bp_grad_per_sample_l2_med": [ 0.00015994974819477648, 8.589095523348078e-05, 6.632162694586441e-05, 4.7776728024473414e-05, 1.923311901919078e-05 ], "bp_grad_F": [ 0.19004860520362854, 0.09673094749450684, 0.07585947215557098, 0.05484768748283386, 0.02464146539568901 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7880859375, "loss_eval": 0.8193543553352356, "epoch": 49 }, { "hidden_norms_cls": [ 1.5247719287872314, 5.414742469787598, 7.496610164642334, 9.884673118591309, 12.301740646362305 ], "hidden_norms_avg": [ 4.334397792816162, 8.873777389526367, 9.937097549438477, 11.524014472961426, 12.564128875732422 ], "bp_grad_per_sample_l2_med": [ 0.00016137116472236812, 8.459146192763001e-05, 7.113611354725435e-05, 4.750298467115499e-05, 1.9900418919860385e-05 ], "bp_grad_F": [ 0.1871533840894699, 0.09687218815088272, 0.0768747329711914, 0.05509059876203537, 0.024593451991677284 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.80078125, "loss_eval": 0.810278058052063, "epoch": 50 }, { "hidden_norms_cls": [ 1.5175530910491943, 5.423762798309326, 7.493518352508545, 9.848480224609375, 12.152653694152832 ], "hidden_norms_avg": [ 4.333771228790283, 8.846830368041992, 9.895172119140625, 11.470880508422852, 12.51230239868164 ], "bp_grad_per_sample_l2_med": [ 0.00018688049749471247, 9.502686589257792e-05, 7.833576091798022e-05, 5.505367516889237e-05, 2.1109613953740336e-05 ], "bp_grad_F": [ 0.19925038516521454, 0.10273440927267075, 0.08146088570356369, 0.05800405889749527, 0.025326546281576157 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.79296875, "loss_eval": 0.8315975069999695, "epoch": 51 }, { "hidden_norms_cls": [ 1.5154390335083008, 5.332769870758057, 7.351593971252441, 9.726226806640625, 12.217824935913086 ], "hidden_norms_avg": [ 4.312089443206787, 8.77189826965332, 9.80828857421875, 11.376079559326172, 12.424320220947266 ], "bp_grad_per_sample_l2_med": [ 0.0001625730947125703, 8.300685294670984e-05, 6.064521585358307e-05, 4.498598718782887e-05, 1.878884904726874e-05 ], "bp_grad_F": [ 0.20003639161586761, 0.10495735704898834, 0.08297032862901688, 0.059033025056123734, 0.02547283098101616 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7890625, "loss_eval": 0.8281288146972656, "epoch": 52 }, { "hidden_norms_cls": [ 1.5136713981628418, 5.367674827575684, 7.355134963989258, 9.682082176208496, 12.047696113586426 ], "hidden_norms_avg": [ 4.316784381866455, 8.783827781677246, 9.812792778015137, 11.395760536193848, 12.420063018798828 ], "bp_grad_per_sample_l2_med": [ 0.00016071743448264897, 7.887884567026049e-05, 6.097723598941229e-05, 4.243743751430884e-05, 1.8102018657373264e-05 ], "bp_grad_F": [ 0.20199808478355408, 0.10541712492704391, 0.0835103914141655, 0.05967256799340248, 0.025771932676434517 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7890625, "loss_eval": 0.8389135599136353, "epoch": 53 }, { "hidden_norms_cls": [ 1.5129119157791138, 5.326069355010986, 7.275172233581543, 9.633310317993164, 12.064473152160645 ], "hidden_norms_avg": [ 4.308472633361816, 8.717856407165527, 9.717677116394043, 11.28734016418457, 12.3176851272583 ], "bp_grad_per_sample_l2_med": [ 0.00015608215471729636, 8.108095789793879e-05, 6.294465129030868e-05, 4.2116138502024114e-05, 1.7733293134369887e-05 ], "bp_grad_F": [ 0.20727074146270752, 0.10958535224199295, 0.08667060732841492, 0.06113011762499809, 0.026037005707621574 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.787109375, "loss_eval": 0.8504288792610168, "epoch": 54 }, { "hidden_norms_cls": [ 1.5120813846588135, 5.313214302062988, 7.253427982330322, 9.583664894104004, 12.01283073425293 ], "hidden_norms_avg": [ 4.303354263305664, 8.709893226623535, 9.714727401733398, 11.287162780761719, 12.301621437072754 ], "bp_grad_per_sample_l2_med": [ 0.00014261712203733623, 8.006545249372721e-05, 6.104232306824997e-05, 4.1361305193277076e-05, 1.670202073000837e-05 ], "bp_grad_F": [ 0.20587928593158722, 0.10970292240381241, 0.0869779959321022, 0.06163511052727699, 0.02630491554737091 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7919921875, "loss_eval": 0.8500803709030151, "epoch": 55 }, { "hidden_norms_cls": [ 1.5113301277160645, 5.33270263671875, 7.255039215087891, 9.560588836669922, 11.935233116149902 ], "hidden_norms_avg": [ 4.311485767364502, 8.737537384033203, 9.710383415222168, 11.27385425567627, 12.309149742126465 ], "bp_grad_per_sample_l2_med": [ 0.00014448253205046058, 7.629570609424263e-05, 6.040706284693442e-05, 4.236707536620088e-05, 1.7641770682530478e-05 ], "bp_grad_F": [ 0.20638784766197205, 0.10957971960306168, 0.08719436824321747, 0.06181200593709946, 0.026369713246822357 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7900390625, "loss_eval": 0.8525989055633545, "epoch": 56 }, { "hidden_norms_cls": [ 1.5115892887115479, 5.313480377197266, 7.247244834899902, 9.550230979919434, 11.989883422851562 ], "hidden_norms_avg": [ 4.3022141456604, 8.688987731933594, 9.685582160949707, 11.234566688537598, 12.270132064819336 ], "bp_grad_per_sample_l2_med": [ 0.0001483379164710641, 7.948598067741841e-05, 6.1946535424795e-05, 4.4680935388896614e-05, 1.6852744010975584e-05 ], "bp_grad_F": [ 0.21088635921478271, 0.11181779950857162, 0.08855349570512772, 0.06269123405218124, 0.026410162448883057 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7890625, "loss_eval": 0.8474454879760742, "epoch": 57 }, { "hidden_norms_cls": [ 1.5110703706741333, 5.306856632232666, 7.230412483215332, 9.542105674743652, 11.942556381225586 ], "hidden_norms_avg": [ 4.305404186248779, 8.697504997253418, 9.679413795471191, 11.226194381713867, 12.25047492980957 ], "bp_grad_per_sample_l2_med": [ 0.00014003549586050212, 7.460260530933738e-05, 6.204132660059258e-05, 3.912465035682544e-05, 1.6441039406345226e-05 ], "bp_grad_F": [ 0.20991134643554688, 0.11143218725919724, 0.08832813799381256, 0.06269684433937073, 0.026480402797460556 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.791015625, "loss_eval": 0.8496487140655518, "epoch": 58 }, { "hidden_norms_cls": [ 1.5111491680145264, 5.304075717926025, 7.234795093536377, 9.53318977355957, 11.964473724365234 ], "hidden_norms_avg": [ 4.304405689239502, 8.697833061218262, 9.683843612670898, 11.22890853881836, 12.259684562683105 ], "bp_grad_per_sample_l2_med": [ 0.00014237761206459254, 7.472094148397446e-05, 5.683211929863319e-05, 4.049929339089431e-05, 1.4964447473175824e-05 ], "bp_grad_F": [ 0.21009324491024017, 0.11155029386281967, 0.08846566081047058, 0.06290413439273834, 0.026488499715924263 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.794921875, "loss_eval": 0.8498167395591736, "epoch": 59 }, { "hidden_norms_cls": [ 1.5111573934555054, 5.304897785186768, 7.23397970199585, 9.53254508972168, 11.969621658325195 ], "hidden_norms_avg": [ 4.304327964782715, 8.696623802185059, 9.681411743164062, 11.225934982299805, 12.255182266235352 ], "bp_grad_per_sample_l2_med": [ 0.0001376860454911366, 7.4876043072436e-05, 5.8659916248871014e-05, 4.048796836286783e-05, 1.5446972611243837e-05 ], "bp_grad_F": [ 0.210032656788826, 0.11159469932317734, 0.08847951143980026, 0.06288634985685349, 0.02649829164147377 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.791015625, "loss_eval": 0.8496516942977905, "epoch": 60 } ], "dfa_log": [ { "hidden_norms_cls": [ 0.3042769432067871, 3.2273340225219727, 4.6926493644714355, 6.003997802734375, 6.652705669403076 ], "hidden_norms_avg": [ 6.027750492095947, 7.1044697761535645, 7.910475730895996, 8.79189682006836, 9.458833694458008 ], "bp_grad_per_sample_l2_med": [ 0.005248428788036108, 0.0012287507997825742, 0.0010387187357991934, 0.0009678652859292924, 0.0009174557635560632 ], "bp_grad_F": [ 0.248850479722023, 0.0424945093691349, 0.0348997563123703, 0.03202275559306145, 0.030239813029766083 ], "gamma_dfa": -0.0027123973850393668, "gamma_dfa_per_layer": [ -0.0010305923642590642, -0.01111956313252449, 0.0014823779929429293, -0.00018181203631684184 ], "acc_eval": 0.0791015625, "loss_eval": 2.544933319091797, "epoch": 0 }, { "hidden_norms_cls": [ 1.8898234367370605, 1755.5985107421875, 3812.865966796875, 4063.967529296875, 6749.62646484375 ], "hidden_norms_avg": [ 48.02373504638672, 2610.970458984375, 7442.5693359375, 13001.9443359375, 19569.59765625 ], "bp_grad_per_sample_l2_med": [ 0.0006367825553752482, 1.061867237694969e-06, 9.113553005590802e-07, 8.042399599617056e-07, 7.901451226643985e-07 ], "bp_grad_F": [ 0.11358296871185303, 5.570299981627613e-05, 4.605366484611295e-05, 3.752685370272957e-05, 3.027659113286063e-05 ], "gamma_dfa": 0.007312511210329831, "gamma_dfa_per_layer": [ 0.01007317565381527, 0.008024577051401138, 0.008248038589954376, 0.0029042535461485386 ], "acc_eval": 0.2333984375, "loss_eval": 2.0879125595092773, "epoch": 1 }, { "hidden_norms_cls": [ 3.704786777496338, 7219.806640625, 19592.4140625, 21808.44921875, 46117.11328125 ], "hidden_norms_avg": [ 97.33866882324219, 9787.240234375, 35216.66015625, 64377.67578125, 97116.8125 ], "bp_grad_per_sample_l2_med": [ 9.637367475079373e-05, 1.6794896851024532e-07, 1.5954641696680483e-07, 1.4061814113119908e-07, 1.445507677999558e-07 ], "bp_grad_F": [ 0.04642009362578392, 2.128358573827427e-05, 2.0123250578762963e-05, 6.922710781509522e-06, 6.6381039687257726e-06 ], "gamma_dfa": 0.007922766148112714, "gamma_dfa_per_layer": [ 0.016379408538341522, 0.005931380204856396, 0.007020577322691679, 0.0023596985265612602 ], "acc_eval": 0.205078125, "loss_eval": 2.1287283897399902, "epoch": 2 }, { "hidden_norms_cls": [ 5.554904937744141, 16081.3388671875, 48028.96875, 51717.93359375, 100197.7265625 ], "hidden_norms_avg": [ 147.4190216064453, 22860.939453125, 90670.5078125, 172520.15625, 247624.09375 ], "bp_grad_per_sample_l2_med": [ 3.051399289688561e-05, 9.248702070863146e-08, 7.303499671706959e-08, 6.487525183729304e-08, 6.620962977876843e-08 ], "bp_grad_F": [ 0.034720927476882935, 1.6823112673591822e-05, 1.1384844583517406e-05, 3.0318508379423292e-06, 2.624829903652426e-06 ], "gamma_dfa": 0.0067759081866825, "gamma_dfa_per_layer": [ 0.014651123434305191, 0.004187515936791897, 0.007594288792461157, 0.0006707045831717551 ], "acc_eval": 0.20703125, "loss_eval": 2.107574462890625, "epoch": 3 }, { "hidden_norms_cls": [ 7.38655424118042, 30113.763671875, 92815.4375, 102848.4453125, 183389.40625 ], "hidden_norms_avg": [ 194.20396423339844, 39156.78515625, 166144.453125, 360300.25, 500574.96875 ], "bp_grad_per_sample_l2_med": [ 2.7757007046602666e-05, 6.177719313882335e-08, 4.3474216226968565e-08, 3.8972562066419414e-08, 3.9463689205376795e-08 ], "bp_grad_F": [ 0.03289186581969261, 5.563175363931805e-06, 2.151713033526903e-06, 1.463158696424216e-06, 1.3795681752526434e-06 ], "gamma_dfa": 0.006396490931365406, "gamma_dfa_per_layer": [ 0.015158161520957947, 0.0035972977057099342, 0.006714952643960714, 0.00011555185483302921 ], "acc_eval": 0.203125, "loss_eval": 2.1379737854003906, "epoch": 4 }, { "hidden_norms_cls": [ 9.15835189819336, 53591.8984375, 170615.734375, 181427.171875, 289063.5625 ], "hidden_norms_avg": [ 238.28347778320312, 61062.31640625, 250187.6875, 548101.3125, 724058.1875 ], "bp_grad_per_sample_l2_med": [ 2.960537312901579e-05, 4.670241438020639e-08, 3.080446120407032e-08, 2.670985388419922e-08, 2.6331489877406966e-08 ], "bp_grad_F": [ 0.016260992735624313, 4.766869551531272e-06, 2.067620698653627e-06, 9.787106591829797e-07, 8.912123234949831e-07 ], "gamma_dfa": 0.0068261599517427385, "gamma_dfa_per_layer": [ 0.014116348698735237, 0.003242844482883811, 0.008411802351474762, 0.0015336442738771439 ], "acc_eval": 0.1962890625, "loss_eval": 2.1309733390808105, "epoch": 5 }, { "hidden_norms_cls": [ 10.888343811035156, 91755.1171875, 249917.8125, 274005.3125, 444277.53125 ], "hidden_norms_avg": [ 276.9202880859375, 104021.7109375, 349872.5, 931915.875, 1222273.75 ], "bp_grad_per_sample_l2_med": [ 2.7342781322658993e-05, 3.6854661544794e-08, 2.4993127567540796e-08, 1.8662358769461207e-08, 1.7811659702715588e-08 ], "bp_grad_F": [ 0.022468894720077515, 3.493201802484691e-06, 1.1520894531713566e-06, 7.113425795068906e-07, 6.108040793151304e-07 ], "gamma_dfa": 0.007193240569904447, "gamma_dfa_per_layer": [ 0.017048656940460205, 0.002665129955857992, 0.007390158250927925, 0.001669017132371664 ], "acc_eval": 0.2109375, "loss_eval": 2.1020355224609375, "epoch": 6 }, { "hidden_norms_cls": [ 12.623483657836914, 158915.890625, 360070.6875, 406906.3125, 630641.3125 ], "hidden_norms_avg": [ 315.0859680175781, 172244.328125, 490065.59375, 1510240.375, 1952914.5 ], "bp_grad_per_sample_l2_med": [ 3.403881783015095e-05, 2.7625405962794503e-08, 1.651102543576144e-08, 1.1742161909467086e-08, 1.0927361238088906e-08 ], "bp_grad_F": [ 0.024832597002387047, 1.8080392010233481e-06, 7.246239306368807e-07, 4.936595132676302e-07, 4.0145107504940825e-07 ], "gamma_dfa": 0.006596001767320558, "gamma_dfa_per_layer": [ 0.016851693391799927, 0.001910479972139001, 0.0058369822800159454, 0.0017848514253273606 ], "acc_eval": 0.2138671875, "loss_eval": 2.1312928199768066, "epoch": 7 }, { "hidden_norms_cls": [ 14.368335723876953, 243332.8125, 525771.0, 593291.75, 875288.5 ], "hidden_norms_avg": [ 351.16015625, 247222.375, 640658.75, 1855662.75, 2391194.25 ], "bp_grad_per_sample_l2_med": [ 2.87416060018586e-05, 1.8018790015617014e-08, 1.2651691250198382e-08, 9.33115984480537e-09, 8.563736386690834e-09 ], "bp_grad_F": [ 0.017871394753456116, 9.426115070709784e-07, 4.7217255882969766e-07, 3.564711050785263e-07, 3.2240865266430774e-07 ], "gamma_dfa": 0.006289168493822217, "gamma_dfa_per_layer": [ 0.013373943977057934, 0.0037157258484512568, 0.00672483816742897, 0.001342165982350707 ], "acc_eval": 0.220703125, "loss_eval": 2.0829837322235107, "epoch": 8 }, { "hidden_norms_cls": [ 16.041412353515625, 385486.09375, 776263.875, 869037.0, 1191002.25 ], "hidden_norms_avg": [ 383.5213317871094, 383708.40625, 941498.0, 2793651.25, 3510556.5 ], "bp_grad_per_sample_l2_med": [ 2.8917142117279582e-05, 1.1363525231899985e-08, 8.616331648170217e-09, 5.602694308493028e-09, 5.260086588521062e-09 ], "bp_grad_F": [ 0.024791762232780457, 6.833873840150773e-07, 3.100701633229619e-07, 2.26619619070334e-07, 2.1342954426017968e-07 ], "gamma_dfa": 0.00652129843365401, "gamma_dfa_per_layer": [ 0.014406262896955013, 0.004345592111349106, 0.006529162637889385, 0.0008041760884225368 ], "acc_eval": 0.2197265625, "loss_eval": 2.1437277793884277, "epoch": 9 }, { "hidden_norms_cls": [ 17.677919387817383, 582942.5, 1148260.75, 1279834.25, 1709270.625 ], "hidden_norms_avg": [ 416.1814880371094, 530246.375, 1201761.5, 2944394.0, 3732565.75 ], "bp_grad_per_sample_l2_med": [ 3.369058686075732e-05, 6.623859238885643e-09, 4.513381224313662e-09, 3.933114278709127e-09, 3.794405678547719e-09 ], "bp_grad_F": [ 0.01620429754257202, 3.022730652446626e-07, 1.9097409165169665e-07, 1.773983058228623e-07, 1.593236333974346e-07 ], "gamma_dfa": 0.006082151841837913, "gamma_dfa_per_layer": [ 0.01578153669834137, 0.002655572956427932, 0.005509376525878906, 0.00038212118670344353 ], "acc_eval": 0.197265625, "loss_eval": 2.089698314666748, "epoch": 10 }, { "hidden_norms_cls": [ 19.31073760986328, 843820.0625, 1587423.25, 1759006.0, 2222149.5 ], "hidden_norms_avg": [ 448.93133544921875, 796172.1875, 1678321.375, 3888912.0, 4810418.0 ], "bp_grad_per_sample_l2_med": [ 4.445635568117723e-05, 3.5140981236025937e-09, 2.8926525619255017e-09, 2.65975419466713e-09, 2.6499111793754082e-09 ], "bp_grad_F": [ 0.020245229825377464, 2.6993967594535206e-07, 1.701987457636278e-07, 1.3198047099649557e-07, 1.2469256205349666e-07 ], "gamma_dfa": 0.005559869911849091, "gamma_dfa_per_layer": [ 0.015185668133199215, 0.0025689376052469015, 0.004468783736228943, 1.6090172721305862e-05 ], "acc_eval": 0.2314453125, "loss_eval": 2.0838193893432617, "epoch": 11 }, { "hidden_norms_cls": [ 20.861183166503906, 1157778.75, 2054207.5, 2289084.5, 2841995.0 ], "hidden_norms_avg": [ 479.8387145996094, 981138.875, 2112497.25, 4439588.0, 5517614.5 ], "bp_grad_per_sample_l2_med": [ 3.176981772412546e-05, 3.1782512177613853e-09, 2.5456772245746606e-09, 2.4393245201537184e-09, 2.414718425214346e-09 ], "bp_grad_F": [ 0.09368129819631577, 9.166008680949744e-07, 2.675243706562469e-07, 1.0984689424731187e-07, 1.0444787079677553e-07 ], "gamma_dfa": 0.004390636342577636, "gamma_dfa_per_layer": [ 0.011994147673249245, 0.001997251994907856, 0.003865728620439768, -0.00029458291828632355 ], "acc_eval": 0.224609375, "loss_eval": 2.0896079540252686, "epoch": 12 }, { "hidden_norms_cls": [ 22.362810134887695, 1504072.375, 2527410.75, 2870361.25, 3557771.0 ], "hidden_norms_avg": [ 510.81561279296875, 1188843.375, 2574796.25, 5296089.0, 6640932.5 ], "bp_grad_per_sample_l2_med": [ 2.8154454412288032e-05, 3.057065711686846e-09, 2.121731013104977e-09, 2.0999049166192663e-09, 2.0892536589656174e-09 ], "bp_grad_F": [ 0.011068353429436684, 1.3467251847032458e-06, 1.0581060649883511e-07, 9.427417069218791e-08, 9.197237460512042e-08 ], "gamma_dfa": 0.003989392673247494, "gamma_dfa_per_layer": [ 0.011822337284684181, 0.001384879695251584, 0.00329465395770967, -0.0005443002446554601 ], "acc_eval": 0.244140625, "loss_eval": 2.077056407928467, "epoch": 13 }, { "hidden_norms_cls": [ 23.812599182128906, 1930070.0, 2995981.75, 3469627.0, 4303896.0 ], "hidden_norms_avg": [ 539.9255981445312, 1589889.5, 3066154.25, 6015238.0, 7540605.5 ], "bp_grad_per_sample_l2_med": [ 3.170168929500505e-05, 2.518652619798445e-09, 1.924201020742089e-09, 1.8520206479522017e-09, 1.8417810609960839e-09 ], "bp_grad_F": [ 0.032089244574308395, 1.0142422297576559e-06, 1.6566445992793888e-07, 8.33219857554468e-08, 7.640721122470495e-08 ], "gamma_dfa": 0.0029267592035466805, "gamma_dfa_per_layer": [ 0.008105762302875519, 0.001629034522920847, 0.0022919299080967903, -0.000319689919706434 ], "acc_eval": 0.224609375, "loss_eval": 2.0748229026794434, "epoch": 14 }, { "hidden_norms_cls": [ 25.248563766479492, 2452306.5, 3664022.75, 4168536.0, 5106242.5 ], "hidden_norms_avg": [ 570.19384765625, 1965615.5, 3710471.5, 7372995.0, 9239893.0 ], "bp_grad_per_sample_l2_med": [ 2.4190969270421192e-05, 1.8390389211475622e-09, 1.5613663695290825e-09, 1.5359991056840272e-09, 1.5388512686342892e-09 ], "bp_grad_F": [ 0.015056902542710304, 6.693913292110665e-06, 1.241161982079575e-07, 7.622224984515924e-08, 6.743793790064956e-08 ], "gamma_dfa": 0.0022661721595795825, "gamma_dfa_per_layer": [ 0.006208081729710102, 0.001149914925917983, 0.0020575951784849167, -0.0003509031957946718 ], "acc_eval": 0.236328125, "loss_eval": 2.0835204124450684, "epoch": 15 }, { "hidden_norms_cls": [ 26.6426944732666, 3107169.0, 4381372.0, 5027998.5, 6065136.0 ], "hidden_norms_avg": [ 596.7793579101562, 2542559.0, 4400625.5, 8374831.5, 10510773.0 ], "bp_grad_per_sample_l2_med": [ 2.787545781757217e-05, 1.5701163702530607e-09, 1.2841328000945396e-09, 1.2669904014828148e-09, 1.2700215323846464e-09 ], "bp_grad_F": [ 0.006971500348299742, 1.8619180991663598e-05, 6.465826629664662e-08, 5.84209978171657e-08, 5.694714744208795e-08 ], "gamma_dfa": 0.0030232197314035147, "gamma_dfa_per_layer": [ 0.009539565071463585, 0.0012945058988407254, 0.0015697493217885494, -0.0003109413664788008 ], "acc_eval": 0.236328125, "loss_eval": 2.058485507965088, "epoch": 16 }, { "hidden_norms_cls": [ 27.95879364013672, 3613966.25, 5044349.0, 5874924.0, 7080756.0 ], "hidden_norms_avg": [ 623.2052612304688, 2844551.5, 4942977.0, 8742455.0, 11094594.0 ], "bp_grad_per_sample_l2_med": [ 2.8442762413760647e-05, 1.629689605486817e-09, 1.115437520127216e-09, 1.0797144289753646e-09, 1.0779978021346892e-09 ], "bp_grad_F": [ 0.0072508929297327995, 1.4132167507341364e-06, 6.271753250075562e-08, 4.991998281411725e-08, 4.950436149897541e-08 ], "gamma_dfa": 0.001284227124415338, "gamma_dfa_per_layer": [ 0.00256139412522316, 0.0014944188296794891, 0.0013982560485601425, -0.0003171605058014393 ], "acc_eval": 0.240234375, "loss_eval": 2.0549392700195312, "epoch": 17 }, { "hidden_norms_cls": [ 29.22184181213379, 4211867.5, 5636704.5, 6891397.5, 8559809.0 ], "hidden_norms_avg": [ 647.4288330078125, 3423908.25, 5695376.5, 10367815.0, 13188250.0 ], "bp_grad_per_sample_l2_med": [ 2.8086895326850936e-05, 1.1501447572115353e-09, 8.738501033889179e-10, 8.528160400089746e-10, 8.584906674435899e-10 ], "bp_grad_F": [ 0.012267161160707474, 1.591232035025314e-06, 4.697067268466526e-08, 4.271150899626264e-08, 4.017679700041299e-08 ], "gamma_dfa": 0.0022953646985115483, "gamma_dfa_per_layer": [ 0.007007642649114132, 0.0012370320037007332, 0.0011846421984955668, -0.0002478580572642386 ], "acc_eval": 0.228515625, "loss_eval": 2.053128242492676, "epoch": 18 }, { "hidden_norms_cls": [ 30.412078857421875, 4986411.0, 6504586.0, 7889628.0, 9783147.0 ], "hidden_norms_avg": [ 670.3391723632812, 3921667.0, 6270645.0, 10589857.0, 13580617.0 ], "bp_grad_per_sample_l2_med": [ 2.768085505522322e-05, 1.3132780418700918e-09, 7.742924079678914e-10, 7.418777814294231e-10, 7.448673344789825e-10 ], "bp_grad_F": [ 0.007575999945402145, 1.7771724287740653e-06, 5.529824420591467e-08, 3.790939828718365e-08, 3.6307092443621514e-08 ], "gamma_dfa": 0.0009071348831639625, "gamma_dfa_per_layer": [ 0.001273356145247817, 0.001484773471020162, 0.0010661636479198933, -0.00019575373153202236 ], "acc_eval": 0.25390625, "loss_eval": 2.0479414463043213, "epoch": 19 }, { "hidden_norms_cls": [ 31.54771614074707, 5502896.5, 7070197.5, 8994800.0, 11604998.0 ], "hidden_norms_avg": [ 692.4578247070312, 4249610.0, 6837255.0, 11617683.0, 15223152.0 ], "bp_grad_per_sample_l2_med": [ 3.0367684303200804e-05, 1.325711207478264e-09, 6.525959217462685e-10, 6.324714640904006e-10, 6.32227936669949e-10 ], "bp_grad_F": [ 0.0062190573662519455, 1.129235442931531e-06, 3.317861896334762e-08, 3.131979653403505e-08, 3.109861168582029e-08 ], "gamma_dfa": 0.0011510169642861001, "gamma_dfa_per_layer": [ 0.002568549243733287, 0.0013005147920921445, 0.0009535959688946605, -0.00021859214757569134 ], "acc_eval": 0.255859375, "loss_eval": 2.0359444618225098, "epoch": 20 }, { "hidden_norms_cls": [ 32.638641357421875, 6320697.0, 7897073.5, 10165307.0, 13313912.0 ], "hidden_norms_avg": [ 713.3525390625, 4812640.5, 7533297.5, 12847435.0, 16993420.0 ], "bp_grad_per_sample_l2_med": [ 3.871564695145935e-05, 1.2221273992807369e-09, 6.080098646776833e-10, 5.917044632042234e-10, 5.89539916884263e-10 ], "bp_grad_F": [ 0.011915000155568123, 6.25122083874885e-06, 3.6603957198622084e-08, 2.876341298474472e-08, 2.8581927935533713e-08 ], "gamma_dfa": 0.0002986440376844257, "gamma_dfa_per_layer": [ -0.0004627959569916129, 0.0009951044339686632, 0.0008257199660874903, -0.00016345229232683778 ], "acc_eval": 0.2626953125, "loss_eval": 2.059875965118408, "epoch": 21 }, { "hidden_norms_cls": [ 33.6330451965332, 7264995.5, 8758988.0, 11785280.0, 15874132.0 ], "hidden_norms_avg": [ 732.8869018554688, 5982206.0, 8454064.0, 14846262.0, 19834080.0 ], "bp_grad_per_sample_l2_med": [ 2.5420635211048648e-05, 7.56205986718328e-10, 5.169706884800007e-10, 5.026724592127607e-10, 5.024383686880185e-10 ], "bp_grad_F": [ 0.014803220517933369, 4.478873961488716e-06, 4.4555019229619575e-08, 2.4910459472948787e-08, 2.4745437698925343e-08 ], "gamma_dfa": 0.001046390665578656, "gamma_dfa_per_layer": [ 0.0027164756320416927, 0.0009058329742401838, 0.0007253356743603945, -0.00016208161832764745 ], "acc_eval": 0.255859375, "loss_eval": 2.0538365840911865, "epoch": 22 }, { "hidden_norms_cls": [ 34.621524810791016, 8089090.5, 9671455.0, 13086530.0, 17616980.0 ], "hidden_norms_avg": [ 751.2442016601562, 6699752.5, 9159771.0, 15622865.0, 21214146.0 ], "bp_grad_per_sample_l2_med": [ 2.7939373467233963e-05, 7.656756340068682e-10, 5.061054908495066e-10, 4.837483191799663e-10, 4.820439047925618e-10 ], "bp_grad_F": [ 0.008210284635424614, 3.91981393477181e-06, 2.727725245676993e-08, 2.349457695061119e-08, 2.2768137597495297e-08 ], "gamma_dfa": 0.0013028495595790446, "gamma_dfa_per_layer": [ 0.0034610098227858543, 0.0012297509238123894, 0.0006837932160124183, -0.00016315572429448366 ], "acc_eval": 0.2646484375, "loss_eval": 2.0430214405059814, "epoch": 23 }, { "hidden_norms_cls": [ 35.54478454589844, 9145767.0, 10558942.0, 14636200.0, 19721632.0 ], "hidden_norms_avg": [ 768.5211791992188, 7473006.0, 10093548.0, 17775052.0, 24159262.0 ], "bp_grad_per_sample_l2_med": [ 3.364618532941677e-05, 8.066202705769854e-10, 4.5619852340195166e-10, 4.4121445386124947e-10, 4.323804370098827e-10 ], "bp_grad_F": [ 0.09167197346687317, 4.855019597016508e-06, 2.689265521382822e-08, 2.1627007740221416e-08, 2.0867716443717654e-08 ], "gamma_dfa": 0.0001647558601689525, "gamma_dfa_per_layer": [ -0.0005364040262065828, 0.0007433416321873665, 0.0005910456529818475, -0.00013895981828682125 ], "acc_eval": 0.23046875, "loss_eval": 2.0427517890930176, "epoch": 24 }, { "hidden_norms_cls": [ 36.43881607055664, 10216266.0, 11478190.0, 16476424.0, 22393992.0 ], "hidden_norms_avg": [ 785.1990966796875, 8300483.0, 10872433.0, 18667924.0, 25447926.0 ], "bp_grad_per_sample_l2_med": [ 3.0938736017560586e-05, 7.561202219896757e-10, 4.2832748459176173e-10, 4.0923736621678586e-10, 4.0218126051705383e-10 ], "bp_grad_F": [ 0.013463743962347507, 1.9222785340389237e-05, 2.2825457079989064e-08, 1.9977358434175585e-08, 1.9259800865256693e-08 ], "gamma_dfa": 0.0005702937960450072, "gamma_dfa_per_layer": [ 0.0011116554960608482, 0.0007594762137159705, 0.0005430461023934186, -0.00013300262799020857 ], "acc_eval": 0.2568359375, "loss_eval": 2.0594615936279297, "epoch": 25 }, { "hidden_norms_cls": [ 37.30263137817383, 11623684.0, 12776919.0, 18306868.0, 24740858.0 ], "hidden_norms_avg": [ 800.9972534179688, 9603253.0, 12104963.0, 20835068.0, 28405318.0 ], "bp_grad_per_sample_l2_med": [ 3.261065648985095e-05, 6.65525801135658e-10, 3.838940831890625e-10, 3.742672838313865e-10, 3.7395189722566613e-10 ], "bp_grad_F": [ 0.007853930816054344, 1.2899076864414383e-06, 1.9278010299217385e-08, 1.8154999281705386e-08, 1.7368931182204506e-08 ], "gamma_dfa": 0.00021361159815569408, "gamma_dfa_per_layer": [ -0.00034064118517562747, 0.0008438127697445452, 0.0004718025156762451, -0.00012052770762238652 ], "acc_eval": 0.255859375, "loss_eval": 2.0433781147003174, "epoch": 26 }, { "hidden_norms_cls": [ 38.06776428222656, 12599130.0, 13703165.0, 19834172.0, 26867468.0 ], "hidden_norms_avg": [ 816.2463989257812, 10421772.0, 12873138.0, 21321398.0, 29452538.0 ], "bp_grad_per_sample_l2_med": [ 2.774638414848596e-05, 6.227232618449818e-10, 3.566741624272396e-10, 3.4781866276034634e-10, 3.45437983773067e-10 ], "bp_grad_F": [ 0.013920681551098824, 3.4208371744171018e-06, 2.1883508338760294e-08, 1.7128741092165e-08, 1.6603545205384762e-08 ], "gamma_dfa": 0.0008690126524015795, "gamma_dfa_per_layer": [ 0.0021882583387196064, 0.0009064457844942808, 0.0004841286572627723, -0.00010278217087034136 ], "acc_eval": 0.2529296875, "loss_eval": 2.0433974266052246, "epoch": 27 }, { "hidden_norms_cls": [ 38.7847785949707, 14429584.0, 15438086.0, 21566880.0, 29267340.0 ], "hidden_norms_avg": [ 830.9344482421875, 11436777.0, 13832175.0, 22913616.0, 32026754.0 ], "bp_grad_per_sample_l2_med": [ 2.8682481570285745e-05, 5.758302168423768e-10, 3.3607527871737375e-10, 3.304233830991876e-10, 3.2846284026000205e-10 ], "bp_grad_F": [ 0.012251574546098709, 2.996052717207931e-05, 2.7452134787608884e-08, 1.577506480998636e-08, 1.5141546683139495e-08 ], "gamma_dfa": 0.0004505918041104451, "gamma_dfa_per_layer": [ 0.00026967719895765185, 0.001212525530718267, 0.0004131481982767582, -9.298371151089668e-05 ], "acc_eval": 0.2607421875, "loss_eval": 2.039923667907715, "epoch": 28 }, { "hidden_norms_cls": [ 39.49647521972656, 15523604.0, 16504434.0, 23236370.0, 31306890.0 ], "hidden_norms_avg": [ 844.8562622070312, 12856661.0, 15124535.0, 23633704.0, 32995118.0 ], "bp_grad_per_sample_l2_med": [ 2.6219468054478057e-05, 5.519696366640403e-10, 3.2825916984613457e-10, 3.235848811122821e-10, 3.2190172749579915e-10 ], "bp_grad_F": [ 0.012884745374321938, 1.8329246813664213e-05, 1.8323355277516384e-08, 1.5584015855552025e-08, 1.4755748622974352e-08 ], "gamma_dfa": 0.0006857650478195865, "gamma_dfa_per_layer": [ 0.0016966589028015733, 0.0007126724813133478, 0.0003994358121417463, -6.570700497832149e-05 ], "acc_eval": 0.2451171875, "loss_eval": 2.0533735752105713, "epoch": 29 }, { "hidden_norms_cls": [ 40.16881561279297, 16141660.0, 17137856.0, 24286464.0, 32903152.0 ], "hidden_norms_avg": [ 857.8116455078125, 12895693.0, 15492559.0, 23745768.0, 33843860.0 ], "bp_grad_per_sample_l2_med": [ 3.2289473892888054e-05, 6.340856728570543e-10, 3.264067627295475e-10, 3.149370209065694e-10, 3.097411216401724e-10 ], "bp_grad_F": [ 0.006337009835988283, 1.7065680367522873e-05, 5.785592804841144e-08, 1.519365788738014e-08, 1.464850551968766e-08 ], "gamma_dfa": 0.0005419648223323748, "gamma_dfa_per_layer": [ 0.00038546844734810293, 0.0014093497302383184, 0.0004054713645018637, -3.243025275878608e-05 ], "acc_eval": 0.265625, "loss_eval": 2.0390102863311768, "epoch": 30 }, { "hidden_norms_cls": [ 40.790164947509766, 18768648.0, 19610716.0, 26926266.0, 36060360.0 ], "hidden_norms_avg": [ 869.6182861328125, 15248417.0, 17480158.0, 26928640.0, 37555876.0 ], "bp_grad_per_sample_l2_med": [ 2.939497062470764e-05, 5.127394064885493e-10, 3.1137872835707014e-10, 3.074558663218596e-10, 3.04990144250894e-10 ], "bp_grad_F": [ 0.03832927718758583, 8.881174835551064e-06, 2.5206949416656244e-08, 1.4185034480362901e-08, 1.3504863893842867e-08 ], "gamma_dfa": 0.0005767397606177838, "gamma_dfa_per_layer": [ 0.00058704090770334, 0.0013887862442061305, 0.0003486467176117003, -1.751482705003582e-05 ], "acc_eval": 0.232421875, "loss_eval": 2.055915117263794, "epoch": 31 }, { "hidden_norms_cls": [ 41.36415481567383, 20590018.0, 21418164.0, 28674892.0, 38102536.0 ], "hidden_norms_avg": [ 880.8012084960938, 15857472.0, 18200580.0, 27607590.0, 38905496.0 ], "bp_grad_per_sample_l2_med": [ 2.6930878448183648e-05, 5.041319584009329e-10, 3.0716035270828e-10, 2.9963459491355593e-10, 2.9755845010193127e-10 ], "bp_grad_F": [ 0.01052916795015335, 1.7662874597590417e-05, 1.8223250464188823e-08, 1.4229329714510186e-08, 1.2928855319671584e-08 ], "gamma_dfa": 0.0005623552362976625, "gamma_dfa_per_layer": [ 0.0005056762602180243, 0.00140343327075243, 0.0003372218052390963, 3.0896089810994454e-06 ], "acc_eval": 0.2451171875, "loss_eval": 2.054579734802246, "epoch": 32 }, { "hidden_norms_cls": [ 41.9267578125, 21995458.0, 22701258.0, 30227660.0, 40381468.0 ], "hidden_norms_avg": [ 891.6727294921875, 17925388.0, 19924592.0, 29375846.0, 41265952.0 ], "bp_grad_per_sample_l2_med": [ 3.4433691325830296e-05, 4.786913088139499e-10, 3.083476807219654e-10, 3.030005690796145e-10, 3.0202479406327143e-10 ], "bp_grad_F": [ 0.006410651374608278, 9.426087672181893e-06, 1.748733602369157e-08, 1.330249954634155e-08, 1.2548162509062877e-08 ], "gamma_dfa": 0.0005204869294175296, "gamma_dfa_per_layer": [ 0.0004088875139132142, 0.001322226831689477, 0.00032363145146518946, 2.7201920602237806e-05 ], "acc_eval": 0.2568359375, "loss_eval": 2.0504493713378906, "epoch": 33 }, { "hidden_norms_cls": [ 42.43289566040039, 23788478.0, 24547006.0, 32122702.0, 42524392.0 ], "hidden_norms_avg": [ 902.5420532226562, 19126440.0, 21210522.0, 30872922.0, 43207040.0 ], "bp_grad_per_sample_l2_med": [ 2.8793765523005277e-05, 4.69506655775831e-10, 2.9882180063722785e-10, 2.9027436010409247e-10, 2.88086998700976e-10 ], "bp_grad_F": [ 0.02046363614499569, 1.535968840471469e-05, 1.9181511490273806e-08, 1.3211375105015577e-08, 1.2052867148781843e-08 ], "gamma_dfa": 0.0005800028211524477, "gamma_dfa_per_layer": [ 0.0005789051647298038, 0.001365642063319683, 0.0003222030645702034, 5.326099199010059e-05 ], "acc_eval": 0.236328125, "loss_eval": 2.056929349899292, "epoch": 34 }, { "hidden_norms_cls": [ 42.88957595825195, 24876160.0, 25665632.0, 33698024.0, 44433192.0 ], "hidden_norms_avg": [ 912.5694580078125, 20388924.0, 22492538.0, 32293406.0, 44758584.0 ], "bp_grad_per_sample_l2_med": [ 3.043079595954623e-05, 4.6556239419182077e-10, 3.0177585430557485e-10, 2.9259758504984745e-10, 2.8850585809259144e-10 ], "bp_grad_F": [ 0.018651673570275307, 8.0938043538481e-06, 2.600621051840335e-08, 1.3419185762586494e-08, 1.200509913701353e-08 ], "gamma_dfa": 0.0008372370848519495, "gamma_dfa_per_layer": [ 0.001413366524502635, 0.0015261531807482243, 0.0003260627272538841, 8.336590690305457e-05 ], "acc_eval": 0.2353515625, "loss_eval": 2.060340404510498, "epoch": 35 }, { "hidden_norms_cls": [ 43.32978057861328, 25917158.0, 26720118.0, 34948196.0, 46313048.0 ], "hidden_norms_avg": [ 921.58642578125, 21474648.0, 23549474.0, 33572188.0, 46615396.0 ], "bp_grad_per_sample_l2_med": [ 3.262757672928274e-05, 4.5062673037499223e-10, 2.984587021970242e-10, 2.923088993078693e-10, 2.888300987269332e-10 ], "bp_grad_F": [ 0.01846941001713276, 2.4291131921927445e-05, 2.994345393858566e-08, 1.4564162320596097e-08, 1.1765412644137996e-08 ], "gamma_dfa": 0.0007057133989292197, "gamma_dfa_per_layer": [ 0.0011925556464120746, 0.0012432597577571869, 0.0002897845406550914, 9.725365089252591e-05 ], "acc_eval": 0.2451171875, "loss_eval": 2.0591180324554443, "epoch": 36 }, { "hidden_norms_cls": [ 43.74128341674805, 27200966.0, 27911578.0, 36161972.0, 47854788.0 ], "hidden_norms_avg": [ 930.2008666992188, 22529414.0, 24601434.0, 34829948.0, 48238220.0 ], "bp_grad_per_sample_l2_med": [ 3.328157981741242e-05, 4.659617691693541e-10, 2.8960928100119077e-10, 2.8687860420539835e-10, 2.800103759970085e-10 ], "bp_grad_F": [ 0.004556785803288221, 9.644008059694897e-06, 1.5685751364458156e-08, 1.2929571191477862e-08, 1.1707988356590704e-08 ], "gamma_dfa": 0.0005315981106832623, "gamma_dfa_per_layer": [ 0.0004304055473767221, 0.0012520912569016218, 0.0003118191962130368, 0.0001320764422416687 ], "acc_eval": 0.255859375, "loss_eval": 2.049736738204956, "epoch": 37 }, { "hidden_norms_cls": [ 44.10750198364258, 28860724.0, 29566448.0, 37605440.0, 49767188.0 ], "hidden_norms_avg": [ 938.7098999023438, 24297102.0, 26192510.0, 36561148.0, 49957968.0 ], "bp_grad_per_sample_l2_med": [ 2.900460640375968e-05, 4.445998014190877e-10, 2.888302930159625e-10, 2.855987946137617e-10, 2.818917876901139e-10 ], "bp_grad_F": [ 0.013354518450796604, 6.135221156000625e-06, 1.780158420672251e-08, 1.3947193622243503e-08, 1.161484952660885e-08 ], "gamma_dfa": 0.0005519518890650943, "gamma_dfa_per_layer": [ 0.0005505518638528883, 0.001156628131866455, 0.00033354441984556615, 0.0001670831406954676 ], "acc_eval": 0.2412109375, "loss_eval": 2.0527162551879883, "epoch": 38 }, { "hidden_norms_cls": [ 44.42500305175781, 30085758.0, 30793664.0, 39317268.0, 51773680.0 ], "hidden_norms_avg": [ 946.3699340820312, 24723960.0, 26763662.0, 37607688.0, 51575988.0 ], "bp_grad_per_sample_l2_med": [ 2.9910466764704324e-05, 4.753269444712771e-10, 2.936461906966059e-10, 2.873846438600225e-10, 2.8520716344182517e-10 ], "bp_grad_F": [ 0.00976789090782404, 1.76885150722228e-05, 1.7970489096796882e-08, 1.3952313970833075e-08, 1.130456972475713e-08 ], "gamma_dfa": 0.0009108289959840477, "gamma_dfa_per_layer": [ 0.0019160081865265965, 0.0012680008076131344, 0.00030145354685373604, 0.00015785344294272363 ], "acc_eval": 0.2412109375, "loss_eval": 2.0550765991210938, "epoch": 39 }, { "hidden_norms_cls": [ 44.73127746582031, 30730856.0, 31431762.0, 40187116.0, 53148352.0 ], "hidden_norms_avg": [ 953.6856079101562, 24778752.0, 27014248.0, 38275640.0, 52795456.0 ], "bp_grad_per_sample_l2_med": [ 2.8919872420374304e-05, 4.755910110176842e-10, 2.84101492331601e-10, 2.7933383384137755e-10, 2.7627339305169585e-10 ], "bp_grad_F": [ 0.009574169293045998, 4.757252463605255e-05, 1.5709005651842745e-08, 1.3778580054690792e-08, 1.1154800638735196e-08 ], "gamma_dfa": 0.0003838329284917563, "gamma_dfa_per_layer": [ -0.0004134870832785964, 0.001480170525610447, 0.0002943193248938769, 0.00017432894674129784 ], "acc_eval": 0.255859375, "loss_eval": 2.0383803844451904, "epoch": 40 }, { "hidden_norms_cls": [ 44.999107360839844, 32617970.0, 33381886.0, 41663220.0, 54853168.0 ], "hidden_norms_avg": [ 960.5386962890625, 27910628.0, 29647900.0, 40418716.0, 54716684.0 ], "bp_grad_per_sample_l2_med": [ 2.9992028430569917e-05, 4.221052118946744e-10, 2.9753777219809763e-10, 2.8370578109004896e-10, 2.813366484222257e-10 ], "bp_grad_F": [ 0.015446176752448082, 3.8060017686802894e-05, 5.211516906911129e-08, 1.3235438522940512e-08, 1.116207481999254e-08 ], "gamma_dfa": 0.0005705733274226077, "gamma_dfa_per_layer": [ 0.0006168894469738007, 0.0011725829681381583, 0.00029753358103334904, 0.00019528731354512274 ], "acc_eval": 0.240234375, "loss_eval": 2.0557656288146973, "epoch": 41 }, { "hidden_norms_cls": [ 45.25053024291992, 33936992.0, 34621240.0, 42946580.0, 56031144.0 ], "hidden_norms_avg": [ 966.2922973632812, 28239400.0, 30055502.0, 41338012.0, 56048388.0 ], "bp_grad_per_sample_l2_med": [ 3.0256345780799165e-05, 4.424338395647709e-10, 2.9891861208497517e-10, 2.8403482343897224e-10, 2.798661857816853e-10 ], "bp_grad_F": [ 0.006179355084896088, 8.527667887392454e-06, 2.116273023489157e-08, 1.2261468285146293e-08, 1.1058569171495947e-08 ], "gamma_dfa": 0.0009438929373573046, "gamma_dfa_per_layer": [ 0.00216879416257143, 0.0010916339233517647, 0.0003159396001137793, 0.00019920406339224428 ], "acc_eval": 0.2470703125, "loss_eval": 2.0517942905426025, "epoch": 42 }, { "hidden_norms_cls": [ 45.481727600097656, 34746476.0, 35397348.0, 43639664.0, 57119836.0 ], "hidden_norms_avg": [ 971.5364379882812, 28891962.0, 30705540.0, 42078288.0, 57065612.0 ], "bp_grad_per_sample_l2_med": [ 2.9764614737359807e-05, 4.5060349895820195e-10, 3.0148228358228835e-10, 2.912529661891483e-10, 2.8715479993834947e-10 ], "bp_grad_F": [ 0.02291245572268963, 1.3926567589805927e-05, 3.118159241921603e-08, 2.1897225366274142e-08, 1.1063916893760961e-08 ], "gamma_dfa": 0.00046937728620832786, "gamma_dfa_per_layer": [ -0.00010078266495838761, 0.0014219002332538366, 0.0003067174111492932, 0.00024967416538856924 ], "acc_eval": 0.2451171875, "loss_eval": 2.054462432861328, "epoch": 43 }, { "hidden_norms_cls": [ 45.68215560913086, 35169816.0, 35827116.0, 44266788.0, 58219984.0 ], "hidden_norms_avg": [ 976.61279296875, 29302304.0, 31207594.0, 42541932.0, 57918596.0 ], "bp_grad_per_sample_l2_med": [ 3.18697166221682e-05, 4.4465031656670817e-10, 3.0559865749069104e-10, 2.891223926937414e-10, 2.8127278284273416e-10 ], "bp_grad_F": [ 0.02285478264093399, 5.0576767534948885e-05, 2.966898726697309e-08, 1.374073210769211e-08, 1.1011787037773502e-08 ], "gamma_dfa": 0.0006015256294631399, "gamma_dfa_per_layer": [ 0.0005435256171040237, 0.0013653798960149288, 0.000284912355709821, 0.0002122846490237862 ], "acc_eval": 0.244140625, "loss_eval": 2.0539493560791016, "epoch": 44 }, { "hidden_norms_cls": [ 45.86240005493164, 36071220.0, 36702996.0, 45105948.0, 59117940.0 ], "hidden_norms_avg": [ 980.9766845703125, 29250424.0, 31315982.0, 42895240.0, 58632240.0 ], "bp_grad_per_sample_l2_med": [ 3.0838917155051604e-05, 4.517226037670241e-10, 3.037594897836726e-10, 2.95300450758873e-10, 2.8246391337027887e-10 ], "bp_grad_F": [ 0.009441024623811245, 2.5670700779301114e-05, 2.221704953342396e-08, 1.750507294673298e-08, 1.1021731971538884e-08 ], "gamma_dfa": 0.00038505904376506805, "gamma_dfa_per_layer": [ -0.0006303560803644359, 0.0016098625492304564, 0.00032150247716344893, 0.00023922722903080285 ], "acc_eval": 0.244140625, "loss_eval": 2.0488905906677246, "epoch": 45 }, { "hidden_norms_cls": [ 46.00979995727539, 36876176.0, 37547776.0, 45586304.0, 59641656.0 ], "hidden_norms_avg": [ 984.9158935546875, 29720264.0, 31840778.0, 43341952.0, 59202960.0 ], "bp_grad_per_sample_l2_med": [ 2.8270042093936354e-05, 4.981586254615422e-10, 3.011032534416813e-10, 2.830454204350019e-10, 2.763113071679868e-10 ], "bp_grad_F": [ 0.01947774738073349, 4.3539188482100144e-05, 2.1426325602647012e-08, 1.4225844502391283e-08, 1.0958768115187922e-08 ], "gamma_dfa": 0.0003295415808679536, "gamma_dfa_per_layer": [ -0.0008024196140468121, 0.0015490652294829488, 0.0003235205076634884, 0.0002480002003721893 ], "acc_eval": 0.2568359375, "loss_eval": 2.0367085933685303, "epoch": 46 }, { "hidden_norms_cls": [ 46.14581298828125, 37542628.0, 38211032.0, 46396536.0, 60543468.0 ], "hidden_norms_avg": [ 988.5308837890625, 31589698.0, 33421126.0, 44806960.0, 60355708.0 ], "bp_grad_per_sample_l2_med": [ 2.7766556740971282e-05, 4.28473617697378e-10, 3.07322972625812e-10, 2.9381372335102185e-10, 2.797302944834712e-10 ], "bp_grad_F": [ 0.06864868849515915, 3.788271715166047e-05, 2.1370066605186366e-08, 1.4025233419090455e-08, 1.1044066994259083e-08 ], "gamma_dfa": 9.462468733545393e-05, "gamma_dfa_per_layer": [ -0.0015880623832345009, 0.0014036648208275437, 0.0003099621389992535, 0.00025293417274951935 ], "acc_eval": 0.244140625, "loss_eval": 2.0631895065307617, "epoch": 47 }, { "hidden_norms_cls": [ 46.26278305053711, 38372568.0, 39046204.0, 47148944.0, 61308416.0 ], "hidden_norms_avg": [ 991.4658813476562, 31279712.0, 33238512.0, 44902484.0, 60826544.0 ], "bp_grad_per_sample_l2_med": [ 2.812536695273593e-05, 4.3919237691092405e-10, 3.053821084897379e-10, 2.9203767182295337e-10, 2.833127066281804e-10 ], "bp_grad_F": [ 0.011117708869278431, 2.0018645955133252e-05, 1.9244726701117543e-08, 1.4165241424279884e-08, 1.090406964721069e-08 ], "gamma_dfa": 0.00016991631855489686, "gamma_dfa_per_layer": [ -0.0015358870150521398, 0.0016542371595278382, 0.0003059905138798058, 0.00025532461586408317 ], "acc_eval": 0.2548828125, "loss_eval": 2.0491740703582764, "epoch": 48 }, { "hidden_norms_cls": [ 46.36857223510742, 38788812.0, 39461172.0, 47582644.0, 61831224.0 ], "hidden_norms_avg": [ 994.04541015625, 32215950.0, 34096260.0, 45599356.0, 61425516.0 ], "bp_grad_per_sample_l2_med": [ 3.0041363061172888e-05, 4.480187609789965e-10, 3.0562316566395964e-10, 2.9085803210371353e-10, 2.820148004012424e-10 ], "bp_grad_F": [ 0.03149434179067612, 6.209969433257356e-05, 2.1469357847081483e-08, 1.3228349970972886e-08, 1.092844392758252e-08 ], "gamma_dfa": 0.00010758559074020013, "gamma_dfa_per_layer": [ -0.0014505982398986816, 0.001327117788605392, 0.0002981229918077588, 0.0002556998224463314 ], "acc_eval": 0.244140625, "loss_eval": 2.0554656982421875, "epoch": 49 }, { "hidden_norms_cls": [ 46.4505729675293, 38845108.0, 39504860.0, 47660992.0, 62097052.0 ], "hidden_norms_avg": [ 996.2877807617188, 32178676.0, 34106748.0, 45494312.0, 61553340.0 ], "bp_grad_per_sample_l2_med": [ 3.0276962206698954e-05, 4.5564105266571175e-10, 3.0059965627771135e-10, 2.8785077099691136e-10, 2.794499076586021e-10 ], "bp_grad_F": [ 0.011724308133125305, 1.9755616449401714e-05, 2.1592299503936374e-08, 1.3796129572085647e-08, 1.0886693324607677e-08 ], "gamma_dfa": 0.0002330350544070825, "gamma_dfa_per_layer": [ -0.0009828422917053103, 0.0013922813814133406, 0.00027237151516601443, 0.00025032961275428534 ], "acc_eval": 0.2578125, "loss_eval": 2.0504729747772217, "epoch": 50 }, { "hidden_norms_cls": [ 46.521934509277344, 39260604.0, 39906660.0, 48073644.0, 62524844.0 ], "hidden_norms_avg": [ 998.1359252929688, 32138106.0, 34129788.0, 45757544.0, 61958428.0 ], "bp_grad_per_sample_l2_med": [ 2.9659293431905098e-05, 4.597033309572396e-10, 3.0463259692581346e-10, 2.893623118893629e-10, 2.780784769118583e-10 ], "bp_grad_F": [ 0.009033501148223877, 1.7998809198616073e-05, 2.5067617315244206e-08, 1.8738653295713448e-08, 1.087139978039886e-08 ], "gamma_dfa": 0.00016801172751002014, "gamma_dfa_per_layer": [ -0.0013465819647535682, 0.0014174225507304072, 0.00031502131605520844, 0.00028618500800803304 ], "acc_eval": 0.255859375, "loss_eval": 2.0473151206970215, "epoch": 51 }, { "hidden_norms_cls": [ 46.57882308959961, 39427768.0, 40090548.0, 48369740.0, 62859588.0 ], "hidden_norms_avg": [ 999.5881958007812, 32546802.0, 34502940.0, 46179212.0, 62426560.0 ], "bp_grad_per_sample_l2_med": [ 3.0221139240893535e-05, 4.495410987903625e-10, 3.065779852207129e-10, 2.9148336522233365e-10, 2.8107866034687845e-10 ], "bp_grad_F": [ 0.016372976824641228, 2.868929186661262e-05, 2.4158071099122935e-08, 2.1377838166358742e-08, 1.0851396226030374e-08 ], "gamma_dfa": 0.00012949823576491326, "gamma_dfa_per_layer": [ -0.0014246907085180283, 0.0013606694992631674, 0.0003105594660155475, 0.0002714546862989664 ], "acc_eval": 0.2568359375, "loss_eval": 2.0468568801879883, "epoch": 52 }, { "hidden_norms_cls": [ 46.621891021728516, 39709320.0, 40367452.0, 48619224.0, 63258040.0 ], "hidden_norms_avg": [ 1000.7721557617188, 33325650.0, 35170832.0, 47006208.0, 63117408.0 ], "bp_grad_per_sample_l2_med": [ 3.0193185011739843e-05, 4.388156504830931e-10, 3.137757831339627e-10, 2.8996427481331466e-10, 2.7836044580453745e-10 ], "bp_grad_F": [ 0.020163528621196747, 3.054905027966015e-05, 2.3064796295102497e-08, 1.4526934322134366e-08, 1.0852998499899513e-08 ], "gamma_dfa": 0.00017183857562486082, "gamma_dfa_per_layer": [ -0.0013185564894229174, 0.0014156483812257648, 0.00031098624458536506, 0.00027927616611123085 ], "acc_eval": 0.2529296875, "loss_eval": 2.054586410522461, "epoch": 53 }, { "hidden_norms_cls": [ 46.65864562988281, 39798476.0, 40463920.0, 48764504.0, 63346472.0 ], "hidden_norms_avg": [ 1001.6641845703125, 33379128.0, 35239452.0, 46955488.0, 63122060.0 ], "bp_grad_per_sample_l2_med": [ 2.965362000395544e-05, 4.4001230437018535e-10, 3.0546970508638083e-10, 2.8820767994375274e-10, 2.777780505613947e-10 ], "bp_grad_F": [ 0.048469845205545425, 4.790218736161478e-05, 2.6222814142329298e-08, 2.4079582772174035e-08, 1.0861339383438917e-08 ], "gamma_dfa": -6.432890222640708e-05, "gamma_dfa_per_layer": [ -0.002126228529959917, 0.0012497524730861187, 0.00034036440774798393, 0.0002787960402201861 ], "acc_eval": 0.2509765625, "loss_eval": 2.0531256198883057, "epoch": 54 }, { "hidden_norms_cls": [ 46.683528900146484, 39922192.0, 40544356.0, 48855360.0, 63435588.0 ], "hidden_norms_avg": [ 1002.31494140625, 33437468.0, 35316604.0, 47039952.0, 63236136.0 ], "bp_grad_per_sample_l2_med": [ 2.79724281426752e-05, 4.357196548010478e-10, 3.0789479299464517e-10, 2.8999944112761966e-10, 2.7672003577450255e-10 ], "bp_grad_F": [ 0.009082098491489887, 6.448025487770792e-06, 2.3372145108169207e-08, 1.58603672417712e-08, 1.0855457865943663e-08 ], "gamma_dfa": 8.819025242701173e-05, "gamma_dfa_per_layer": [ -0.0015805144794285297, 0.0013432127889245749, 0.000321696512401104, 0.00026836618781089783 ], "acc_eval": 0.2529296875, "loss_eval": 2.0517051219940186, "epoch": 55 }, { "hidden_norms_cls": [ 46.70249938964844, 40094040.0, 40695052.0, 48969004.0, 63542232.0 ], "hidden_norms_avg": [ 1002.7830810546875, 33826664.0, 35653116.0, 47279168.0, 63409756.0 ], "bp_grad_per_sample_l2_med": [ 2.8208709409227595e-05, 4.3868975119210063e-10, 3.102354484418868e-10, 2.8893865078316594e-10, 2.794520170823489e-10 ], "bp_grad_F": [ 0.012775770388543606, 3.5907680285163224e-05, 3.276610627267473e-08, 1.9733393585852355e-08, 1.0837335473468102e-08 ], "gamma_dfa": -7.604052370879799e-06, "gamma_dfa_per_layer": [ -0.0020841513760387897, 0.001464233035221696, 0.0003138828033115715, 0.0002756193280220032 ], "acc_eval": 0.2509765625, "loss_eval": 2.053762912750244, "epoch": 56 }, { "hidden_norms_cls": [ 46.71390914916992, 39990840.0, 40613704.0, 48947088.0, 63626668.0 ], "hidden_norms_avg": [ 1003.0780639648438, 33512400.0, 35398544.0, 47052320.0, 63319172.0 ], "bp_grad_per_sample_l2_med": [ 2.8852005925728008e-05, 4.408986231663192e-10, 3.0767774439333095e-10, 2.8811911190196327e-10, 2.780060626150771e-10 ], "bp_grad_F": [ 0.017775027081370354, 2.9518716473830864e-05, 1.6785485001946654e-08, 1.3991450664718741e-08, 1.082214762249123e-08 ], "gamma_dfa": 0.0001292051310883835, "gamma_dfa_per_layer": [ -0.001528067048639059, 0.0014583747833967209, 0.0003044582554139197, 0.0002820545341819525 ], "acc_eval": 0.2548828125, "loss_eval": 2.0512585639953613, "epoch": 57 }, { "hidden_norms_cls": [ 46.72029495239258, 40048976.0, 40673908.0, 49005780.0, 63650516.0 ], "hidden_norms_avg": [ 1003.2393188476562, 33518072.0, 35408260.0, 47059300.0, 63337588.0 ], "bp_grad_per_sample_l2_med": [ 3.040391493414063e-05, 4.422071042675668e-10, 3.0922153726464785e-10, 2.885988392709038e-10, 2.7767882437856883e-10 ], "bp_grad_F": [ 0.05996337905526161, 4.702213846030645e-05, 2.0060964445178797e-08, 1.6814832193290385e-08, 1.0825355722943186e-08 ], "gamma_dfa": 6.977042357902974e-05, "gamma_dfa_per_layer": [ -0.0016858375165611506, 0.001342209754511714, 0.00032920570811256766, 0.00029350374825298786 ], "acc_eval": 0.25390625, "loss_eval": 2.0525753498077393, "epoch": 58 }, { "hidden_norms_cls": [ 46.723426818847656, 40078224.0, 40696452.0, 49005116.0, 63676392.0 ], "hidden_norms_avg": [ 1003.3213500976562, 33528454.0, 35420932.0, 47084140.0, 63362884.0 ], "bp_grad_per_sample_l2_med": [ 2.9969949537189677e-05, 4.438247824811725e-10, 3.0574925924398144e-10, 2.876155424935689e-10, 2.772651552795935e-10 ], "bp_grad_F": [ 0.015555496327579021, 1.9468383470666595e-05, 2.2645199493354085e-08, 2.0153352764396004e-08, 1.082723954937137e-08 ], "gamma_dfa": -2.766123361652717e-05, "gamma_dfa_per_layer": [ -0.0021022262517362833, 0.0013793597463518381, 0.0003187692491337657, 0.0002934523217845708 ], "acc_eval": 0.2529296875, "loss_eval": 2.05129337310791, "epoch": 59 }, { "hidden_norms_cls": [ 46.72323226928711, 40073516.0, 40694276.0, 48970848.0, 63674696.0 ], "hidden_norms_avg": [ 1003.3206176757812, 33517796.0, 35411552.0, 47074216.0, 63356572.0 ], "bp_grad_per_sample_l2_med": [ 2.986433173646219e-05, 4.4209438887499175e-10, 3.069269838285038e-10, 2.8717661582078335e-10, 2.7721389073143143e-10 ], "bp_grad_F": [ 0.011835500597953796, 1.2977254300494678e-05, 2.7325663509714104e-08, 2.23609397664859e-08, 1.0828303587118171e-08 ], "gamma_dfa": 4.879416519543156e-05, "gamma_dfa_per_layer": [ -0.0018596879672259092, 0.0014319919282570481, 0.0003201703366357833, 0.00030270236311480403 ], "acc_eval": 0.2529296875, "loss_eval": 2.051326274871826, "epoch": 60 } ] }