diff options
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_fa_s42.json')
| -rw-r--r-- | results/snapshot_evolution_v2/snapshot_fa_s42.json | 2734 |
1 files changed, 2734 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_fa_s42.json b/results/snapshot_evolution_v2/snapshot_fa_s42.json new file mode 100644 index 0000000..277acec --- /dev/null +++ b/results/snapshot_evolution_v2/snapshot_fa_s42.json @@ -0,0 +1,2734 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": NaN, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 1156.72998046875, + 7932.5859375, + 11656.220703125, + 13101.765625, + 12094.2197265625 + ], + "bp_grad_norms_per_sample_med": [ + 1.5287704400179791e-06, + 8.219874985115894e-07, + 8.303726986014226e-07, + 8.411634553340264e-07, + 8.074007382674608e-07 + ], + "bp_grad_norms_F": [ + 0.0005889489548280835, + 0.0001249020715476945, + 0.00010261647548759356, + 8.311456622323021e-05, + 6.362409476423636e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2431640625, + "loss_eval": 2.0429816246032715, + "epoch": 1 + }, + { + "hidden_norms": [ + 2267.652099609375, + 33227.19921875, + 62863.03515625, + 73248.0546875, + 64100.21875 + ], + "bp_grad_norms_per_sample_med": [ + 6.826750791333325e-07, + 1.582481274908787e-07, + 1.5909284911685972e-07, + 1.6235998145930353e-07, + 1.57003455569793e-07 + ], + "bp_grad_norms_F": [ + 9.194230369757861e-05, + 3.062757241423242e-05, + 2.5034905775100924e-05, + 1.2339382010395639e-05, + 1.1088715837104246e-05 + ], + "gamma_dfa": NaN, + "acc_eval": 0.234375, + "loss_eval": 2.053070068359375, + "epoch": 2 + }, + { + "hidden_norms": [ + 3317.195556640625, + 69574.59375, + 208893.703125, + 272473.75, + 236858.453125 + ], + "bp_grad_norms_per_sample_med": [ + 5.585509370575892e-07, + 5.853191709093153e-08, + 5.772180244889569e-08, + 5.9099026117337417e-08, + 5.743537911939711e-08 + ], + "bp_grad_norms_F": [ + 5.4304215154843405e-05, + 1.798659286578186e-05, + 6.792580734327203e-06, + 5.748081548517803e-06, + 5.4292308959702495e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2529296875, + "loss_eval": 2.109177350997925, + "epoch": 3 + }, + { + "hidden_norms": [ + 4279.80322265625, + 131147.296875, + 524522.6875, + 669556.125, + 582199.5 + ], + "bp_grad_norms_per_sample_med": [ + 4.5417544924930553e-07, + 2.7819011094720736e-08, + 2.7284025705398562e-08, + 2.7924896173203706e-08, + 2.717020919362767e-08 + ], + "bp_grad_norms_F": [ + 2.7083517124992795e-05, + 3.1135298286244506e-06, + 2.188051212215214e-06, + 1.643483983571059e-06, + 1.5356297353719128e-06 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2314453125, + "loss_eval": 2.1304922103881836, + "epoch": 4 + }, + { + "hidden_norms": [ + 5095.1298828125, + 222828.6875, + 891649.1875, + 1124229.75, + 978070.3125 + ], + "bp_grad_norms_per_sample_med": [ + 3.9661114215050475e-07, + 1.7936926610673254e-08, + 1.787710601774961e-08, + 1.8164961090860743e-08, + 1.7773361449258118e-08 + ], + "bp_grad_norms_F": [ + 2.5229386665159836e-05, + 1.7291312133238534e-06, + 8.046768016356509e-07, + 6.81868698393373e-07, + 6.581432785424113e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2275390625, + "loss_eval": 2.1189823150634766, + "epoch": 5 + }, + { + "hidden_norms": [ + 5762.8369140625, + 345252.125, + 1352057.25, + 1685390.25, + 1472510.375 + ], + "bp_grad_norms_per_sample_med": [ + 3.5811123666462663e-07, + 1.2679316263586315e-08, + 1.2558022177699968e-08, + 1.2735733356805667e-08, + 1.2553626582700872e-08 + ], + "bp_grad_norms_F": [ + 1.9819366571027786e-05, + 7.985001957422355e-07, + 4.666244706186262e-07, + 4.659337093926297e-07, + 4.531105162186577e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2314453125, + "loss_eval": 2.1147799491882324, + "epoch": 6 + }, + { + "hidden_norms": [ + 6342.46337890625, + 489436.21875, + 1846600.125, + 2298539.25, + 2010095.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.2295056939801725e-07, + 9.47152134500584e-09, + 9.449903082270339e-09, + 9.579181003971371e-09, + 9.398083200551355e-09 + ], + "bp_grad_norms_F": [ + 1.761323437676765e-05, + 3.5219920846429886e-07, + 3.464733993041591e-07, + 3.515923765462503e-07, + 3.4331398524045653e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.263671875, + "loss_eval": 2.0468926429748535, + "epoch": 7 + }, + { + "hidden_norms": [ + 6895.3232421875, + 642604.125, + 2340199.25, + 2912852.0, + 2551695.75 + ], + "bp_grad_norms_per_sample_med": [ + 3.2115181625158584e-07, + 8.011411978259275e-09, + 8.093356207439228e-09, + 8.185297772911326e-09, + 8.036058929405954e-09 + ], + "bp_grad_norms_F": [ + 1.6510130080860108e-05, + 2.8924068828928284e-07, + 2.88436524442659e-07, + 2.9188095140852965e-07, + 2.860562631212815e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2373046875, + "loss_eval": 2.0705394744873047, + "epoch": 8 + }, + { + "hidden_norms": [ + 7418.32666015625, + 802952.8125, + 2905706.5, + 3629847.25, + 3176127.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9990744110364176e-07, + 6.746414982217175e-09, + 6.801009533319302e-09, + 6.844500521907548e-09, + 6.780156436292373e-09 + ], + "bp_grad_norms_F": [ + 1.5715995687060058e-05, + 2.419061502223485e-07, + 2.416737459043361e-07, + 2.441595654545381e-07, + 2.39673738633428e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.271484375, + "loss_eval": 2.03157901763916, + "epoch": 9 + }, + { + "hidden_norms": [ + 8026.80126953125, + 964342.4375, + 3455197.75, + 4322591.0, + 3777789.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.9810524893036927e-07, + 5.931947377746383e-09, + 5.9767870652649435e-09, + 6.012730313642578e-09, + 5.922320855944463e-09 + ], + "bp_grad_norms_F": [ + 1.546428757137619e-05, + 2.1311132059054216e-07, + 2.1318879817044945e-07, + 2.1529912430651166e-07, + 2.115393868962201e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2421875, + "loss_eval": 2.029039144515991, + "epoch": 10 + }, + { + "hidden_norms": [ + 8568.4677734375, + 1146051.75, + 4149878.75, + 5211595.5, + 4551772.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.77834743656058e-07, + 5.156825633179096e-09, + 5.185044393840599e-09, + 5.243859568793141e-09, + 5.148059312176656e-09 + ], + "bp_grad_norms_F": [ + 1.4489689419860952e-05, + 1.8374593935277517e-07, + 1.8364994502917398e-07, + 1.8539546431384224e-07, + 1.8235705567803961e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.279296875, + "loss_eval": 2.015061855316162, + "epoch": 11 + }, + { + "hidden_norms": [ + 9099.6689453125, + 1306440.25, + 4712579.5, + 5930700.5, + 5167806.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.789404618397384e-07, + 4.740023484828271e-09, + 4.688871069191691e-09, + 4.722021884617789e-09, + 4.664129082954105e-09 + ], + "bp_grad_norms_F": [ + 1.440922096662689e-05, + 1.6886964715467911e-07, + 1.6845007166921278e-07, + 1.6997903173887607e-07, + 1.673002003599322e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.279296875, + "loss_eval": 2.0080716609954834, + "epoch": 12 + }, + { + "hidden_norms": [ + 9619.3310546875, + 1468314.25, + 5278606.0, + 6647205.0, + 5776389.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.678217470020172e-07, + 4.431488953571261e-09, + 4.461886859985498e-09, + 4.481298443437254e-09, + 4.434627776106481e-09 + ], + "bp_grad_norms_F": [ + 1.4280021787271835e-05, + 1.5716064183379785e-07, + 1.5650925888621714e-07, + 1.5793726504398364e-07, + 1.5547414022876183e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.294921875, + "loss_eval": 2.003105401992798, + "epoch": 13 + }, + { + "hidden_norms": [ + 10185.365234375, + 1637280.875, + 5941891.0, + 7477497.0, + 6482495.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.580181046596408e-07, + 4.108497098087582e-09, + 4.027958855346014e-09, + 4.0670666834330405e-09, + 4.01310229491969e-09 + ], + "bp_grad_norms_F": [ + 1.3607143955596257e-05, + 1.4447114438098652e-07, + 1.4335948606003512e-07, + 1.4459322983384482e-07, + 1.424295135166176e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2841796875, + "loss_eval": 1.9895731210708618, + "epoch": 14 + }, + { + "hidden_norms": [ + 10773.4443359375, + 1777185.125, + 6485962.5, + 8158632.5, + 7057802.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.536919225804013e-07, + 3.8119583045670424e-09, + 3.815232130222057e-09, + 3.836773565524254e-09, + 3.790971536687948e-09 + ], + "bp_grad_norms_F": [ + 1.3741724615101703e-05, + 1.3785883368200302e-07, + 1.3661090747518756e-07, + 1.3781669849777245e-07, + 1.3573732360327995e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.263671875, + "loss_eval": 2.0124382972717285, + "epoch": 15 + }, + { + "hidden_norms": [ + 11403.58984375, + 1931677.0, + 7089585.5, + 8906384.0, + 7683122.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.446777500608732e-07, + 3.674859083702131e-09, + 3.648833679648078e-09, + 3.6761997890266684e-09, + 3.624884392650074e-09 + ], + "bp_grad_norms_F": [ + 1.3561247214965988e-05, + 1.2985380237751087e-07, + 1.2829688955662277e-07, + 1.294151275033073e-07, + 1.2746555455578346e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.26953125, + "loss_eval": 2.0030646324157715, + "epoch": 16 + }, + { + "hidden_norms": [ + 12115.1162109375, + 2091857.0, + 7735447.5, + 9727085.0, + 8371443.5 + ], + "bp_grad_norms_per_sample_med": [ + 2.378987460360804e-07, + 3.4695852857424825e-09, + 3.42812689346772e-09, + 3.4526042025362358e-09, + 3.40047856539627e-09 + ], + "bp_grad_norms_F": [ + 1.3279566701385193e-05, + 1.2257437731477694e-07, + 1.2078584177288576e-07, + 1.2181956776657898e-07, + 1.1999593141354126e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2939453125, + "loss_eval": 1.9935777187347412, + "epoch": 17 + }, + { + "hidden_norms": [ + 12755.7646484375, + 2248501.0, + 8338276.5, + 10490721.0, + 8991669.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.3127104498144035e-07, + 3.35100103221464e-09, + 3.3095433060736923e-09, + 3.326423581029303e-09, + 3.2682878625678313e-09 + ], + "bp_grad_norms_F": [ + 1.3015700460528024e-05, + 1.1814677947086238e-07, + 1.1589928305966168e-07, + 1.1685516199122503e-07, + 1.1511789210771894e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2900390625, + "loss_eval": 1.9912320375442505, + "epoch": 18 + }, + { + "hidden_norms": [ + 13395.4189453125, + 2393670.0, + 8949124.0, + 11235038.0, + 9603954.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.2520477216403378e-07, + 3.2867890631393948e-09, + 3.2246825210080488e-09, + 3.250592239822936e-09, + 3.201830800492189e-09 + ], + "bp_grad_norms_F": [ + 1.3049841072643176e-05, + 1.1301781910333375e-07, + 1.1090982354744483e-07, + 1.1187000836798688e-07, + 1.101881252907333e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2626953125, + "loss_eval": 2.0112197399139404, + "epoch": 19 + }, + { + "hidden_norms": [ + 14034.6982421875, + 2529761.5, + 9576616.0, + 12035853.0, + 10258897.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.1533313088184514e-07, + 3.174721152632287e-09, + 3.1246687459685063e-09, + 3.149874805430386e-09, + 3.09314329705046e-09 + ], + "bp_grad_norms_F": [ + 1.26855793496361e-05, + 1.0948959072720754e-07, + 1.0680034279175743e-07, + 1.0768705749342189e-07, + 1.0610038714276016e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.25, + "loss_eval": 2.0056447982788086, + "epoch": 20 + }, + { + "hidden_norms": [ + 14717.9462890625, + 2650771.25, + 10157696.0, + 12784758.0, + 10849881.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.086567434389508e-07, + 2.999795301050767e-09, + 2.966421552841325e-09, + 2.9786708655166194e-09, + 2.947827537624903e-09 + ], + "bp_grad_norms_F": [ + 1.2321271242399234e-05, + 1.0535904237940485e-07, + 1.0280631101977633e-07, + 1.0365675251478024e-07, + 1.021143916091205e-07 + ], + "gamma_dfa": NaN, + "acc_eval": 0.294921875, + "loss_eval": 1.9869788885116577, + "epoch": 21 + }, + { + "hidden_norms": [ + 15327.8466796875, + 2777500.75, + 10776735.0, + 13573723.0, + 11474654.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.0232576503076416e-07, + 2.9384910060770153e-09, + 2.867603710043909e-09, + 2.8935454032819052e-09, + 2.8441446975335793e-09 + ], + "bp_grad_norms_F": [ + 1.231426631420618e-05, + 1.0333050681765599e-07, + 1.0039466502576033e-07, + 1.0124550442469626e-07, + 9.972216474807283e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2939453125, + "loss_eval": 1.9892809391021729, + "epoch": 22 + }, + { + "hidden_norms": [ + 15945.8837890625, + 2878910.75, + 11304857.0, + 14241028.0, + 11994238.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.0171727044271393e-07, + 2.9479860774728195e-09, + 2.8580404709543927e-09, + 2.8716116151628057e-09, + 2.8270419338838337e-09 + ], + "bp_grad_norms_F": [ + 1.2025901924062055e-05, + 1.0096052704966496e-07, + 9.789676624905042e-08, + 9.872773176766714e-08, + 9.722123195388122e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2802734375, + "loss_eval": 1.9858973026275635, + "epoch": 23 + }, + { + "hidden_norms": [ + 16595.853515625, + 3002464.5, + 11949546.0, + 15061732.0, + 12646630.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.9120048477816454e-07, + 2.8694004949869623e-09, + 2.772703400211185e-09, + 2.777924779095997e-09, + 2.7492945697815685e-09 + ], + "bp_grad_norms_F": [ + 1.2024025636492297e-05, + 9.894926478182242e-08, + 9.581360416177631e-08, + 9.663772715384766e-08, + 9.51538083882042e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.296875, + "loss_eval": 1.9969089031219482, + "epoch": 24 + }, + { + "hidden_norms": [ + 17227.1640625, + 3125553.25, + 12574712.0, + 15844785.0, + 13247150.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8941717883080855e-07, + 2.8377846739147117e-09, + 2.7375035571708395e-09, + 2.7606503749666444e-09, + 2.7206534802814986e-09 + ], + "bp_grad_norms_F": [ + 1.153391167463269e-05, + 9.671435208247203e-08, + 9.34372863525823e-08, + 9.424089597587226e-08, + 9.280081059159784e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.294921875, + "loss_eval": 1.9766383171081543, + "epoch": 25 + }, + { + "hidden_norms": [ + 17808.20703125, + 3256055.25, + 13319775.0, + 16758460.0, + 13956453.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8628608700055338e-07, + 2.7554525328099544e-09, + 2.625358597185823e-09, + 2.6348250248275917e-09, + 2.614828797931068e-09 + ], + "bp_grad_norms_F": [ + 1.0964491593767889e-05, + 9.419229485274627e-08, + 9.09606185928169e-08, + 9.175563775443152e-08, + 9.03681396380307e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2919921875, + "loss_eval": 1.9645390510559082, + "epoch": 26 + }, + { + "hidden_norms": [ + 18401.28125, + 3393640.75, + 14088409.0, + 17726368.0, + 14707189.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7694672749257734e-07, + 2.722393421805691e-09, + 2.634128470901942e-09, + 2.6627771099185793e-09, + 2.6215960513553682e-09 + ], + "bp_grad_norms_F": [ + 1.1054430615331512e-05, + 9.26544814205954e-08, + 8.924564554035896e-08, + 9.002578593708677e-08, + 8.865336553753878e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2861328125, + "loss_eval": 1.974367618560791, + "epoch": 27 + }, + { + "hidden_norms": [ + 18936.51953125, + 3515726.25, + 14734875.0, + 18530786.0, + 15301454.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7923295558830432e-07, + 2.6605673220103654e-09, + 2.530292642077825e-09, + 2.5396913461150916e-09, + 2.517351882502794e-09 + ], + "bp_grad_norms_F": [ + 1.1157896551594604e-05, + 9.233546904852119e-08, + 8.888883229474231e-08, + 8.968125086994405e-08, + 8.831575115664236e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.2841796875, + "loss_eval": 1.986099362373352, + "epoch": 28 + }, + { + "hidden_norms": [ + 19457.962890625, + 3664789.5, + 15342228.0, + 19308666.0, + 15894652.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7488744674665213e-07, + 2.6636790551037848e-09, + 2.4992619085395518e-09, + 2.507181573463413e-09, + 2.486318262384657e-09 + ], + "bp_grad_norms_F": [ + 1.092042657546699e-05, + 9.157383118463258e-08, + 8.810303597783786e-08, + 8.888122238204232e-08, + 8.75455583582152e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9868172407150269, + "epoch": 29 + }, + { + "hidden_norms": [ + 19933.78515625, + 3775119.25, + 16017107.0, + 20154288.0, + 16541561.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.715164188453855e-07, + 2.5937807457410145e-09, + 2.4676627408126706e-09, + 2.4873916260048645e-09, + 2.4605657511500567e-09 + ], + "bp_grad_norms_F": [ + 1.0760413715615869e-05, + 9.029215419786851e-08, + 8.696353148707203e-08, + 8.772182269467521e-08, + 8.64171596504093e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.291015625, + "loss_eval": 1.9754526615142822, + "epoch": 30 + }, + { + "hidden_norms": [ + 20432.466796875, + 3910461.25, + 16712518.0, + 21021696.0, + 17196572.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.710603356741558e-07, + 2.6387678708772455e-09, + 2.524718212271182e-09, + 2.5378650292395832e-09, + 2.5052109275947032e-09 + ], + "bp_grad_norms_F": [ + 1.0587626093183644e-05, + 8.93876332952459e-08, + 8.59824282883892e-08, + 8.675493745613494e-08, + 8.546451368829366e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3076171875, + "loss_eval": 1.9657469987869263, + "epoch": 31 + }, + { + "hidden_norms": [ + 20875.439453125, + 4054334.0, + 17463474.0, + 21948092.0, + 17887228.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.729485461510194e-07, + 2.6252673368531987e-09, + 2.4720219204965588e-09, + 2.491059358789016e-09, + 2.4621127359125694e-09 + ], + "bp_grad_norms_F": [ + 1.0830392966454383e-05, + 8.912193294463577e-08, + 8.547249308321625e-08, + 8.626851411008829e-08, + 8.495522507701025e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.31640625, + "loss_eval": 1.9752991199493408, + "epoch": 32 + }, + { + "hidden_norms": [ + 21372.0234375, + 4181554.25, + 18179600.0, + 22866024.0, + 18562826.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6644050049308134e-07, + 2.5652076018900516e-09, + 2.4415069965755265e-09, + 2.4562532008332028e-09, + 2.423905742787724e-09 + ], + "bp_grad_norms_F": [ + 1.0476498573552817e-05, + 8.780278903941507e-08, + 8.420673225373321e-08, + 8.501019266304866e-08, + 8.373319104748589e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.9647243022918701, + "epoch": 33 + }, + { + "hidden_norms": [ + 21698.390625, + 4323451.5, + 18873394.0, + 23742746.0, + 19211736.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6982900774564769e-07, + 2.6139097553112833e-09, + 2.4535891096633122e-09, + 2.465766257842006e-09, + 2.4349082750063644e-09 + ], + "bp_grad_norms_F": [ + 1.0547244528424926e-05, + 8.761546865798664e-08, + 8.380350635661671e-08, + 8.460440881208342e-08, + 8.332586531878405e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.9688763618469238, + "epoch": 34 + }, + { + "hidden_norms": [ + 22000.6484375, + 4419910.5, + 19288578.0, + 24275390.0, + 19571482.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6632812105399353e-07, + 2.5976403250638214e-09, + 2.4608304283191273e-09, + 2.4786184216196716e-09, + 2.4511619400868767e-09 + ], + "bp_grad_norms_F": [ + 1.0402384759800043e-05, + 8.75945431744185e-08, + 8.378519567031617e-08, + 8.458554390244899e-08, + 8.331597456390227e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.962469458580017, + "epoch": 35 + }, + { + "hidden_norms": [ + 22332.140625, + 4505425.5, + 19876824.0, + 24999434.0, + 20098762.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.673159886195208e-07, + 2.5706452522200607e-09, + 2.4236175288905315e-09, + 2.4205843995872556e-09, + 2.4001298726261666e-09 + ], + "bp_grad_norms_F": [ + 1.0201652912655845e-05, + 8.668673245892933e-08, + 8.301810083821692e-08, + 8.384706973174616e-08, + 8.257533323785538e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3046875, + "loss_eval": 1.9482183456420898, + "epoch": 36 + }, + { + "hidden_norms": [ + 22704.90625, + 4601120.5, + 20416742.0, + 25650594.0, + 20558608.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6260217705621471e-07, + 2.501829188261695e-09, + 2.37497355115579e-09, + 2.379827890308661e-09, + 2.364261231235787e-09 + ], + "bp_grad_norms_F": [ + 1.0307686352462042e-05, + 8.687224806180893e-08, + 8.317324073914278e-08, + 8.40014422465174e-08, + 8.273995177887628e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.306640625, + "loss_eval": 1.9718880653381348, + "epoch": 37 + }, + { + "hidden_norms": [ + 22953.462890625, + 4708118.5, + 21018216.0, + 26396430.0, + 21081344.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6642815126033383e-07, + 2.5344910614677474e-09, + 2.3881991939589398e-09, + 2.393568676595237e-09, + 2.366601137282487e-09 + ], + "bp_grad_norms_F": [ + 1.0291260878148023e-05, + 8.597661604881068e-08, + 8.222435354809932e-08, + 8.30701907261755e-08, + 8.179645050176987e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3173828125, + "loss_eval": 1.9656648635864258, + "epoch": 38 + }, + { + "hidden_norms": [ + 23329.68359375, + 4813138.0, + 21547542.0, + 27050624.0, + 21536360.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6755477361130033e-07, + 2.5133575221047977e-09, + 2.3339741250794077e-09, + 2.3630628565030065e-09, + 2.3331871989995534e-09 + ], + "bp_grad_norms_F": [ + 1.0207740160694811e-05, + 8.593145395252577e-08, + 8.217772773377874e-08, + 8.303662468733819e-08, + 8.176558452532845e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3076171875, + "loss_eval": 1.9581431150436401, + "epoch": 39 + }, + { + "hidden_norms": [ + 23598.361328125, + 4903029.0, + 22069792.0, + 27713646.0, + 21984984.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6272531411232194e-07, + 2.4648321161890863e-09, + 2.360529327560812e-09, + 2.364856310776986e-09, + 2.3259458803437383e-09 + ], + "bp_grad_norms_F": [ + 1.0116659723280463e-05, + 8.537404028174933e-08, + 8.159113207284463e-08, + 8.246142613188567e-08, + 8.120937167177544e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3212890625, + "loss_eval": 1.9615185260772705, + "epoch": 40 + }, + { + "hidden_norms": [ + 23904.275390625, + 5004298.0, + 22611816.0, + 28369744.0, + 22444866.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6563248550482967e-07, + 2.5165425299178423e-09, + 2.3475779098447447e-09, + 2.3561286255358027e-09, + 2.3397561665916555e-09 + ], + "bp_grad_norms_F": [ + 1.0093037417391315e-05, + 8.496893855181042e-08, + 8.129408968216012e-08, + 8.217033098389948e-08, + 8.091691228173659e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3056640625, + "loss_eval": 1.9596519470214844, + "epoch": 41 + }, + { + "hidden_norms": [ + 24124.95703125, + 5079679.0, + 23056108.0, + 28905466.0, + 22810520.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.650763863381144e-07, + 2.5150639348936465e-09, + 2.375127650111608e-09, + 2.3864086262648243e-09, + 2.3595001508169844e-09 + ], + "bp_grad_norms_F": [ + 1.0080430001835339e-05, + 8.473855928059493e-08, + 8.099364379177132e-08, + 8.18785963474511e-08, + 8.06336757364079e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3251953125, + "loss_eval": 1.9462497234344482, + "epoch": 42 + }, + { + "hidden_norms": [ + 24350.154296875, + 5170977.5, + 23526890.0, + 29466298.0, + 23191828.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6226854882006592e-07, + 2.5123039204544284e-09, + 2.381558061870237e-09, + 2.391710607341224e-09, + 2.3734676446451886e-09 + ], + "bp_grad_norms_F": [ + 1.0192407899012323e-05, + 8.457134015316115e-08, + 8.096912296196024e-08, + 8.18817795789073e-08, + 8.06216249316094e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.950229287147522, + "epoch": 43 + }, + { + "hidden_norms": [ + 24543.87890625, + 5230886.0, + 23931748.0, + 29937192.0, + 23499106.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6538373870389478e-07, + 2.4975805867910594e-09, + 2.3630661871720804e-09, + 2.3725827968945623e-09, + 2.3566677498365607e-09 + ], + "bp_grad_norms_F": [ + 1.0082419976242818e-05, + 8.452050792584487e-08, + 8.1015215869229e-08, + 8.194035672204336e-08, + 8.06845363854336e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.30078125, + "loss_eval": 1.9453504085540771, + "epoch": 44 + }, + { + "hidden_norms": [ + 24711.091796875, + 5298309.0, + 24318082.0, + 30413608.0, + 23808788.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6054062257353507e-07, + 2.4891384509118097e-09, + 2.358970574434238e-09, + 2.368707230360201e-09, + 2.3476884880579973e-09 + ], + "bp_grad_norms_F": [ + 1.0053097867057659e-05, + 8.462841805112475e-08, + 8.112137095395155e-08, + 8.206667700960679e-08, + 8.080490943029872e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3076171875, + "loss_eval": 1.9472556114196777, + "epoch": 45 + }, + { + "hidden_norms": [ + 24881.759765625, + 5378830.0, + 24836314.0, + 31031698.0, + 24231208.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.623594982902432e-07, + 2.4946655852176036e-09, + 2.3718913499948258e-09, + 2.3750907907071905e-09, + 2.3478305966051494e-09 + ], + "bp_grad_norms_F": [ + 1.012617394735571e-05, + 8.473565316080567e-08, + 8.116323613194254e-08, + 8.212452939915238e-08, + 8.085635272436775e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3125, + "loss_eval": 1.9553910493850708, + "epoch": 46 + }, + { + "hidden_norms": [ + 25032.86328125, + 5446721.0, + 25258438.0, + 31534450.0, + 24555236.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.632960788811033e-07, + 2.470913029739563e-09, + 2.316862923734675e-09, + 2.3169177687520914e-09, + 2.3029997908707855e-09 + ], + "bp_grad_norms_F": [ + 9.900480108626653e-06, + 8.452943944803337e-08, + 8.106712812150363e-08, + 8.2038923210348e-08, + 8.077390845073751e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.9489891529083252, + "epoch": 47 + }, + { + "hidden_norms": [ + 25306.201171875, + 5468743.5, + 25525060.0, + 31867246.0, + 24722362.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5847486167785974e-07, + 2.4746471538605874e-09, + 2.3425053008452323e-09, + 2.3598758502885175e-09, + 2.3311046426499615e-09 + ], + "bp_grad_norms_F": [ + 9.7980091595673e-06, + 8.43976621922593e-08, + 8.096849057892541e-08, + 8.195242884312393e-08, + 8.069165602364592e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3134765625, + "loss_eval": 1.9313395023345947, + "epoch": 48 + }, + { + "hidden_norms": [ + 25419.810546875, + 5521521.5, + 25869234.0, + 32269302.0, + 24978000.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6377224199004559e-07, + 2.4982107493798367e-09, + 2.3510355884326373e-09, + 2.359785478134313e-09, + 2.3393140757832498e-09 + ], + "bp_grad_norms_F": [ + 1.003210672934074e-05, + 8.464159151344575e-08, + 8.12287339613249e-08, + 8.224073155815859e-08, + 8.095251047279817e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3095703125, + "loss_eval": 1.94147527217865, + "epoch": 49 + }, + { + "hidden_norms": [ + 25543.001953125, + 5573999.0, + 26298990.0, + 32786014.0, + 25316304.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.593823384382631e-07, + 2.512666297249666e-09, + 2.392667397543846e-09, + 2.4054993552624637e-09, + 2.386617126148849e-09 + ], + "bp_grad_norms_F": [ + 1.0020607987826224e-05, + 8.429628906014841e-08, + 8.090298564411569e-08, + 8.193208600459911e-08, + 8.064517231787249e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9412651062011719, + "epoch": 50 + }, + { + "hidden_norms": [ + 25755.05859375, + 5633394.5, + 26712786.0, + 33270568.0, + 25632750.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.615333218296655e-07, + 2.483285133081381e-09, + 2.346244309947565e-09, + 2.3569415308344333e-09, + 2.342600557980745e-09 + ], + "bp_grad_norms_F": [ + 9.841775863606017e-06, + 8.406106388747503e-08, + 8.07588094176026e-08, + 8.180128219237304e-08, + 8.051125632846379e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3193359375, + "loss_eval": 1.9356749057769775, + "epoch": 51 + }, + { + "hidden_norms": [ + 25838.6875, + 5676516.5, + 26956640.0, + 33554564.0, + 25797852.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5953406773405732e-07, + 2.4927520048123597e-09, + 2.379676899977312e-09, + 2.3930151193951588e-09, + 2.37515118683973e-09 + ], + "bp_grad_norms_F": [ + 1.0000761903938837e-05, + 8.431718612200712e-08, + 8.108807492135384e-08, + 8.215462798943918e-08, + 8.085050495765245e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.322265625, + "loss_eval": 1.9513205289840698, + "epoch": 52 + }, + { + "hidden_norms": [ + 25925.244140625, + 5739893.0, + 27348932.0, + 34049508.0, + 26115016.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5941535025376652e-07, + 2.4419115618457e-09, + 2.335727167235291e-09, + 2.3481498967470316e-09, + 2.335213800108704e-09 + ], + "bp_grad_norms_F": [ + 9.962137482943945e-06, + 8.399173623274692e-08, + 8.08289613019042e-08, + 8.190350797576684e-08, + 8.060307266077871e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3173828125, + "loss_eval": 1.9443122148513794, + "epoch": 53 + }, + { + "hidden_norms": [ + 26078.8125, + 5808761.5, + 27799278.0, + 34615776.0, + 26499736.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5867621527831943e-07, + 2.4137036813698387e-09, + 2.31744068379669e-09, + 2.327602111051874e-09, + 2.313133462550354e-09 + ], + "bp_grad_norms_F": [ + 9.748204320203513e-06, + 8.347069524461403e-08, + 8.032785814293675e-08, + 8.14167648854891e-08, + 8.011366503524187e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.314453125, + "loss_eval": 1.9361423254013062, + "epoch": 54 + }, + { + "hidden_norms": [ + 26192.453125, + 5875144.0, + 28166196.0, + 35073324.0, + 26791154.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5812705100870517e-07, + 2.4364927853071094e-09, + 2.339390015038134e-09, + 2.3421220518571317e-09, + 2.328011117214146e-09 + ], + "bp_grad_norms_F": [ + 9.899279575620312e-06, + 8.359175751593284e-08, + 8.043829780035594e-08, + 8.154502495472116e-08, + 8.023434361348336e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.306640625, + "loss_eval": 1.940393090248108, + "epoch": 55 + }, + { + "hidden_norms": [ + 26281.6796875, + 5935011.0, + 28625862.0, + 35638648.0, + 27180628.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6062698193763936e-07, + 2.4364579243041362e-09, + 2.3309267849214166e-09, + 2.3373505353418977e-09, + 2.3235424695400297e-09 + ], + "bp_grad_norms_F": [ + 9.917155693983659e-06, + 8.292303022017222e-08, + 7.976373694873473e-08, + 8.087503999831824e-08, + 7.955991776498195e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.945765495300293, + "epoch": 56 + }, + { + "hidden_norms": [ + 26394.865234375, + 5988690.5, + 28944822.0, + 36062032.0, + 27426714.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6303006589168945e-07, + 2.4247555074907723e-09, + 2.309517688203755e-09, + 2.3198174492478074e-09, + 2.3075219512946887e-09 + ], + "bp_grad_norms_F": [ + 1.0007075616158545e-05, + 8.301859821813196e-08, + 7.986342609456187e-08, + 8.099387827087412e-08, + 7.966451676111319e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.9433667659759521, + "epoch": 57 + }, + { + "hidden_norms": [ + 26515.357421875, + 6051740.5, + 29293128.0, + 36499980.0, + 27690768.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5923862406452827e-07, + 2.3941215676615e-09, + 2.28924412759568e-09, + 2.2969097734915067e-09, + 2.280708066848547e-09 + ], + "bp_grad_norms_F": [ + 9.82554138317937e-06, + 8.282027863515395e-08, + 7.976368721074323e-08, + 8.090249536962801e-08, + 7.957222436516531e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.306640625, + "loss_eval": 1.944448709487915, + "epoch": 58 + }, + { + "hidden_norms": [ + 26621.947265625, + 6089471.5, + 29639332.0, + 36907412.0, + 27955134.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5679145803915162e-07, + 2.3988511177464034e-09, + 2.303158996852517e-09, + 2.3152970651807436e-09, + 2.2871571303539895e-09 + ], + "bp_grad_norms_F": [ + 9.731273166835308e-06, + 8.24191062065438e-08, + 7.936159107657659e-08, + 8.050036370832458e-08, + 7.917343225471996e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3125, + "loss_eval": 1.9350972175598145, + "epoch": 59 + }, + { + "hidden_norms": [ + 26731.64453125, + 6146909.5, + 30036422.0, + 37405476.0, + 28295768.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5779031059537374e-07, + 2.4025526013105036e-09, + 2.3019863792939077e-09, + 2.3154580475193143e-09, + 2.293559120403188e-09 + ], + "bp_grad_norms_F": [ + 9.80158438323997e-06, + 8.19560526110763e-08, + 7.889645559089331e-08, + 8.003749485396838e-08, + 7.871490481647925e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.328125, + "loss_eval": 1.941221833229065, + "epoch": 60 + }, + { + "hidden_norms": [ + 26842.380859375, + 6189510.0, + 30305302.0, + 37746040.0, + 28515236.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5621530735643319e-07, + 2.3939163984465495e-09, + 2.3025825690581314e-09, + 2.3148469807665606e-09, + 2.2962292067774115e-09 + ], + "bp_grad_norms_F": [ + 9.731598765938543e-06, + 8.167720011442725e-08, + 7.863504691840717e-08, + 7.977818938798009e-08, + 7.845925864558012e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3408203125, + "loss_eval": 1.9333854913711548, + "epoch": 61 + }, + { + "hidden_norms": [ + 26940.765625, + 6243737.5, + 30559802.0, + 38046748.0, + 28709922.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5672847553105385e-07, + 2.3640371882294176e-09, + 2.2657933307357325e-09, + 2.2837092217287136e-09, + 2.2615944672566e-09 + ], + "bp_grad_norms_F": [ + 9.668071470514406e-06, + 8.165712017671467e-08, + 7.869160612017367e-08, + 7.984421301898692e-08, + 7.851971872696595e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3203125, + "loss_eval": 1.9349033832550049, + "epoch": 62 + }, + { + "hidden_norms": [ + 27024.9140625, + 6285780.0, + 30783454.0, + 38328276.0, + 28883832.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5834399391678744e-07, + 2.3645019275875256e-09, + 2.2709001346044033e-09, + 2.2806179167389473e-09, + 2.2639952135250496e-09 + ], + "bp_grad_norms_F": [ + 9.799305189517327e-06, + 8.167254605950802e-08, + 7.873082097376027e-08, + 7.989201833424886e-08, + 7.856029071717785e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.31640625, + "loss_eval": 1.9409070014953613, + "epoch": 63 + }, + { + "hidden_norms": [ + 27131.298828125, + 6330564.0, + 31012118.0, + 38625700.0, + 29050708.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.588112752415327e-07, + 2.403508059245496e-09, + 2.2917150399592856e-09, + 2.3033945861783423e-09, + 2.2864310444958846e-09 + ], + "bp_grad_norms_F": [ + 9.54241204453865e-06, + 8.120213124129805e-08, + 7.823086889402475e-08, + 7.938096047155341e-08, + 7.805995494436502e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3388671875, + "loss_eval": 1.9211525917053223, + "epoch": 64 + }, + { + "hidden_norms": [ + 27208.25, + 6368866.0, + 31290472.0, + 38967492.0, + 29272872.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5740459957669373e-07, + 2.3837900542389434e-09, + 2.284773703564724e-09, + 2.298153001234482e-09, + 2.2881960770604337e-09 + ], + "bp_grad_norms_F": [ + 9.658318958827294e-06, + 8.104061777203242e-08, + 7.810449886846982e-08, + 7.925908818151584e-08, + 7.793548206791456e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.341796875, + "loss_eval": 1.9278589487075806, + "epoch": 65 + }, + { + "hidden_norms": [ + 27276.62890625, + 6418036.5, + 31545874.0, + 39283716.0, + 29477138.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5503043471198907e-07, + 2.357751327508595e-09, + 2.2688111389612686e-09, + 2.2810615618595875e-09, + 2.2629353946257424e-09 + ], + "bp_grad_norms_F": [ + 9.6196936283377e-06, + 8.082280089638516e-08, + 7.795324563630857e-08, + 7.91092062968346e-08, + 7.778949395742529e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33984375, + "loss_eval": 1.9305698871612549, + "epoch": 66 + }, + { + "hidden_norms": [ + 27340.607421875, + 6465153.0, + 31796498.0, + 39598816.0, + 29679376.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5558319432784629e-07, + 2.3627866330144798e-09, + 2.2779722552712656e-09, + 2.2912376440586968e-09, + 2.2693087409209056e-09 + ], + "bp_grad_norms_F": [ + 9.68782387644751e-06, + 8.066198375900058e-08, + 7.781451927257876e-08, + 7.897661191691441e-08, + 7.765357423750174e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3173828125, + "loss_eval": 1.9328408241271973, + "epoch": 67 + }, + { + "hidden_norms": [ + 27396.21484375, + 6507270.5, + 32041844.0, + 39890444.0, + 29881876.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5313091239477217e-07, + 2.336748128328736e-09, + 2.2449873071650472e-09, + 2.2587733905510277e-09, + 2.237245722014336e-09 + ], + "bp_grad_norms_F": [ + 9.509177289146464e-06, + 8.020302288969106e-08, + 7.739499352510393e-08, + 7.854830386122558e-08, + 7.723401296289012e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.318359375, + "loss_eval": 1.9248214960098267, + "epoch": 68 + }, + { + "hidden_norms": [ + 27461.697265625, + 6534744.5, + 32295470.0, + 40216712.0, + 30089670.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5820302223801264e-07, + 2.3342023869332706e-09, + 2.2277899525136036e-09, + 2.237228180490547e-09, + 2.2202666372095337e-09 + ], + "bp_grad_norms_F": [ + 9.662662705522962e-06, + 8.017656227821135e-08, + 7.73198536307973e-08, + 7.847864225141166e-08, + 7.715301109101347e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9348523616790771, + "epoch": 69 + }, + { + "hidden_norms": [ + 27519.265625, + 6576646.0, + 32533798.0, + 40497036.0, + 30273994.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5546247311704064e-07, + 2.332068760324546e-09, + 2.2422437240265936e-09, + 2.259832765361125e-09, + 2.2382042885737974e-09 + ], + "bp_grad_norms_F": [ + 9.630303793528583e-06, + 7.993662620719988e-08, + 7.707911464649442e-08, + 7.823470582479786e-08, + 7.691809855714382e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3212890625, + "loss_eval": 1.9298650026321411, + "epoch": 70 + }, + { + "hidden_norms": [ + 27578.833984375, + 6611492.0, + 32783444.0, + 40806224.0, + 30475316.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5486573090583988e-07, + 2.310989177800593e-09, + 2.214788796806033e-09, + 2.2242498953772838e-09, + 2.209040284029129e-09 + ], + "bp_grad_norms_F": [ + 9.58504097070545e-06, + 7.973878268785484e-08, + 7.692549530702308e-08, + 7.808419866250915e-08, + 7.67675771840004e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.314453125, + "loss_eval": 1.9349405765533447, + "epoch": 71 + }, + { + "hidden_norms": [ + 27637.01953125, + 6652277.0, + 32940606.0, + 41021348.0, + 30603354.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5176895828972192e-07, + 2.309274771405967e-09, + 2.2196366966653613e-09, + 2.2291524182094236e-09, + 2.212444005778025e-09 + ], + "bp_grad_norms_F": [ + 9.506617061560974e-06, + 7.949277147645262e-08, + 7.665874335316403e-08, + 7.781166289078101e-08, + 7.6499844681166e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.32421875, + "loss_eval": 1.9272165298461914, + "epoch": 72 + }, + { + "hidden_norms": [ + 27665.341796875, + 6675607.5, + 33128100.0, + 41256448.0, + 30754874.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.570084151580886e-07, + 2.2943660304974856e-09, + 2.2026656054663363e-09, + 2.2121668941110784e-09, + 2.1966797270067673e-09 + ], + "bp_grad_norms_F": [ + 9.71559165918734e-06, + 7.9600532387758e-08, + 7.679192037812754e-08, + 7.795681966626944e-08, + 7.663498990950757e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3115234375, + "loss_eval": 1.941681146621704, + "epoch": 73 + }, + { + "hidden_norms": [ + 27715.794921875, + 6709802.5, + 33331388.0, + 41504024.0, + 30915288.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5387240637210198e-07, + 2.3100528157016242e-09, + 2.2238448860179005e-09, + 2.2321375858780357e-09, + 2.2150188350167355e-09 + ], + "bp_grad_norms_F": [ + 9.473335921938997e-06, + 7.898351128687864e-08, + 7.616839781121598e-08, + 7.73214452465254e-08, + 7.601196472251104e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33203125, + "loss_eval": 1.9246938228607178, + "epoch": 74 + }, + { + "hidden_norms": [ + 27766.177734375, + 6726091.5, + 33455028.0, + 41663816.0, + 31007976.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5595279023727926e-07, + 2.298697898694968e-09, + 2.2091579676697393e-09, + 2.215150729512061e-09, + 2.1983310727335947e-09 + ], + "bp_grad_norms_F": [ + 9.587340173311532e-06, + 7.91313112813441e-08, + 7.627861009495973e-08, + 7.743443575236597e-08, + 7.611913588334573e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3232421875, + "loss_eval": 1.931347370147705, + "epoch": 75 + }, + { + "hidden_norms": [ + 27818.396484375, + 6749941.5, + 33562528.0, + 41806788.0, + 31089946.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.542799026310604e-07, + 2.3069177679246877e-09, + 2.2149184708553094e-09, + 2.2274431188407107e-09, + 2.2138819666395193e-09 + ], + "bp_grad_norms_F": [ + 9.57066185947042e-06, + 7.899650000808833e-08, + 7.612889874053508e-08, + 7.72842909668725e-08, + 7.59681810791335e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.328125, + "loss_eval": 1.9290614128112793, + "epoch": 76 + }, + { + "hidden_norms": [ + 27874.181640625, + 6776020.5, + 33686440.0, + 41956108.0, + 31183962.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5547591658560123e-07, + 2.2904955709890373e-09, + 2.199639581590418e-09, + 2.2111712461025945e-09, + 2.1966135577144996e-09 + ], + "bp_grad_norms_F": [ + 9.538461199554149e-06, + 7.882318442398173e-08, + 7.600280582664709e-08, + 7.715882333059199e-08, + 7.58423581714851e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3369140625, + "loss_eval": 1.9268429279327393, + "epoch": 77 + }, + { + "hidden_norms": [ + 27928.552734375, + 6790532.0, + 33797660.0, + 42095308.0, + 31270040.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5469180425498053e-07, + 2.3010513494625684e-09, + 2.2103030516973377e-09, + 2.2237711672090654e-09, + 2.206205884647261e-09 + ], + "bp_grad_norms_F": [ + 9.510661584499758e-06, + 7.866238149745186e-08, + 7.584375794067455e-08, + 7.699873805222524e-08, + 7.568271342961452e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3291015625, + "loss_eval": 1.9229360818862915, + "epoch": 78 + }, + { + "hidden_norms": [ + 27959.18359375, + 6814900.0, + 33951204.0, + 42283796.0, + 31402056.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5280090792657575e-07, + 2.2722823622700616e-09, + 2.182985348042621e-09, + 2.195454484876791e-09, + 2.1783830295163398e-09 + ], + "bp_grad_norms_F": [ + 9.445489922654815e-06, + 7.852113270701011e-08, + 7.573528648663341e-08, + 7.688608150147047e-08, + 7.557830628002193e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3232421875, + "loss_eval": 1.9262363910675049, + "epoch": 79 + }, + { + "hidden_norms": [ + 27969.6171875, + 6828402.0, + 34031784.0, + 42376960.0, + 31453510.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5404552300424257e-07, + 2.2810822120078456e-09, + 2.1932544669311937e-09, + 2.216228756068972e-09, + 2.193953241302893e-09 + ], + "bp_grad_norms_F": [ + 9.498375220573507e-06, + 7.844284510838406e-08, + 7.562837112118359e-08, + 7.677955693452532e-08, + 7.546795188773103e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.330078125, + "loss_eval": 1.925222396850586, + "epoch": 80 + }, + { + "hidden_norms": [ + 27976.40625, + 6839237.5, + 34096948.0, + 42451852.0, + 31495834.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5588855717396655e-07, + 2.290766465407046e-09, + 2.2075170580393433e-09, + 2.2167860880273338e-09, + 2.1972801356184846e-09 + ], + "bp_grad_norms_F": [ + 9.528901500743814e-06, + 7.844620597552421e-08, + 7.561048676052451e-08, + 7.67637402532273e-08, + 7.544804248027503e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3427734375, + "loss_eval": 1.9254777431488037, + "epoch": 81 + }, + { + "hidden_norms": [ + 28004.76953125, + 6848695.0, + 34154160.0, + 42523512.0, + 31536314.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.562642069075082e-07, + 2.289735068217169e-09, + 2.2051671599854217e-09, + 2.2135104860154797e-09, + 2.188419445658951e-09 + ], + "bp_grad_norms_F": [ + 9.512452379567549e-06, + 7.840634452804807e-08, + 7.557503778343744e-08, + 7.672917234913257e-08, + 7.541159163793054e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.341796875, + "loss_eval": 1.9253835678100586, + "epoch": 82 + }, + { + "hidden_norms": [ + 28036.138671875, + 6859844.5, + 34231564.0, + 42620400.0, + 31595422.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5447380974364933e-07, + 2.2824857559555767e-09, + 2.1902821778496673e-09, + 2.2037338620606306e-09, + 2.183933034416441e-09 + ], + "bp_grad_norms_F": [ + 9.456872248847503e-06, + 7.838458770947909e-08, + 7.556796077778927e-08, + 7.67221948194674e-08, + 7.540831603591869e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.333984375, + "loss_eval": 1.9241688251495361, + "epoch": 83 + }, + { + "hidden_norms": [ + 28063.341796875, + 6866642.0, + 34298612.0, + 42705280.0, + 31647722.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.550155843688117e-07, + 2.281024480410565e-09, + 2.1895063540000592e-09, + 2.20287676988562e-09, + 2.1853003850935693e-09 + ], + "bp_grad_norms_F": [ + 9.501630302111153e-06, + 7.833479287455702e-08, + 7.55063354063168e-08, + 7.666048418286664e-08, + 7.534579538059916e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.333984375, + "loss_eval": 1.9253199100494385, + "epoch": 84 + }, + { + "hidden_norms": [ + 28090.240234375, + 6875769.0, + 34361584.0, + 42782612.0, + 31697334.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.536338629648526e-07, + 2.267983800763318e-09, + 2.1772310621059887e-09, + 2.1934687399749464e-09, + 2.1765453883659802e-09 + ], + "bp_grad_norms_F": [ + 9.536663128528744e-06, + 7.836315774056857e-08, + 7.554304914947352e-08, + 7.669789425790441e-08, + 7.538390178751797e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3203125, + "loss_eval": 1.9292113780975342, + "epoch": 85 + }, + { + "hidden_norms": [ + 28114.236328125, + 6884728.0, + 34407252.0, + 42840440.0, + 31732750.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5464524949493352e-07, + 2.280014399502761e-09, + 2.1917956338768363e-09, + 2.2101085406234233e-09, + 2.1894293045221502e-09 + ], + "bp_grad_norms_F": [ + 9.505700290901586e-06, + 7.817885716576711e-08, + 7.534623591709533e-08, + 7.650118760693658e-08, + 7.518445244159011e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3310546875, + "loss_eval": 1.9261689186096191, + "epoch": 86 + }, + { + "hidden_norms": [ + 28132.669921875, + 6893751.5, + 34460884.0, + 42910656.0, + 31780534.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5502969574754388e-07, + 2.2780193287275097e-09, + 2.1857382570544814e-09, + 2.200839510635433e-09, + 2.1766897173591815e-09 + ], + "bp_grad_norms_F": [ + 9.460140972805675e-06, + 7.810618996018093e-08, + 7.528173284754303e-08, + 7.643409105639876e-08, + 7.512058886049999e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.333984375, + "loss_eval": 1.9239721298217773, + "epoch": 87 + }, + { + "hidden_norms": [ + 28148.599609375, + 6899411.0, + 34495884.0, + 42954048.0, + 31804918.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5502014605317527e-07, + 2.2734785165567928e-09, + 2.191139492069283e-09, + 2.201265170143074e-09, + 2.182727776300908e-09 + ], + "bp_grad_norms_F": [ + 9.466436495131347e-06, + 7.804617752071863e-08, + 7.521869349602639e-08, + 7.63711227591557e-08, + 7.50560502638109e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3369140625, + "loss_eval": 1.9230663776397705, + "epoch": 88 + }, + { + "hidden_norms": [ + 28162.9609375, + 6901370.5, + 34523684.0, + 42989220.0, + 31824814.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5575578515836241e-07, + 2.2783777087198587e-09, + 2.1914692283075965e-09, + 2.19572404702717e-09, + 2.1778470138400507e-09 + ], + "bp_grad_norms_F": [ + 9.514466910331976e-06, + 7.809557445170867e-08, + 7.525108713934969e-08, + 7.640503696393353e-08, + 7.508738519845792e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3447265625, + "loss_eval": 1.9263484477996826, + "epoch": 89 + }, + { + "hidden_norms": [ + 28175.54296875, + 6907143.0, + 34559816.0, + 43035484.0, + 31854504.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5354446247783926e-07, + 2.272713128803616e-09, + 2.1856987331148048e-09, + 2.2020374412790034e-09, + 2.1765065305601183e-09 + ], + "bp_grad_norms_F": [ + 9.444916940992698e-06, + 7.799643242378806e-08, + 7.51774322793608e-08, + 7.632959864167788e-08, + 7.50167856722328e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3349609375, + "loss_eval": 1.9226629734039307, + "epoch": 90 + }, + { + "hidden_norms": [ + 28185.98046875, + 6908239.0, + 34575728.0, + 43054472.0, + 31863434.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5382977380795637e-07, + 2.274502586274707e-09, + 2.1870079081054428e-09, + 2.1993444843104726e-09, + 2.181675506918168e-09 + ], + "bp_grad_norms_F": [ + 9.480510016146582e-06, + 7.80089948193563e-08, + 7.51953308508746e-08, + 7.635033938413471e-08, + 7.503523846708049e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3359375, + "loss_eval": 1.92463219165802, + "epoch": 91 + }, + { + "hidden_norms": [ + 28195.05078125, + 6911853.0, + 34606972.0, + 43094588.0, + 31890320.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5355996652033355e-07, + 2.2723862791451666e-09, + 2.1887525125663387e-09, + 2.1977624165003817e-09, + 2.1820119044946296e-09 + ], + "bp_grad_norms_F": [ + 9.450015568290837e-06, + 7.795882339678428e-08, + 7.514577760048269e-08, + 7.629873266523646e-08, + 7.498609022604796e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3388671875, + "loss_eval": 1.9231452941894531, + "epoch": 92 + }, + { + "hidden_norms": [ + 28202.009765625, + 6911585.0, + 34614424.0, + 43102544.0, + 31893396.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5335498915192147e-07, + 2.273481403136657e-09, + 2.18971196730422e-09, + 2.201623994224633e-09, + 2.179575853133997e-09 + ], + "bp_grad_norms_F": [ + 9.466421943216119e-06, + 7.796668910486915e-08, + 7.514941557928978e-08, + 7.630385567836129e-08, + 7.498929477378624e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3349609375, + "loss_eval": 1.9242045879364014, + "epoch": 93 + }, + { + "hidden_norms": [ + 28207.30078125, + 6912594.5, + 34624228.0, + 43114124.0, + 31900214.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.541789487191636e-07, + 2.26694063520938e-09, + 2.1774959613196643e-09, + 2.1911708003585773e-09, + 2.177005020698175e-09 + ], + "bp_grad_norms_F": [ + 9.48972228798084e-06, + 7.800251466960617e-08, + 7.518539746342867e-08, + 7.634076126805667e-08, + 7.502466559117238e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3349609375, + "loss_eval": 1.9264299869537354, + "epoch": 94 + }, + { + "hidden_norms": [ + 28210.744140625, + 6914176.5, + 34633372.0, + 43125584.0, + 31907212.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5396986441373883e-07, + 2.2685893164009485e-09, + 2.182473091139059e-09, + 2.2001969135487798e-09, + 2.1797674776280473e-09 + ], + "bp_grad_norms_F": [ + 9.470595614402555e-06, + 7.796354850597709e-08, + 7.514324096291602e-08, + 7.629726184177343e-08, + 7.498252330151445e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.3388671875, + "loss_eval": 1.9243674278259277, + "epoch": 95 + }, + { + "hidden_norms": [ + 28213.134765625, + 6914654.0, + 34637116.0, + 43129968.0, + 31909774.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5392139118830528e-07, + 2.2676351907335857e-09, + 2.181399949563456e-09, + 2.194956438827944e-09, + 2.1772521563434566e-09 + ], + "bp_grad_norms_F": [ + 9.468548341828864e-06, + 7.796590040243245e-08, + 7.514832134347671e-08, + 7.630251985801806e-08, + 7.498784526660529e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.33984375, + "loss_eval": 1.9245264530181885, + "epoch": 96 + }, + { + "hidden_norms": [ + 28214.392578125, + 6914571.0, + 34637992.0, + 43130936.0, + 31909692.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5425968058480066e-07, + 2.2704826907471443e-09, + 2.18207008018112e-09, + 2.1958874718563948e-09, + 2.177970914729599e-09 + ], + "bp_grad_norms_F": [ + 9.473776117374655e-06, + 7.796563039619286e-08, + 7.514674393860332e-08, + 7.63012906190852e-08, + 7.498606890976589e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9245213270187378, + "epoch": 97 + }, + { + "hidden_norms": [ + 28215.587890625, + 6915082.0, + 34641648.0, + 43135608.0, + 31912816.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5412730647312856e-07, + 2.2691615253478403e-09, + 2.181160807523952e-09, + 2.1947776929209795e-09, + 2.1773913783107446e-09 + ], + "bp_grad_norms_F": [ + 9.472671081312e-06, + 7.796593592956924e-08, + 7.514773869843339e-08, + 7.630221432464168e-08, + 7.498719867271575e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9246418476104736, + "epoch": 98 + }, + { + "hidden_norms": [ + 28216.130859375, + 6915161.5, + 34642452.0, + 43136600.0, + 31913348.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5420548038491688e-07, + 2.2695016976825855e-09, + 2.1805732774993203e-09, + 2.1951678252918327e-09, + 2.1776345171531375e-09 + ], + "bp_grad_norms_F": [ + 9.474650141783059e-06, + 7.796723622277568e-08, + 7.514872635283609e-08, + 7.63033014550274e-08, + 7.498815079998167e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9247386455535889, + "epoch": 99 + }, + { + "hidden_norms": [ + 28216.1875, + 6915194.0, + 34642580.0, + 43136768.0, + 31913448.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5419134058447526e-07, + 2.2693393830763853e-09, + 2.180579494748258e-09, + 2.194876502770171e-09, + 2.1777446512771803e-09 + ], + "bp_grad_norms_F": [ + 9.474156286159996e-06, + 7.796705148166438e-08, + 7.51486410877078e-08, + 7.630320908447175e-08, + 7.498806553485338e-08 + ], + "gamma_dfa": NaN, + "acc_eval": 0.337890625, + "loss_eval": 1.9247117042541504, + "epoch": 100 + } + ], + "seed": 42, + "depth": 4, + "d_hidden": 256 +}
\ No newline at end of file |
