summaryrefslogtreecommitdiff
path: root/results/snapshot_evolution_v2/snapshot_fa_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_evolution_v2/snapshot_fa_s42.json')
-rw-r--r--results/snapshot_evolution_v2/snapshot_fa_s42.json2734
1 files changed, 2734 insertions, 0 deletions
diff --git a/results/snapshot_evolution_v2/snapshot_fa_s42.json b/results/snapshot_evolution_v2/snapshot_fa_s42.json
new file mode 100644
index 0000000..277acec
--- /dev/null
+++ b/results/snapshot_evolution_v2/snapshot_fa_s42.json
@@ -0,0 +1,2734 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010068593546748161,
+ 0.000997236929833889,
+ 0.0009934091940522194,
+ 0.0009870644425973296,
+ 0.0009829498594626784
+ ],
+ "bp_grad_norms_F": [
+ 0.03544403985142708,
+ 0.03507080301642418,
+ 0.03477022796869278,
+ 0.03443896397948265,
+ 0.03407429903745651
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.115234375,
+ "loss_eval": 2.383650302886963,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 1156.72998046875,
+ 7932.5859375,
+ 11656.220703125,
+ 13101.765625,
+ 12094.2197265625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5287704400179791e-06,
+ 8.219874985115894e-07,
+ 8.303726986014226e-07,
+ 8.411634553340264e-07,
+ 8.074007382674608e-07
+ ],
+ "bp_grad_norms_F": [
+ 0.0005889489548280835,
+ 0.0001249020715476945,
+ 0.00010261647548759356,
+ 8.311456622323021e-05,
+ 6.362409476423636e-05
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2431640625,
+ "loss_eval": 2.0429816246032715,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 2267.652099609375,
+ 33227.19921875,
+ 62863.03515625,
+ 73248.0546875,
+ 64100.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 6.826750791333325e-07,
+ 1.582481274908787e-07,
+ 1.5909284911685972e-07,
+ 1.6235998145930353e-07,
+ 1.57003455569793e-07
+ ],
+ "bp_grad_norms_F": [
+ 9.194230369757861e-05,
+ 3.062757241423242e-05,
+ 2.5034905775100924e-05,
+ 1.2339382010395639e-05,
+ 1.1088715837104246e-05
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.234375,
+ "loss_eval": 2.053070068359375,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 3317.195556640625,
+ 69574.59375,
+ 208893.703125,
+ 272473.75,
+ 236858.453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 5.585509370575892e-07,
+ 5.853191709093153e-08,
+ 5.772180244889569e-08,
+ 5.9099026117337417e-08,
+ 5.743537911939711e-08
+ ],
+ "bp_grad_norms_F": [
+ 5.4304215154843405e-05,
+ 1.798659286578186e-05,
+ 6.792580734327203e-06,
+ 5.748081548517803e-06,
+ 5.4292308959702495e-06
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.109177350997925,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 4279.80322265625,
+ 131147.296875,
+ 524522.6875,
+ 669556.125,
+ 582199.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 4.5417544924930553e-07,
+ 2.7819011094720736e-08,
+ 2.7284025705398562e-08,
+ 2.7924896173203706e-08,
+ 2.717020919362767e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.7083517124992795e-05,
+ 3.1135298286244506e-06,
+ 2.188051212215214e-06,
+ 1.643483983571059e-06,
+ 1.5356297353719128e-06
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2314453125,
+ "loss_eval": 2.1304922103881836,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 5095.1298828125,
+ 222828.6875,
+ 891649.1875,
+ 1124229.75,
+ 978070.3125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.9661114215050475e-07,
+ 1.7936926610673254e-08,
+ 1.787710601774961e-08,
+ 1.8164961090860743e-08,
+ 1.7773361449258118e-08
+ ],
+ "bp_grad_norms_F": [
+ 2.5229386665159836e-05,
+ 1.7291312133238534e-06,
+ 8.046768016356509e-07,
+ 6.81868698393373e-07,
+ 6.581432785424113e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2275390625,
+ "loss_eval": 2.1189823150634766,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 5762.8369140625,
+ 345252.125,
+ 1352057.25,
+ 1685390.25,
+ 1472510.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.5811123666462663e-07,
+ 1.2679316263586315e-08,
+ 1.2558022177699968e-08,
+ 1.2735733356805667e-08,
+ 1.2553626582700872e-08
+ ],
+ "bp_grad_norms_F": [
+ 1.9819366571027786e-05,
+ 7.985001957422355e-07,
+ 4.666244706186262e-07,
+ 4.659337093926297e-07,
+ 4.531105162186577e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2314453125,
+ "loss_eval": 2.1147799491882324,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 6342.46337890625,
+ 489436.21875,
+ 1846600.125,
+ 2298539.25,
+ 2010095.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2295056939801725e-07,
+ 9.47152134500584e-09,
+ 9.449903082270339e-09,
+ 9.579181003971371e-09,
+ 9.398083200551355e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.761323437676765e-05,
+ 3.5219920846429886e-07,
+ 3.464733993041591e-07,
+ 3.515923765462503e-07,
+ 3.4331398524045653e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.263671875,
+ "loss_eval": 2.0468926429748535,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 6895.3232421875,
+ 642604.125,
+ 2340199.25,
+ 2912852.0,
+ 2551695.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 3.2115181625158584e-07,
+ 8.011411978259275e-09,
+ 8.093356207439228e-09,
+ 8.185297772911326e-09,
+ 8.036058929405954e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.6510130080860108e-05,
+ 2.8924068828928284e-07,
+ 2.88436524442659e-07,
+ 2.9188095140852965e-07,
+ 2.860562631212815e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2373046875,
+ "loss_eval": 2.0705394744873047,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 7418.32666015625,
+ 802952.8125,
+ 2905706.5,
+ 3629847.25,
+ 3176127.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.9990744110364176e-07,
+ 6.746414982217175e-09,
+ 6.801009533319302e-09,
+ 6.844500521907548e-09,
+ 6.780156436292373e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.5715995687060058e-05,
+ 2.419061502223485e-07,
+ 2.416737459043361e-07,
+ 2.441595654545381e-07,
+ 2.39673738633428e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.271484375,
+ "loss_eval": 2.03157901763916,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 8026.80126953125,
+ 964342.4375,
+ 3455197.75,
+ 4322591.0,
+ 3777789.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.9810524893036927e-07,
+ 5.931947377746383e-09,
+ 5.9767870652649435e-09,
+ 6.012730313642578e-09,
+ 5.922320855944463e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.546428757137619e-05,
+ 2.1311132059054216e-07,
+ 2.1318879817044945e-07,
+ 2.1529912430651166e-07,
+ 2.115393868962201e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2421875,
+ "loss_eval": 2.029039144515991,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 8568.4677734375,
+ 1146051.75,
+ 4149878.75,
+ 5211595.5,
+ 4551772.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.77834743656058e-07,
+ 5.156825633179096e-09,
+ 5.185044393840599e-09,
+ 5.243859568793141e-09,
+ 5.148059312176656e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.4489689419860952e-05,
+ 1.8374593935277517e-07,
+ 1.8364994502917398e-07,
+ 1.8539546431384224e-07,
+ 1.8235705567803961e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.279296875,
+ "loss_eval": 2.015061855316162,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 9099.6689453125,
+ 1306440.25,
+ 4712579.5,
+ 5930700.5,
+ 5167806.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.789404618397384e-07,
+ 4.740023484828271e-09,
+ 4.688871069191691e-09,
+ 4.722021884617789e-09,
+ 4.664129082954105e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.440922096662689e-05,
+ 1.6886964715467911e-07,
+ 1.6845007166921278e-07,
+ 1.6997903173887607e-07,
+ 1.673002003599322e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.279296875,
+ "loss_eval": 2.0080716609954834,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 9619.3310546875,
+ 1468314.25,
+ 5278606.0,
+ 6647205.0,
+ 5776389.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.678217470020172e-07,
+ 4.431488953571261e-09,
+ 4.461886859985498e-09,
+ 4.481298443437254e-09,
+ 4.434627776106481e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.4280021787271835e-05,
+ 1.5716064183379785e-07,
+ 1.5650925888621714e-07,
+ 1.5793726504398364e-07,
+ 1.5547414022876183e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.294921875,
+ "loss_eval": 2.003105401992798,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 10185.365234375,
+ 1637280.875,
+ 5941891.0,
+ 7477497.0,
+ 6482495.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.580181046596408e-07,
+ 4.108497098087582e-09,
+ 4.027958855346014e-09,
+ 4.0670666834330405e-09,
+ 4.01310229491969e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3607143955596257e-05,
+ 1.4447114438098652e-07,
+ 1.4335948606003512e-07,
+ 1.4459322983384482e-07,
+ 1.424295135166176e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2841796875,
+ "loss_eval": 1.9895731210708618,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 10773.4443359375,
+ 1777185.125,
+ 6485962.5,
+ 8158632.5,
+ 7057802.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.536919225804013e-07,
+ 3.8119583045670424e-09,
+ 3.815232130222057e-09,
+ 3.836773565524254e-09,
+ 3.790971536687948e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3741724615101703e-05,
+ 1.3785883368200302e-07,
+ 1.3661090747518756e-07,
+ 1.3781669849777245e-07,
+ 1.3573732360327995e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.263671875,
+ "loss_eval": 2.0124382972717285,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11403.58984375,
+ 1931677.0,
+ 7089585.5,
+ 8906384.0,
+ 7683122.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.446777500608732e-07,
+ 3.674859083702131e-09,
+ 3.648833679648078e-09,
+ 3.6761997890266684e-09,
+ 3.624884392650074e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3561247214965988e-05,
+ 1.2985380237751087e-07,
+ 1.2829688955662277e-07,
+ 1.294151275033073e-07,
+ 1.2746555455578346e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.26953125,
+ "loss_eval": 2.0030646324157715,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 12115.1162109375,
+ 2091857.0,
+ 7735447.5,
+ 9727085.0,
+ 8371443.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.378987460360804e-07,
+ 3.4695852857424825e-09,
+ 3.42812689346772e-09,
+ 3.4526042025362358e-09,
+ 3.40047856539627e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3279566701385193e-05,
+ 1.2257437731477694e-07,
+ 1.2078584177288576e-07,
+ 1.2181956776657898e-07,
+ 1.1999593141354126e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2939453125,
+ "loss_eval": 1.9935777187347412,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 12755.7646484375,
+ 2248501.0,
+ 8338276.5,
+ 10490721.0,
+ 8991669.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.3127104498144035e-07,
+ 3.35100103221464e-09,
+ 3.3095433060736923e-09,
+ 3.326423581029303e-09,
+ 3.2682878625678313e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3015700460528024e-05,
+ 1.1814677947086238e-07,
+ 1.1589928305966168e-07,
+ 1.1685516199122503e-07,
+ 1.1511789210771894e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2900390625,
+ "loss_eval": 1.9912320375442505,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 13395.4189453125,
+ 2393670.0,
+ 8949124.0,
+ 11235038.0,
+ 9603954.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.2520477216403378e-07,
+ 3.2867890631393948e-09,
+ 3.2246825210080488e-09,
+ 3.250592239822936e-09,
+ 3.201830800492189e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.3049841072643176e-05,
+ 1.1301781910333375e-07,
+ 1.1090982354744483e-07,
+ 1.1187000836798688e-07,
+ 1.101881252907333e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2626953125,
+ "loss_eval": 2.0112197399139404,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 14034.6982421875,
+ 2529761.5,
+ 9576616.0,
+ 12035853.0,
+ 10258897.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.1533313088184514e-07,
+ 3.174721152632287e-09,
+ 3.1246687459685063e-09,
+ 3.149874805430386e-09,
+ 3.09314329705046e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.26855793496361e-05,
+ 1.0948959072720754e-07,
+ 1.0680034279175743e-07,
+ 1.0768705749342189e-07,
+ 1.0610038714276016e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.25,
+ "loss_eval": 2.0056447982788086,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 14717.9462890625,
+ 2650771.25,
+ 10157696.0,
+ 12784758.0,
+ 10849881.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.086567434389508e-07,
+ 2.999795301050767e-09,
+ 2.966421552841325e-09,
+ 2.9786708655166194e-09,
+ 2.947827537624903e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2321271242399234e-05,
+ 1.0535904237940485e-07,
+ 1.0280631101977633e-07,
+ 1.0365675251478024e-07,
+ 1.021143916091205e-07
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.9869788885116577,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 15327.8466796875,
+ 2777500.75,
+ 10776735.0,
+ 13573723.0,
+ 11474654.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.0232576503076416e-07,
+ 2.9384910060770153e-09,
+ 2.867603710043909e-09,
+ 2.8935454032819052e-09,
+ 2.8441446975335793e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.231426631420618e-05,
+ 1.0333050681765599e-07,
+ 1.0039466502576033e-07,
+ 1.0124550442469626e-07,
+ 9.972216474807283e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2939453125,
+ "loss_eval": 1.9892809391021729,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 15945.8837890625,
+ 2878910.75,
+ 11304857.0,
+ 14241028.0,
+ 11994238.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 2.0171727044271393e-07,
+ 2.9479860774728195e-09,
+ 2.8580404709543927e-09,
+ 2.8716116151628057e-09,
+ 2.8270419338838337e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2025901924062055e-05,
+ 1.0096052704966496e-07,
+ 9.789676624905042e-08,
+ 9.872773176766714e-08,
+ 9.722123195388122e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2802734375,
+ "loss_eval": 1.9858973026275635,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 16595.853515625,
+ 3002464.5,
+ 11949546.0,
+ 15061732.0,
+ 12646630.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.9120048477816454e-07,
+ 2.8694004949869623e-09,
+ 2.772703400211185e-09,
+ 2.777924779095997e-09,
+ 2.7492945697815685e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.2024025636492297e-05,
+ 9.894926478182242e-08,
+ 9.581360416177631e-08,
+ 9.663772715384766e-08,
+ 9.51538083882042e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.296875,
+ "loss_eval": 1.9969089031219482,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 17227.1640625,
+ 3125553.25,
+ 12574712.0,
+ 15844785.0,
+ 13247150.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.8941717883080855e-07,
+ 2.8377846739147117e-09,
+ 2.7375035571708395e-09,
+ 2.7606503749666444e-09,
+ 2.7206534802814986e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.153391167463269e-05,
+ 9.671435208247203e-08,
+ 9.34372863525823e-08,
+ 9.424089597587226e-08,
+ 9.280081059159784e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.294921875,
+ "loss_eval": 1.9766383171081543,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 17808.20703125,
+ 3256055.25,
+ 13319775.0,
+ 16758460.0,
+ 13956453.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.8628608700055338e-07,
+ 2.7554525328099544e-09,
+ 2.625358597185823e-09,
+ 2.6348250248275917e-09,
+ 2.614828797931068e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0964491593767889e-05,
+ 9.419229485274627e-08,
+ 9.09606185928169e-08,
+ 9.175563775443152e-08,
+ 9.03681396380307e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2919921875,
+ "loss_eval": 1.9645390510559082,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 18401.28125,
+ 3393640.75,
+ 14088409.0,
+ 17726368.0,
+ 14707189.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7694672749257734e-07,
+ 2.722393421805691e-09,
+ 2.634128470901942e-09,
+ 2.6627771099185793e-09,
+ 2.6215960513553682e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1054430615331512e-05,
+ 9.26544814205954e-08,
+ 8.924564554035896e-08,
+ 9.002578593708677e-08,
+ 8.865336553753878e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2861328125,
+ "loss_eval": 1.974367618560791,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 18936.51953125,
+ 3515726.25,
+ 14734875.0,
+ 18530786.0,
+ 15301454.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7923295558830432e-07,
+ 2.6605673220103654e-09,
+ 2.530292642077825e-09,
+ 2.5396913461150916e-09,
+ 2.517351882502794e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.1157896551594604e-05,
+ 9.233546904852119e-08,
+ 8.888883229474231e-08,
+ 8.968125086994405e-08,
+ 8.831575115664236e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.2841796875,
+ "loss_eval": 1.986099362373352,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 19457.962890625,
+ 3664789.5,
+ 15342228.0,
+ 19308666.0,
+ 15894652.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.7488744674665213e-07,
+ 2.6636790551037848e-09,
+ 2.4992619085395518e-09,
+ 2.507181573463413e-09,
+ 2.486318262384657e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.092042657546699e-05,
+ 9.157383118463258e-08,
+ 8.810303597783786e-08,
+ 8.888122238204232e-08,
+ 8.75455583582152e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.32421875,
+ "loss_eval": 1.9868172407150269,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 19933.78515625,
+ 3775119.25,
+ 16017107.0,
+ 20154288.0,
+ 16541561.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.715164188453855e-07,
+ 2.5937807457410145e-09,
+ 2.4676627408126706e-09,
+ 2.4873916260048645e-09,
+ 2.4605657511500567e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0760413715615869e-05,
+ 9.029215419786851e-08,
+ 8.696353148707203e-08,
+ 8.772182269467521e-08,
+ 8.64171596504093e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.291015625,
+ "loss_eval": 1.9754526615142822,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 20432.466796875,
+ 3910461.25,
+ 16712518.0,
+ 21021696.0,
+ 17196572.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.710603356741558e-07,
+ 2.6387678708772455e-09,
+ 2.524718212271182e-09,
+ 2.5378650292395832e-09,
+ 2.5052109275947032e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0587626093183644e-05,
+ 8.93876332952459e-08,
+ 8.59824282883892e-08,
+ 8.675493745613494e-08,
+ 8.546451368829366e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9657469987869263,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 20875.439453125,
+ 4054334.0,
+ 17463474.0,
+ 21948092.0,
+ 17887228.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.729485461510194e-07,
+ 2.6252673368531987e-09,
+ 2.4720219204965588e-09,
+ 2.491059358789016e-09,
+ 2.4621127359125694e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0830392966454383e-05,
+ 8.912193294463577e-08,
+ 8.547249308321625e-08,
+ 8.626851411008829e-08,
+ 8.495522507701025e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.31640625,
+ "loss_eval": 1.9752991199493408,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 21372.0234375,
+ 4181554.25,
+ 18179600.0,
+ 22866024.0,
+ 18562826.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6644050049308134e-07,
+ 2.5652076018900516e-09,
+ 2.4415069965755265e-09,
+ 2.4562532008332028e-09,
+ 2.423905742787724e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0476498573552817e-05,
+ 8.780278903941507e-08,
+ 8.420673225373321e-08,
+ 8.501019266304866e-08,
+ 8.373319104748589e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9647243022918701,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 21698.390625,
+ 4323451.5,
+ 18873394.0,
+ 23742746.0,
+ 19211736.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6982900774564769e-07,
+ 2.6139097553112833e-09,
+ 2.4535891096633122e-09,
+ 2.465766257842006e-09,
+ 2.4349082750063644e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0547244528424926e-05,
+ 8.761546865798664e-08,
+ 8.380350635661671e-08,
+ 8.460440881208342e-08,
+ 8.332586531878405e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9688763618469238,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 22000.6484375,
+ 4419910.5,
+ 19288578.0,
+ 24275390.0,
+ 19571482.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6632812105399353e-07,
+ 2.5976403250638214e-09,
+ 2.4608304283191273e-09,
+ 2.4786184216196716e-09,
+ 2.4511619400868767e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0402384759800043e-05,
+ 8.75945431744185e-08,
+ 8.378519567031617e-08,
+ 8.458554390244899e-08,
+ 8.331597456390227e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.962469458580017,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 22332.140625,
+ 4505425.5,
+ 19876824.0,
+ 24999434.0,
+ 20098762.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.673159886195208e-07,
+ 2.5706452522200607e-09,
+ 2.4236175288905315e-09,
+ 2.4205843995872556e-09,
+ 2.4001298726261666e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0201652912655845e-05,
+ 8.668673245892933e-08,
+ 8.301810083821692e-08,
+ 8.384706973174616e-08,
+ 8.257533323785538e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3046875,
+ "loss_eval": 1.9482183456420898,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 22704.90625,
+ 4601120.5,
+ 20416742.0,
+ 25650594.0,
+ 20558608.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6260217705621471e-07,
+ 2.501829188261695e-09,
+ 2.37497355115579e-09,
+ 2.379827890308661e-09,
+ 2.364261231235787e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0307686352462042e-05,
+ 8.687224806180893e-08,
+ 8.317324073914278e-08,
+ 8.40014422465174e-08,
+ 8.273995177887628e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.9718880653381348,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 22953.462890625,
+ 4708118.5,
+ 21018216.0,
+ 26396430.0,
+ 21081344.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6642815126033383e-07,
+ 2.5344910614677474e-09,
+ 2.3881991939589398e-09,
+ 2.393568676595237e-09,
+ 2.366601137282487e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0291260878148023e-05,
+ 8.597661604881068e-08,
+ 8.222435354809932e-08,
+ 8.30701907261755e-08,
+ 8.179645050176987e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3173828125,
+ "loss_eval": 1.9656648635864258,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 23329.68359375,
+ 4813138.0,
+ 21547542.0,
+ 27050624.0,
+ 21536360.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6755477361130033e-07,
+ 2.5133575221047977e-09,
+ 2.3339741250794077e-09,
+ 2.3630628565030065e-09,
+ 2.3331871989995534e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0207740160694811e-05,
+ 8.593145395252577e-08,
+ 8.217772773377874e-08,
+ 8.303662468733819e-08,
+ 8.176558452532845e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9581431150436401,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 23598.361328125,
+ 4903029.0,
+ 22069792.0,
+ 27713646.0,
+ 21984984.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6272531411232194e-07,
+ 2.4648321161890863e-09,
+ 2.360529327560812e-09,
+ 2.364856310776986e-09,
+ 2.3259458803437383e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0116659723280463e-05,
+ 8.537404028174933e-08,
+ 8.159113207284463e-08,
+ 8.246142613188567e-08,
+ 8.120937167177544e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3212890625,
+ "loss_eval": 1.9615185260772705,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 23904.275390625,
+ 5004298.0,
+ 22611816.0,
+ 28369744.0,
+ 22444866.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6563248550482967e-07,
+ 2.5165425299178423e-09,
+ 2.3475779098447447e-09,
+ 2.3561286255358027e-09,
+ 2.3397561665916555e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0093037417391315e-05,
+ 8.496893855181042e-08,
+ 8.129408968216012e-08,
+ 8.217033098389948e-08,
+ 8.091691228173659e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3056640625,
+ "loss_eval": 1.9596519470214844,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 24124.95703125,
+ 5079679.0,
+ 23056108.0,
+ 28905466.0,
+ 22810520.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.650763863381144e-07,
+ 2.5150639348936465e-09,
+ 2.375127650111608e-09,
+ 2.3864086262648243e-09,
+ 2.3595001508169844e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0080430001835339e-05,
+ 8.473855928059493e-08,
+ 8.099364379177132e-08,
+ 8.18785963474511e-08,
+ 8.06336757364079e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3251953125,
+ "loss_eval": 1.9462497234344482,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 24350.154296875,
+ 5170977.5,
+ 23526890.0,
+ 29466298.0,
+ 23191828.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6226854882006592e-07,
+ 2.5123039204544284e-09,
+ 2.381558061870237e-09,
+ 2.391710607341224e-09,
+ 2.3734676446451886e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0192407899012323e-05,
+ 8.457134015316115e-08,
+ 8.096912296196024e-08,
+ 8.18817795789073e-08,
+ 8.06216249316094e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.950229287147522,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 24543.87890625,
+ 5230886.0,
+ 23931748.0,
+ 29937192.0,
+ 23499106.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6538373870389478e-07,
+ 2.4975805867910594e-09,
+ 2.3630661871720804e-09,
+ 2.3725827968945623e-09,
+ 2.3566677498365607e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0082419976242818e-05,
+ 8.452050792584487e-08,
+ 8.1015215869229e-08,
+ 8.194035672204336e-08,
+ 8.06845363854336e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.30078125,
+ "loss_eval": 1.9453504085540771,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 24711.091796875,
+ 5298309.0,
+ 24318082.0,
+ 30413608.0,
+ 23808788.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6054062257353507e-07,
+ 2.4891384509118097e-09,
+ 2.358970574434238e-09,
+ 2.368707230360201e-09,
+ 2.3476884880579973e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0053097867057659e-05,
+ 8.462841805112475e-08,
+ 8.112137095395155e-08,
+ 8.206667700960679e-08,
+ 8.080490943029872e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3076171875,
+ "loss_eval": 1.9472556114196777,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 24881.759765625,
+ 5378830.0,
+ 24836314.0,
+ 31031698.0,
+ 24231208.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.623594982902432e-07,
+ 2.4946655852176036e-09,
+ 2.3718913499948258e-09,
+ 2.3750907907071905e-09,
+ 2.3478305966051494e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.012617394735571e-05,
+ 8.473565316080567e-08,
+ 8.116323613194254e-08,
+ 8.212452939915238e-08,
+ 8.085635272436775e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9553910493850708,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 25032.86328125,
+ 5446721.0,
+ 25258438.0,
+ 31534450.0,
+ 24555236.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.632960788811033e-07,
+ 2.470913029739563e-09,
+ 2.316862923734675e-09,
+ 2.3169177687520914e-09,
+ 2.3029997908707855e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.900480108626653e-06,
+ 8.452943944803337e-08,
+ 8.106712812150363e-08,
+ 8.2038923210348e-08,
+ 8.077390845073751e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9489891529083252,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 25306.201171875,
+ 5468743.5,
+ 25525060.0,
+ 31867246.0,
+ 24722362.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5847486167785974e-07,
+ 2.4746471538605874e-09,
+ 2.3425053008452323e-09,
+ 2.3598758502885175e-09,
+ 2.3311046426499615e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.7980091595673e-06,
+ 8.43976621922593e-08,
+ 8.096849057892541e-08,
+ 8.195242884312393e-08,
+ 8.069165602364592e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3134765625,
+ "loss_eval": 1.9313395023345947,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 25419.810546875,
+ 5521521.5,
+ 25869234.0,
+ 32269302.0,
+ 24978000.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6377224199004559e-07,
+ 2.4982107493798367e-09,
+ 2.3510355884326373e-09,
+ 2.359785478134313e-09,
+ 2.3393140757832498e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.003210672934074e-05,
+ 8.464159151344575e-08,
+ 8.12287339613249e-08,
+ 8.224073155815859e-08,
+ 8.095251047279817e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3095703125,
+ "loss_eval": 1.94147527217865,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 25543.001953125,
+ 5573999.0,
+ 26298990.0,
+ 32786014.0,
+ 25316304.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.593823384382631e-07,
+ 2.512666297249666e-09,
+ 2.392667397543846e-09,
+ 2.4054993552624637e-09,
+ 2.386617126148849e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0020607987826224e-05,
+ 8.429628906014841e-08,
+ 8.090298564411569e-08,
+ 8.193208600459911e-08,
+ 8.064517231787249e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.32421875,
+ "loss_eval": 1.9412651062011719,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 25755.05859375,
+ 5633394.5,
+ 26712786.0,
+ 33270568.0,
+ 25632750.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.615333218296655e-07,
+ 2.483285133081381e-09,
+ 2.346244309947565e-09,
+ 2.3569415308344333e-09,
+ 2.342600557980745e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.841775863606017e-06,
+ 8.406106388747503e-08,
+ 8.07588094176026e-08,
+ 8.180128219237304e-08,
+ 8.051125632846379e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3193359375,
+ "loss_eval": 1.9356749057769775,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 25838.6875,
+ 5676516.5,
+ 26956640.0,
+ 33554564.0,
+ 25797852.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5953406773405732e-07,
+ 2.4927520048123597e-09,
+ 2.379676899977312e-09,
+ 2.3930151193951588e-09,
+ 2.37515118683973e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0000761903938837e-05,
+ 8.431718612200712e-08,
+ 8.108807492135384e-08,
+ 8.215462798943918e-08,
+ 8.085050495765245e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.322265625,
+ "loss_eval": 1.9513205289840698,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 25925.244140625,
+ 5739893.0,
+ 27348932.0,
+ 34049508.0,
+ 26115016.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5941535025376652e-07,
+ 2.4419115618457e-09,
+ 2.335727167235291e-09,
+ 2.3481498967470316e-09,
+ 2.335213800108704e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.962137482943945e-06,
+ 8.399173623274692e-08,
+ 8.08289613019042e-08,
+ 8.190350797576684e-08,
+ 8.060307266077871e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3173828125,
+ "loss_eval": 1.9443122148513794,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 26078.8125,
+ 5808761.5,
+ 27799278.0,
+ 34615776.0,
+ 26499736.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5867621527831943e-07,
+ 2.4137036813698387e-09,
+ 2.31744068379669e-09,
+ 2.327602111051874e-09,
+ 2.313133462550354e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.748204320203513e-06,
+ 8.347069524461403e-08,
+ 8.032785814293675e-08,
+ 8.14167648854891e-08,
+ 8.011366503524187e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9361423254013062,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 26192.453125,
+ 5875144.0,
+ 28166196.0,
+ 35073324.0,
+ 26791154.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5812705100870517e-07,
+ 2.4364927853071094e-09,
+ 2.339390015038134e-09,
+ 2.3421220518571317e-09,
+ 2.328011117214146e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.899279575620312e-06,
+ 8.359175751593284e-08,
+ 8.043829780035594e-08,
+ 8.154502495472116e-08,
+ 8.023434361348336e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.940393090248108,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 26281.6796875,
+ 5935011.0,
+ 28625862.0,
+ 35638648.0,
+ 27180628.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6062698193763936e-07,
+ 2.4364579243041362e-09,
+ 2.3309267849214166e-09,
+ 2.3373505353418977e-09,
+ 2.3235424695400297e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.917155693983659e-06,
+ 8.292303022017222e-08,
+ 7.976373694873473e-08,
+ 8.087503999831824e-08,
+ 7.955991776498195e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.945765495300293,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 26394.865234375,
+ 5988690.5,
+ 28944822.0,
+ 36062032.0,
+ 27426714.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.6303006589168945e-07,
+ 2.4247555074907723e-09,
+ 2.309517688203755e-09,
+ 2.3198174492478074e-09,
+ 2.3075219512946887e-09
+ ],
+ "bp_grad_norms_F": [
+ 1.0007075616158545e-05,
+ 8.301859821813196e-08,
+ 7.986342609456187e-08,
+ 8.099387827087412e-08,
+ 7.966451676111319e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.9433667659759521,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 26515.357421875,
+ 6051740.5,
+ 29293128.0,
+ 36499980.0,
+ 27690768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5923862406452827e-07,
+ 2.3941215676615e-09,
+ 2.28924412759568e-09,
+ 2.2969097734915067e-09,
+ 2.280708066848547e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.82554138317937e-06,
+ 8.282027863515395e-08,
+ 7.976368721074323e-08,
+ 8.090249536962801e-08,
+ 7.957222436516531e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.306640625,
+ "loss_eval": 1.944448709487915,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 26621.947265625,
+ 6089471.5,
+ 29639332.0,
+ 36907412.0,
+ 27955134.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5679145803915162e-07,
+ 2.3988511177464034e-09,
+ 2.303158996852517e-09,
+ 2.3152970651807436e-09,
+ 2.2871571303539895e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.731273166835308e-06,
+ 8.24191062065438e-08,
+ 7.936159107657659e-08,
+ 8.050036370832458e-08,
+ 7.917343225471996e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3125,
+ "loss_eval": 1.9350972175598145,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 26731.64453125,
+ 6146909.5,
+ 30036422.0,
+ 37405476.0,
+ 28295768.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5779031059537374e-07,
+ 2.4025526013105036e-09,
+ 2.3019863792939077e-09,
+ 2.3154580475193143e-09,
+ 2.293559120403188e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.80158438323997e-06,
+ 8.19560526110763e-08,
+ 7.889645559089331e-08,
+ 8.003749485396838e-08,
+ 7.871490481647925e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.328125,
+ "loss_eval": 1.941221833229065,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 26842.380859375,
+ 6189510.0,
+ 30305302.0,
+ 37746040.0,
+ 28515236.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5621530735643319e-07,
+ 2.3939163984465495e-09,
+ 2.3025825690581314e-09,
+ 2.3148469807665606e-09,
+ 2.2962292067774115e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.731598765938543e-06,
+ 8.167720011442725e-08,
+ 7.863504691840717e-08,
+ 7.977818938798009e-08,
+ 7.845925864558012e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3408203125,
+ "loss_eval": 1.9333854913711548,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 26940.765625,
+ 6243737.5,
+ 30559802.0,
+ 38046748.0,
+ 28709922.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5672847553105385e-07,
+ 2.3640371882294176e-09,
+ 2.2657933307357325e-09,
+ 2.2837092217287136e-09,
+ 2.2615944672566e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.668071470514406e-06,
+ 8.165712017671467e-08,
+ 7.869160612017367e-08,
+ 7.984421301898692e-08,
+ 7.851971872696595e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.9349033832550049,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 27024.9140625,
+ 6285780.0,
+ 30783454.0,
+ 38328276.0,
+ 28883832.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5834399391678744e-07,
+ 2.3645019275875256e-09,
+ 2.2709001346044033e-09,
+ 2.2806179167389473e-09,
+ 2.2639952135250496e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.799305189517327e-06,
+ 8.167254605950802e-08,
+ 7.873082097376027e-08,
+ 7.989201833424886e-08,
+ 7.856029071717785e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.31640625,
+ "loss_eval": 1.9409070014953613,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 27131.298828125,
+ 6330564.0,
+ 31012118.0,
+ 38625700.0,
+ 29050708.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.588112752415327e-07,
+ 2.403508059245496e-09,
+ 2.2917150399592856e-09,
+ 2.3033945861783423e-09,
+ 2.2864310444958846e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.54241204453865e-06,
+ 8.120213124129805e-08,
+ 7.823086889402475e-08,
+ 7.938096047155341e-08,
+ 7.805995494436502e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3388671875,
+ "loss_eval": 1.9211525917053223,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 27208.25,
+ 6368866.0,
+ 31290472.0,
+ 38967492.0,
+ 29272872.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5740459957669373e-07,
+ 2.3837900542389434e-09,
+ 2.284773703564724e-09,
+ 2.298153001234482e-09,
+ 2.2881960770604337e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.658318958827294e-06,
+ 8.104061777203242e-08,
+ 7.810449886846982e-08,
+ 7.925908818151584e-08,
+ 7.793548206791456e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.341796875,
+ "loss_eval": 1.9278589487075806,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 27276.62890625,
+ 6418036.5,
+ 31545874.0,
+ 39283716.0,
+ 29477138.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5503043471198907e-07,
+ 2.357751327508595e-09,
+ 2.2688111389612686e-09,
+ 2.2810615618595875e-09,
+ 2.2629353946257424e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.6196936283377e-06,
+ 8.082280089638516e-08,
+ 7.795324563630857e-08,
+ 7.91092062968346e-08,
+ 7.778949395742529e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.33984375,
+ "loss_eval": 1.9305698871612549,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 27340.607421875,
+ 6465153.0,
+ 31796498.0,
+ 39598816.0,
+ 29679376.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5558319432784629e-07,
+ 2.3627866330144798e-09,
+ 2.2779722552712656e-09,
+ 2.2912376440586968e-09,
+ 2.2693087409209056e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.68782387644751e-06,
+ 8.066198375900058e-08,
+ 7.781451927257876e-08,
+ 7.897661191691441e-08,
+ 7.765357423750174e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3173828125,
+ "loss_eval": 1.9328408241271973,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 27396.21484375,
+ 6507270.5,
+ 32041844.0,
+ 39890444.0,
+ 29881876.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5313091239477217e-07,
+ 2.336748128328736e-09,
+ 2.2449873071650472e-09,
+ 2.2587733905510277e-09,
+ 2.237245722014336e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.509177289146464e-06,
+ 8.020302288969106e-08,
+ 7.739499352510393e-08,
+ 7.854830386122558e-08,
+ 7.723401296289012e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.318359375,
+ "loss_eval": 1.9248214960098267,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 27461.697265625,
+ 6534744.5,
+ 32295470.0,
+ 40216712.0,
+ 30089670.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5820302223801264e-07,
+ 2.3342023869332706e-09,
+ 2.2277899525136036e-09,
+ 2.237228180490547e-09,
+ 2.2202666372095337e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.662662705522962e-06,
+ 8.017656227821135e-08,
+ 7.73198536307973e-08,
+ 7.847864225141166e-08,
+ 7.715301109101347e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.32421875,
+ "loss_eval": 1.9348523616790771,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 27519.265625,
+ 6576646.0,
+ 32533798.0,
+ 40497036.0,
+ 30273994.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5546247311704064e-07,
+ 2.332068760324546e-09,
+ 2.2422437240265936e-09,
+ 2.259832765361125e-09,
+ 2.2382042885737974e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.630303793528583e-06,
+ 7.993662620719988e-08,
+ 7.707911464649442e-08,
+ 7.823470582479786e-08,
+ 7.691809855714382e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3212890625,
+ "loss_eval": 1.9298650026321411,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 27578.833984375,
+ 6611492.0,
+ 32783444.0,
+ 40806224.0,
+ 30475316.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5486573090583988e-07,
+ 2.310989177800593e-09,
+ 2.214788796806033e-09,
+ 2.2242498953772838e-09,
+ 2.209040284029129e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.58504097070545e-06,
+ 7.973878268785484e-08,
+ 7.692549530702308e-08,
+ 7.808419866250915e-08,
+ 7.67675771840004e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.314453125,
+ "loss_eval": 1.9349405765533447,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 27637.01953125,
+ 6652277.0,
+ 32940606.0,
+ 41021348.0,
+ 30603354.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5176895828972192e-07,
+ 2.309274771405967e-09,
+ 2.2196366966653613e-09,
+ 2.2291524182094236e-09,
+ 2.212444005778025e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.506617061560974e-06,
+ 7.949277147645262e-08,
+ 7.665874335316403e-08,
+ 7.781166289078101e-08,
+ 7.6499844681166e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.32421875,
+ "loss_eval": 1.9272165298461914,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 27665.341796875,
+ 6675607.5,
+ 33128100.0,
+ 41256448.0,
+ 30754874.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.570084151580886e-07,
+ 2.2943660304974856e-09,
+ 2.2026656054663363e-09,
+ 2.2121668941110784e-09,
+ 2.1966797270067673e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.71559165918734e-06,
+ 7.9600532387758e-08,
+ 7.679192037812754e-08,
+ 7.795681966626944e-08,
+ 7.663498990950757e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3115234375,
+ "loss_eval": 1.941681146621704,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 27715.794921875,
+ 6709802.5,
+ 33331388.0,
+ 41504024.0,
+ 30915288.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5387240637210198e-07,
+ 2.3100528157016242e-09,
+ 2.2238448860179005e-09,
+ 2.2321375858780357e-09,
+ 2.2150188350167355e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.473335921938997e-06,
+ 7.898351128687864e-08,
+ 7.616839781121598e-08,
+ 7.73214452465254e-08,
+ 7.601196472251104e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.33203125,
+ "loss_eval": 1.9246938228607178,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 27766.177734375,
+ 6726091.5,
+ 33455028.0,
+ 41663816.0,
+ 31007976.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5595279023727926e-07,
+ 2.298697898694968e-09,
+ 2.2091579676697393e-09,
+ 2.215150729512061e-09,
+ 2.1983310727335947e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.587340173311532e-06,
+ 7.91313112813441e-08,
+ 7.627861009495973e-08,
+ 7.743443575236597e-08,
+ 7.611913588334573e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3232421875,
+ "loss_eval": 1.931347370147705,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 27818.396484375,
+ 6749941.5,
+ 33562528.0,
+ 41806788.0,
+ 31089946.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.542799026310604e-07,
+ 2.3069177679246877e-09,
+ 2.2149184708553094e-09,
+ 2.2274431188407107e-09,
+ 2.2138819666395193e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.57066185947042e-06,
+ 7.899650000808833e-08,
+ 7.612889874053508e-08,
+ 7.72842909668725e-08,
+ 7.59681810791335e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.328125,
+ "loss_eval": 1.9290614128112793,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 27874.181640625,
+ 6776020.5,
+ 33686440.0,
+ 41956108.0,
+ 31183962.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5547591658560123e-07,
+ 2.2904955709890373e-09,
+ 2.199639581590418e-09,
+ 2.2111712461025945e-09,
+ 2.1966135577144996e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.538461199554149e-06,
+ 7.882318442398173e-08,
+ 7.600280582664709e-08,
+ 7.715882333059199e-08,
+ 7.58423581714851e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3369140625,
+ "loss_eval": 1.9268429279327393,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 27928.552734375,
+ 6790532.0,
+ 33797660.0,
+ 42095308.0,
+ 31270040.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5469180425498053e-07,
+ 2.3010513494625684e-09,
+ 2.2103030516973377e-09,
+ 2.2237711672090654e-09,
+ 2.206205884647261e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.510661584499758e-06,
+ 7.866238149745186e-08,
+ 7.584375794067455e-08,
+ 7.699873805222524e-08,
+ 7.568271342961452e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3291015625,
+ "loss_eval": 1.9229360818862915,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 27959.18359375,
+ 6814900.0,
+ 33951204.0,
+ 42283796.0,
+ 31402056.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5280090792657575e-07,
+ 2.2722823622700616e-09,
+ 2.182985348042621e-09,
+ 2.195454484876791e-09,
+ 2.1783830295163398e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.445489922654815e-06,
+ 7.852113270701011e-08,
+ 7.573528648663341e-08,
+ 7.688608150147047e-08,
+ 7.557830628002193e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3232421875,
+ "loss_eval": 1.9262363910675049,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 27969.6171875,
+ 6828402.0,
+ 34031784.0,
+ 42376960.0,
+ 31453510.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5404552300424257e-07,
+ 2.2810822120078456e-09,
+ 2.1932544669311937e-09,
+ 2.216228756068972e-09,
+ 2.193953241302893e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.498375220573507e-06,
+ 7.844284510838406e-08,
+ 7.562837112118359e-08,
+ 7.677955693452532e-08,
+ 7.546795188773103e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.330078125,
+ "loss_eval": 1.925222396850586,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 27976.40625,
+ 6839237.5,
+ 34096948.0,
+ 42451852.0,
+ 31495834.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5588855717396655e-07,
+ 2.290766465407046e-09,
+ 2.2075170580393433e-09,
+ 2.2167860880273338e-09,
+ 2.1972801356184846e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.528901500743814e-06,
+ 7.844620597552421e-08,
+ 7.561048676052451e-08,
+ 7.67637402532273e-08,
+ 7.544804248027503e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3427734375,
+ "loss_eval": 1.9254777431488037,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 28004.76953125,
+ 6848695.0,
+ 34154160.0,
+ 42523512.0,
+ 31536314.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.562642069075082e-07,
+ 2.289735068217169e-09,
+ 2.2051671599854217e-09,
+ 2.2135104860154797e-09,
+ 2.188419445658951e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.512452379567549e-06,
+ 7.840634452804807e-08,
+ 7.557503778343744e-08,
+ 7.672917234913257e-08,
+ 7.541159163793054e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.341796875,
+ "loss_eval": 1.9253835678100586,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 28036.138671875,
+ 6859844.5,
+ 34231564.0,
+ 42620400.0,
+ 31595422.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5447380974364933e-07,
+ 2.2824857559555767e-09,
+ 2.1902821778496673e-09,
+ 2.2037338620606306e-09,
+ 2.183933034416441e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.456872248847503e-06,
+ 7.838458770947909e-08,
+ 7.556796077778927e-08,
+ 7.67221948194674e-08,
+ 7.540831603591869e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.333984375,
+ "loss_eval": 1.9241688251495361,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 28063.341796875,
+ 6866642.0,
+ 34298612.0,
+ 42705280.0,
+ 31647722.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.550155843688117e-07,
+ 2.281024480410565e-09,
+ 2.1895063540000592e-09,
+ 2.20287676988562e-09,
+ 2.1853003850935693e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.501630302111153e-06,
+ 7.833479287455702e-08,
+ 7.55063354063168e-08,
+ 7.666048418286664e-08,
+ 7.534579538059916e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.333984375,
+ "loss_eval": 1.9253199100494385,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 28090.240234375,
+ 6875769.0,
+ 34361584.0,
+ 42782612.0,
+ 31697334.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.536338629648526e-07,
+ 2.267983800763318e-09,
+ 2.1772310621059887e-09,
+ 2.1934687399749464e-09,
+ 2.1765453883659802e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.536663128528744e-06,
+ 7.836315774056857e-08,
+ 7.554304914947352e-08,
+ 7.669789425790441e-08,
+ 7.538390178751797e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3203125,
+ "loss_eval": 1.9292113780975342,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 28114.236328125,
+ 6884728.0,
+ 34407252.0,
+ 42840440.0,
+ 31732750.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5464524949493352e-07,
+ 2.280014399502761e-09,
+ 2.1917956338768363e-09,
+ 2.2101085406234233e-09,
+ 2.1894293045221502e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.505700290901586e-06,
+ 7.817885716576711e-08,
+ 7.534623591709533e-08,
+ 7.650118760693658e-08,
+ 7.518445244159011e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3310546875,
+ "loss_eval": 1.9261689186096191,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 28132.669921875,
+ 6893751.5,
+ 34460884.0,
+ 42910656.0,
+ 31780534.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5502969574754388e-07,
+ 2.2780193287275097e-09,
+ 2.1857382570544814e-09,
+ 2.200839510635433e-09,
+ 2.1766897173591815e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.460140972805675e-06,
+ 7.810618996018093e-08,
+ 7.528173284754303e-08,
+ 7.643409105639876e-08,
+ 7.512058886049999e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.333984375,
+ "loss_eval": 1.9239721298217773,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 28148.599609375,
+ 6899411.0,
+ 34495884.0,
+ 42954048.0,
+ 31804918.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5502014605317527e-07,
+ 2.2734785165567928e-09,
+ 2.191139492069283e-09,
+ 2.201265170143074e-09,
+ 2.182727776300908e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.466436495131347e-06,
+ 7.804617752071863e-08,
+ 7.521869349602639e-08,
+ 7.63711227591557e-08,
+ 7.50560502638109e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3369140625,
+ "loss_eval": 1.9230663776397705,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 28162.9609375,
+ 6901370.5,
+ 34523684.0,
+ 42989220.0,
+ 31824814.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5575578515836241e-07,
+ 2.2783777087198587e-09,
+ 2.1914692283075965e-09,
+ 2.19572404702717e-09,
+ 2.1778470138400507e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.514466910331976e-06,
+ 7.809557445170867e-08,
+ 7.525108713934969e-08,
+ 7.640503696393353e-08,
+ 7.508738519845792e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3447265625,
+ "loss_eval": 1.9263484477996826,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 28175.54296875,
+ 6907143.0,
+ 34559816.0,
+ 43035484.0,
+ 31854504.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5354446247783926e-07,
+ 2.272713128803616e-09,
+ 2.1856987331148048e-09,
+ 2.2020374412790034e-09,
+ 2.1765065305601183e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.444916940992698e-06,
+ 7.799643242378806e-08,
+ 7.51774322793608e-08,
+ 7.632959864167788e-08,
+ 7.50167856722328e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3349609375,
+ "loss_eval": 1.9226629734039307,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 28185.98046875,
+ 6908239.0,
+ 34575728.0,
+ 43054472.0,
+ 31863434.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5382977380795637e-07,
+ 2.274502586274707e-09,
+ 2.1870079081054428e-09,
+ 2.1993444843104726e-09,
+ 2.181675506918168e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.480510016146582e-06,
+ 7.80089948193563e-08,
+ 7.51953308508746e-08,
+ 7.635033938413471e-08,
+ 7.503523846708049e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3359375,
+ "loss_eval": 1.92463219165802,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 28195.05078125,
+ 6911853.0,
+ 34606972.0,
+ 43094588.0,
+ 31890320.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5355996652033355e-07,
+ 2.2723862791451666e-09,
+ 2.1887525125663387e-09,
+ 2.1977624165003817e-09,
+ 2.1820119044946296e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.450015568290837e-06,
+ 7.795882339678428e-08,
+ 7.514577760048269e-08,
+ 7.629873266523646e-08,
+ 7.498609022604796e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3388671875,
+ "loss_eval": 1.9231452941894531,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 28202.009765625,
+ 6911585.0,
+ 34614424.0,
+ 43102544.0,
+ 31893396.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5335498915192147e-07,
+ 2.273481403136657e-09,
+ 2.18971196730422e-09,
+ 2.201623994224633e-09,
+ 2.179575853133997e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.466421943216119e-06,
+ 7.796668910486915e-08,
+ 7.514941557928978e-08,
+ 7.630385567836129e-08,
+ 7.498929477378624e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3349609375,
+ "loss_eval": 1.9242045879364014,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 28207.30078125,
+ 6912594.5,
+ 34624228.0,
+ 43114124.0,
+ 31900214.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.541789487191636e-07,
+ 2.26694063520938e-09,
+ 2.1774959613196643e-09,
+ 2.1911708003585773e-09,
+ 2.177005020698175e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.48972228798084e-06,
+ 7.800251466960617e-08,
+ 7.518539746342867e-08,
+ 7.634076126805667e-08,
+ 7.502466559117238e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3349609375,
+ "loss_eval": 1.9264299869537354,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 28210.744140625,
+ 6914176.5,
+ 34633372.0,
+ 43125584.0,
+ 31907212.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5396986441373883e-07,
+ 2.2685893164009485e-09,
+ 2.182473091139059e-09,
+ 2.2001969135487798e-09,
+ 2.1797674776280473e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.470595614402555e-06,
+ 7.796354850597709e-08,
+ 7.514324096291602e-08,
+ 7.629726184177343e-08,
+ 7.498252330151445e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.3388671875,
+ "loss_eval": 1.9243674278259277,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 28213.134765625,
+ 6914654.0,
+ 34637116.0,
+ 43129968.0,
+ 31909774.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5392139118830528e-07,
+ 2.2676351907335857e-09,
+ 2.181399949563456e-09,
+ 2.194956438827944e-09,
+ 2.1772521563434566e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.468548341828864e-06,
+ 7.796590040243245e-08,
+ 7.514832134347671e-08,
+ 7.630251985801806e-08,
+ 7.498784526660529e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.33984375,
+ "loss_eval": 1.9245264530181885,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 28214.392578125,
+ 6914571.0,
+ 34637992.0,
+ 43130936.0,
+ 31909692.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5425968058480066e-07,
+ 2.2704826907471443e-09,
+ 2.18207008018112e-09,
+ 2.1958874718563948e-09,
+ 2.177970914729599e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.473776117374655e-06,
+ 7.796563039619286e-08,
+ 7.514674393860332e-08,
+ 7.63012906190852e-08,
+ 7.498606890976589e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.337890625,
+ "loss_eval": 1.9245213270187378,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 28215.587890625,
+ 6915082.0,
+ 34641648.0,
+ 43135608.0,
+ 31912816.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5412730647312856e-07,
+ 2.2691615253478403e-09,
+ 2.181160807523952e-09,
+ 2.1947776929209795e-09,
+ 2.1773913783107446e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.472671081312e-06,
+ 7.796593592956924e-08,
+ 7.514773869843339e-08,
+ 7.630221432464168e-08,
+ 7.498719867271575e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.337890625,
+ "loss_eval": 1.9246418476104736,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 28216.130859375,
+ 6915161.5,
+ 34642452.0,
+ 43136600.0,
+ 31913348.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5420548038491688e-07,
+ 2.2695016976825855e-09,
+ 2.1805732774993203e-09,
+ 2.1951678252918327e-09,
+ 2.1776345171531375e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.474650141783059e-06,
+ 7.796723622277568e-08,
+ 7.514872635283609e-08,
+ 7.63033014550274e-08,
+ 7.498815079998167e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.337890625,
+ "loss_eval": 1.9247386455535889,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 28216.1875,
+ 6915194.0,
+ 34642580.0,
+ 43136768.0,
+ 31913448.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 1.5419134058447526e-07,
+ 2.2693393830763853e-09,
+ 2.180579494748258e-09,
+ 2.194876502770171e-09,
+ 2.1777446512771803e-09
+ ],
+ "bp_grad_norms_F": [
+ 9.474156286159996e-06,
+ 7.796705148166438e-08,
+ 7.51486410877078e-08,
+ 7.630320908447175e-08,
+ 7.498806553485338e-08
+ ],
+ "gamma_dfa": NaN,
+ "acc_eval": 0.337890625,
+ "loss_eval": 1.9247117042541504,
+ "epoch": 100
+ }
+ ],
+ "seed": 42,
+ "depth": 4,
+ "d_hidden": 256
+} \ No newline at end of file