{ "config": { "output_dir": "results/h2_no_residual_full_s42", "epochs": 100, "lr": 0.001, "wd": 0.01, "seed": 42, "depth": 4, "d_hidden": 256, "log_every": 1, "no_residual_add": true, "w2_std": 0.5 }, "depth": 4, "d_hidden": 256, "num_classes": 10, "bp_log": [ { "hidden_norms": [ 8.718070030212402, 42.802223205566406, 44.22697067260742, 46.05121994018555, 46.896766662597656 ], "bp_grad_norms_per_sample_med": [ 0.0010791289387270808, 0.0002035950165009126, 0.00014324457151815295, 0.00011542177526280284, 9.846547618508339e-05 ], "bp_grad_norms_F": [ 0.0380445197224617, 0.00666962843388319, 0.0046500470489263535, 0.003719294909387827, 0.003155440790578723 ], "gamma_dfa": NaN, "acc_eval": 0.080078125, "loss_eval": 2.446239709854126, "epoch": 0 }, { "hidden_norms": [ 86.00836944580078, 130.30899047851562, 107.6886215209961, 127.31951141357422, 155.31224060058594 ], "bp_grad_norms_per_sample_med": [ 5.636421337840147e-05, 4.504464232013561e-05, 4.254864325048402e-05, 4.0549883124185726e-05, 3.8371628761524335e-05 ], "bp_grad_norms_F": [ 0.0019479888724163175, 0.0014867106219753623, 0.0013919975608587265, 0.001322419848293066, 0.0012390650808811188 ], "gamma_dfa": NaN, "acc_eval": 0.1435546875, "loss_eval": 2.293787717819214, "epoch": 1 }, { "hidden_norms": [ 114.72047424316406, 154.09420776367188, 128.2491455078125, 160.83230590820312, 193.06747436523438 ], "bp_grad_norms_per_sample_med": [ 4.478770642890595e-05, 3.7948859244352207e-05, 3.570393528207205e-05, 3.381549322512001e-05, 3.158334220643155e-05 ], "bp_grad_norms_F": [ 0.0015459235291928053, 0.0012464966857805848, 0.0011667043436318636, 0.0010993058094754815, 0.0010170178720727563 ], "gamma_dfa": NaN, "acc_eval": 0.1728515625, "loss_eval": 2.2832698822021484, "epoch": 2 }, { "hidden_norms": [ 129.28399658203125, 169.31143188476562, 136.48431396484375, 176.9506378173828, 216.20181274414062 ], "bp_grad_norms_per_sample_med": [ 4.090799848199822e-05, 3.4604578104335815e-05, 3.2474679755978286e-05, 3.0787930882070214e-05, 2.844005575752817e-05 ], "bp_grad_norms_F": [ 0.0014615722466260195, 0.0011723904171958566, 0.0010821294272318482, 0.001009885803796351, 0.000921491184271872 ], "gamma_dfa": NaN, "acc_eval": 0.177734375, "loss_eval": 2.248687267303467, "epoch": 3 }, { "hidden_norms": [ 146.55203247070312, 179.31271362304688, 144.7793426513672, 195.2471923828125, 244.1785888671875 ], "bp_grad_norms_per_sample_med": [ 3.7983172660460696e-05, 3.2681429729564115e-05, 3.063849362661131e-05, 2.877583210647572e-05, 2.62654539255891e-05 ], "bp_grad_norms_F": [ 0.0013270865892991424, 0.0011031923349946737, 0.0010214283829554915, 0.0009468899224884808, 0.0008542603463865817 ], "gamma_dfa": NaN, "acc_eval": 0.201171875, "loss_eval": 2.1866140365600586, "epoch": 4 }, { "hidden_norms": [ 163.96316528320312, 186.10421752929688, 151.66432189941406, 204.73275756835938, 266.4998474121094 ], "bp_grad_norms_per_sample_med": [ 3.63540711987298e-05, 3.1559447961626574e-05, 2.965202475024853e-05, 2.767328805930447e-05, 2.4988346922327764e-05 ], "bp_grad_norms_F": [ 0.0012765713036060333, 0.0010719435522332788, 0.0009894924005493522, 0.0009105658973567188, 0.0008120943675749004 ], "gamma_dfa": NaN, "acc_eval": 0.205078125, "loss_eval": 2.213620185852051, "epoch": 5 }, { "hidden_norms": [ 173.03375244140625, 192.33702087402344, 151.7676544189453, 211.76028442382812, 273.14984130859375 ], "bp_grad_norms_per_sample_med": [ 3.612042564782314e-05, 3.138732790830545e-05, 2.92498261842411e-05, 2.741635762504302e-05, 2.4648286853334866e-05 ], "bp_grad_norms_F": [ 0.0012719081714749336, 0.0010634849313646555, 0.0009788337629288435, 0.0008956211968325078, 0.0007930789142847061 ], "gamma_dfa": NaN, "acc_eval": 0.201171875, "loss_eval": 2.20696759223938, "epoch": 6 }, { "hidden_norms": [ 184.99200439453125, 200.6100311279297, 154.7901611328125, 216.4141387939453, 294.1932067871094 ], "bp_grad_norms_per_sample_med": [ 3.5208213375881314e-05, 3.101788752246648e-05, 2.887230584747158e-05, 2.6716055799624883e-05, 2.381021658948157e-05 ], "bp_grad_norms_F": [ 0.0012596799060702324, 0.0010643631685525179, 0.0009746645228005946, 0.0008811713196337223, 0.0007715557585470378 ], "gamma_dfa": NaN, "acc_eval": 0.189453125, "loss_eval": 2.26588773727417, "epoch": 7 }, { "hidden_norms": [ 199.71249389648438, 206.28636169433594, 159.15716552734375, 225.3829803466797, 316.6280517578125 ], "bp_grad_norms_per_sample_med": [ 3.397777982172556e-05, 3.0055914976401255e-05, 2.8245711291674525e-05, 2.577536906755995e-05, 2.2829581212135963e-05 ], "bp_grad_norms_F": [ 0.0012129175011068583, 0.0010332722449675202, 0.0009465343900956213, 0.0008514428627677262, 0.0007388851954601705 ], "gamma_dfa": NaN, "acc_eval": 0.203125, "loss_eval": 2.232454776763916, "epoch": 8 }, { "hidden_norms": [ 209.29306030273438, 211.71087646484375, 155.6585235595703, 229.6345672607422, 335.6332092285156 ], "bp_grad_norms_per_sample_med": [ 3.381286660442129e-05, 3.0025108571862802e-05, 2.795294494717382e-05, 2.5483084755251184e-05, 2.2450465621659532e-05 ], "bp_grad_norms_F": [ 0.001203069812618196, 0.0010322949383407831, 0.0009428044431842864, 0.0008445970015600324, 0.0007283088052645326 ], "gamma_dfa": NaN, "acc_eval": 0.189453125, "loss_eval": 2.2567524909973145, "epoch": 9 }, { "hidden_norms": [ 219.5225067138672, 215.77891540527344, 158.00711059570312, 239.82870483398438, 364.106689453125 ], "bp_grad_norms_per_sample_med": [ 3.357209061505273e-05, 3.0128332582535222e-05, 2.8080758056603372e-05, 2.5434510462218896e-05, 2.2072978026699275e-05 ], "bp_grad_norms_F": [ 0.001222757389768958, 0.0010488828411325812, 0.0009540626197122037, 0.000844798400066793, 0.0007152045727707446 ], "gamma_dfa": NaN, "acc_eval": 0.1884765625, "loss_eval": 2.298661708831787, "epoch": 10 }, { "hidden_norms": [ 228.8721160888672, 219.33489990234375, 159.22947692871094, 242.5733642578125, 373.5672607421875 ], "bp_grad_norms_per_sample_med": [ 3.361105336807668e-05, 3.0123681426630355e-05, 2.82819164567627e-05, 2.5511151761747897e-05, 2.200892413384281e-05 ], "bp_grad_norms_F": [ 0.0012033756356686354, 0.0010383055778220296, 0.0009499595616944134, 0.0008407059940509498, 0.000707409402821213 ], "gamma_dfa": NaN, "acc_eval": 0.18359375, "loss_eval": 2.3219099044799805, "epoch": 11 }, { "hidden_norms": [ 238.0825958251953, 220.4098663330078, 157.96127319335938, 246.49105834960938, 399.103515625 ], "bp_grad_norms_per_sample_med": [ 3.3689280826365575e-05, 3.044224104087334e-05, 2.8301144993747585e-05, 2.544306880736258e-05, 2.16337175515946e-05 ], "bp_grad_norms_F": [ 0.0012109626550227404, 0.0010498397750779986, 0.0009549973183311522, 0.0008336003520525992, 0.0006956221768632531 ], "gamma_dfa": NaN, "acc_eval": 0.197265625, "loss_eval": 2.292271614074707, "epoch": 12 }, { "hidden_norms": [ 245.9247589111328, 225.1177520751953, 161.000244140625, 247.5177001953125, 405.64068603515625 ], "bp_grad_norms_per_sample_med": [ 3.318578455946408e-05, 2.9796459784847684e-05, 2.778910129563883e-05, 2.4826545995892957e-05, 2.1260259018163197e-05 ], "bp_grad_norms_F": [ 0.0012085892958566546, 0.0010467838728800416, 0.0009537216974422336, 0.0008304294897243381, 0.0006893921527080238 ], "gamma_dfa": NaN, "acc_eval": 0.1865234375, "loss_eval": 2.309349536895752, "epoch": 13 }, { "hidden_norms": [ 254.78964233398438, 226.26568603515625, 158.11354064941406, 246.54937744140625, 402.22564697265625 ], "bp_grad_norms_per_sample_med": [ 3.351089617353864e-05, 3.0367529689101502e-05, 2.8210330128786154e-05, 2.5112614821409807e-05, 2.127070547430776e-05 ], "bp_grad_norms_F": [ 0.0012080274755135179, 0.0010523217497393489, 0.0009614708251319826, 0.0008391732117161155, 0.0006922443280927837 ], "gamma_dfa": NaN, "acc_eval": 0.177734375, "loss_eval": 2.3668038845062256, "epoch": 14 }, { "hidden_norms": [ 262.1316833496094, 226.88943481445312, 157.7928009033203, 248.3592529296875, 416.15966796875 ], "bp_grad_norms_per_sample_med": [ 3.413746162550524e-05, 3.107329393969849e-05, 2.889345705625601e-05, 2.570425385783892e-05, 2.1452229702845216e-05 ], "bp_grad_norms_F": [ 0.0012374932412058115, 0.001085828524082899, 0.0009924235055223107, 0.0008545225136913359, 0.0006974710267968476 ], "gamma_dfa": NaN, "acc_eval": 0.1650390625, "loss_eval": 2.3762776851654053, "epoch": 15 }, { "hidden_norms": [ 270.8565979003906, 227.8741455078125, 160.908935546875, 249.23391723632812, 426.4018859863281 ], "bp_grad_norms_per_sample_med": [ 3.346315133967437e-05, 3.0396649890462868e-05, 2.8140580980107188e-05, 2.509099431335926e-05, 2.0963307179044932e-05 ], "bp_grad_norms_F": [ 0.0012071001110598445, 0.0010572251630946994, 0.0009650305728428066, 0.0008328591356985271, 0.0006829687627032399 ], "gamma_dfa": NaN, "acc_eval": 0.1748046875, "loss_eval": 2.3659489154815674, "epoch": 16 }, { "hidden_norms": [ 277.88897705078125, 229.93283081054688, 160.6474151611328, 249.1276092529297, 439.88336181640625 ], "bp_grad_norms_per_sample_med": [ 3.291336179245263e-05, 3.02154276141664e-05, 2.813426181091927e-05, 2.503528776287567e-05, 2.0815306925214827e-05 ], "bp_grad_norms_F": [ 0.0011904252460226417, 0.0010531789157539606, 0.000964420149102807, 0.0008325970848090947, 0.0006798306130804121 ], "gamma_dfa": NaN, "acc_eval": 0.17578125, "loss_eval": 2.3654253482818604, "epoch": 17 }, { "hidden_norms": [ 286.05938720703125, 230.5788116455078, 160.4178009033203, 247.1944122314453, 438.8507995605469 ], "bp_grad_norms_per_sample_med": [ 3.318934977869503e-05, 3.0551069357898086e-05, 2.8402588213793933e-05, 2.525982381484937e-05, 2.0943261915817857e-05 ], "bp_grad_norms_F": [ 0.0012075696140527725, 0.001069555408321321, 0.0009757071966305375, 0.0008412246825173497, 0.0006814986118115485 ], "gamma_dfa": NaN, "acc_eval": 0.1748046875, "loss_eval": 2.3814916610717773, "epoch": 18 }, { "hidden_norms": [ 291.21563720703125, 232.70465087890625, 157.34620666503906, 246.0981903076172, 446.42889404296875 ], "bp_grad_norms_per_sample_med": [ 3.315764479339123e-05, 3.062548057641834e-05, 2.8670148822129704e-05, 2.5318840926047415e-05, 2.096824573527556e-05 ], "bp_grad_norms_F": [ 0.0012071789242327213, 0.0010707362089306116, 0.0009821956045925617, 0.0008455720380879939, 0.0006821187562309206 ], "gamma_dfa": NaN, "acc_eval": 0.1728515625, "loss_eval": 2.4200758934020996, "epoch": 19 }, { "hidden_norms": [ 296.9744873046875, 232.92347717285156, 155.9208221435547, 242.89227294921875, 464.36663818359375 ], "bp_grad_norms_per_sample_med": [ 3.340119292261079e-05, 3.0905790481483564e-05, 2.8828215363319032e-05, 2.5400462618563324e-05, 2.0934525309712626e-05 ], "bp_grad_norms_F": [ 0.001213042763993144, 0.001074956264346838, 0.000986237544566393, 0.0008489739266224205, 0.0006839185953140259 ], "gamma_dfa": NaN, "acc_eval": 0.1669921875, "loss_eval": 2.4464807510375977, "epoch": 20 }, { "hidden_norms": [ 302.8837890625, 232.27020263671875, 156.21949768066406, 240.65646362304688, 465.4597473144531 ], "bp_grad_norms_per_sample_med": [ 3.269123408244923e-05, 3.057413414353505e-05, 2.8494312573457137e-05, 2.536452484491747e-05, 2.0975066945538856e-05 ], "bp_grad_norms_F": [ 0.0011949212057515979, 0.0010672758799046278, 0.0009809982730075717, 0.0008468242012895644, 0.0006826177705079317 ], "gamma_dfa": NaN, "acc_eval": 0.171875, "loss_eval": 2.4423742294311523, "epoch": 21 }, { "hidden_norms": [ 309.28985595703125, 234.24151611328125, 157.79649353027344, 237.83340454101562, 481.6331787109375 ], "bp_grad_norms_per_sample_med": [ 3.304004712845199e-05, 3.070462844334543e-05, 2.8894632123410702e-05, 2.556288927735295e-05, 2.0964585928595625e-05 ], "bp_grad_norms_F": [ 0.00119681132491678, 0.001071512931957841, 0.0009897719137370586, 0.0008524276199750602, 0.0006829827907495201 ], "gamma_dfa": NaN, "acc_eval": 0.1591796875, "loss_eval": 2.4570655822753906, "epoch": 22 }, { "hidden_norms": [ 313.0410461425781, 231.53106689453125, 157.91920471191406, 237.67922973632812, 458.6028137207031 ], "bp_grad_norms_per_sample_med": [ 3.3489413908682764e-05, 3.1275969377020374e-05, 2.9323471608222462e-05, 2.5867013391689397e-05, 2.119375130860135e-05 ], "bp_grad_norms_F": [ 0.001231541857123375, 0.0011033288901671767, 0.001017258851788938, 0.0008692976552993059, 0.0006914011319167912 ], "gamma_dfa": NaN, "acc_eval": 0.1435546875, "loss_eval": 2.4768424034118652, "epoch": 23 }, { "hidden_norms": [ 317.760986328125, 230.58580017089844, 159.59475708007812, 231.33895874023438, 457.3432922363281 ], "bp_grad_norms_per_sample_med": [ 3.3722881198627874e-05, 3.157257742714137e-05, 2.952909198938869e-05, 2.6216532205580734e-05, 2.1260124412947334e-05 ], "bp_grad_norms_F": [ 0.0012356883380562067, 0.001110993092879653, 0.001023975433781743, 0.0008810298750177026, 0.0006986238295212388 ], "gamma_dfa": NaN, "acc_eval": 0.1611328125, "loss_eval": 2.49592661857605, "epoch": 24 }, { "hidden_norms": [ 322.651123046875, 232.43505859375, 152.87049865722656, 231.94496154785156, 473.4416198730469 ], "bp_grad_norms_per_sample_med": [ 3.427052797633223e-05, 3.222951272618957e-05, 3.0394427085411735e-05, 2.6714942578109913e-05, 2.156150912924204e-05 ], "bp_grad_norms_F": [ 0.0012650383869186044, 0.001135875703766942, 0.0010507238330319524, 0.0008947087335400283, 0.0007038050098344684 ], "gamma_dfa": NaN, "acc_eval": 0.1455078125, "loss_eval": 2.5300588607788086, "epoch": 25 }, { "hidden_norms": [ 330.46783447265625, 230.2061004638672, 152.9967498779297, 227.8012237548828, 478.8476867675781 ], "bp_grad_norms_per_sample_med": [ 3.374157677171752e-05, 3.1537194445263594e-05, 2.9856541004846804e-05, 2.6372779757366516e-05, 2.1366411601775326e-05 ], "bp_grad_norms_F": [ 0.0012416786048561335, 0.001122219255194068, 0.0010412678821012378, 0.0008921810076572001, 0.0006990613183006644 ], "gamma_dfa": NaN, "acc_eval": 0.140625, "loss_eval": 2.537388801574707, "epoch": 26 }, { "hidden_norms": [ 334.9617919921875, 229.8689727783203, 156.80023193359375, 226.36166381835938, 473.52545166015625 ], "bp_grad_norms_per_sample_med": [ 3.429998105275445e-05, 3.2245541660813615e-05, 3.0571496608899906e-05, 2.689965367608238e-05, 2.1567262592725456e-05 ], "bp_grad_norms_F": [ 0.001256743329577148, 0.0011394708417356014, 0.0010550402803346515, 0.0009035509428940713, 0.0007058348273858428 ], "gamma_dfa": NaN, "acc_eval": 0.138671875, "loss_eval": 2.5099682807922363, "epoch": 27 }, { "hidden_norms": [ 338.32244873046875, 230.9785614013672, 152.46780395507812, 224.96499633789062, 486.111083984375 ], "bp_grad_norms_per_sample_med": [ 3.443951572990045e-05, 3.224790998501703e-05, 3.0727285775355995e-05, 2.7226298698224127e-05, 2.1652953364537098e-05 ], "bp_grad_norms_F": [ 0.0012660843785852194, 0.0011493951315060258, 0.0010706180473789573, 0.0009175407467409968, 0.0007115012849681079 ], "gamma_dfa": NaN, "acc_eval": 0.1298828125, "loss_eval": 2.5662076473236084, "epoch": 28 }, { "hidden_norms": [ 342.5646057128906, 229.08815002441406, 153.96673583984375, 216.54530334472656, 468.6747131347656 ], "bp_grad_norms_per_sample_med": [ 3.46860324498266e-05, 3.2538478990318254e-05, 3.093785562668927e-05, 2.7406946173869073e-05, 2.1759695300715975e-05 ], "bp_grad_norms_F": [ 0.0012609382392838597, 0.001147899660281837, 0.0010664825094863772, 0.0009160453919321299, 0.0007114250329323113 ], "gamma_dfa": NaN, "acc_eval": 0.123046875, "loss_eval": 2.586763381958008, "epoch": 29 }, { "hidden_norms": [ 348.8407287597656, 229.21829223632812, 152.20892333984375, 214.9100799560547, 478.5781555175781 ], "bp_grad_norms_per_sample_med": [ 3.3881755371112376e-05, 3.1849580409470946e-05, 3.0435230655712076e-05, 2.698182470339816e-05, 2.157314338546712e-05 ], "bp_grad_norms_F": [ 0.0012431713985279202, 0.0011320828925818205, 0.0010550167644396424, 0.0009089091327041388, 0.000706658698618412 ], "gamma_dfa": NaN, "acc_eval": 0.1318359375, "loss_eval": 2.5531229972839355, "epoch": 30 }, { "hidden_norms": [ 351.8199768066406, 225.8287811279297, 153.97621154785156, 207.98619079589844, 449.3790588378906 ], "bp_grad_norms_per_sample_med": [ 3.457794082351029e-05, 3.269680746598169e-05, 3.108347300440073e-05, 2.75895836239215e-05, 2.188902180932928e-05 ], "bp_grad_norms_F": [ 0.0012726614950224757, 0.0011605133768171072, 0.0010800294112414122, 0.0009289697627536952, 0.0007184858550317585 ], "gamma_dfa": NaN, "acc_eval": 0.130859375, "loss_eval": 2.5874619483947754, "epoch": 31 }, { "hidden_norms": [ 353.6206359863281, 225.6538543701172, 151.9993896484375, 207.81591796875, 458.920166015625 ], "bp_grad_norms_per_sample_med": [ 3.461301821516827e-05, 3.2766867661848664e-05, 3.128241587546654e-05, 2.7638012397801504e-05, 2.198204310843721e-05 ], "bp_grad_norms_F": [ 0.001283104415051639, 0.0011686854995787144, 0.0010903337970376015, 0.0009369406034238636, 0.000721081392839551 ], "gamma_dfa": NaN, "acc_eval": 0.1376953125, "loss_eval": 2.583052635192871, "epoch": 32 }, { "hidden_norms": [ 355.174560546875, 226.53065490722656, 150.45091247558594, 200.73980712890625, 457.2731018066406 ], "bp_grad_norms_per_sample_med": [ 3.5071778256678954e-05, 3.3138821891043335e-05, 3.159284096909687e-05, 2.8334745366009884e-05, 2.23859660763992e-05 ], "bp_grad_norms_F": [ 0.0012956986902281642, 0.0011821272782981396, 0.001104547642171383, 0.0009524936904199421, 0.0007312360685318708 ], "gamma_dfa": NaN, "acc_eval": 0.12890625, "loss_eval": 2.605353832244873, "epoch": 33 }, { "hidden_norms": [ 360.4849853515625, 223.40980529785156, 148.3797607421875, 195.64169311523438, 461.1542663574219 ], "bp_grad_norms_per_sample_med": [ 3.4972203138750046e-05, 3.31850751535967e-05, 3.171996650053188e-05, 2.820813824655488e-05, 2.2246067601372488e-05 ], "bp_grad_norms_F": [ 0.0012813522480428219, 0.0011739785550162196, 0.00110049347858876, 0.0009508885559625924, 0.0007318558637052774 ], "gamma_dfa": NaN, "acc_eval": 0.1279296875, "loss_eval": 2.609264373779297, "epoch": 34 }, { "hidden_norms": [ 365.4316711425781, 222.55001831054688, 148.93753051757812, 196.41476440429688, 464.26507568359375 ], "bp_grad_norms_per_sample_med": [ 3.474177356110886e-05, 3.299827585578896e-05, 3.161515633109957e-05, 2.8241847758181393e-05, 2.233032682852354e-05 ], "bp_grad_norms_F": [ 0.001280988217331469, 0.0011732708662748337, 0.0010997118661180139, 0.0009513412951491773, 0.0007320611621253192 ], "gamma_dfa": NaN, "acc_eval": 0.123046875, "loss_eval": 2.6414568424224854, "epoch": 35 }, { "hidden_norms": [ 365.99407958984375, 220.5921173095703, 147.05055236816406, 194.5092315673828, 456.3348083496094 ], "bp_grad_norms_per_sample_med": [ 3.5159438994014636e-05, 3.344163633300923e-05, 3.1946114177117124e-05, 2.86933845927706e-05, 2.2498443286167458e-05 ], "bp_grad_norms_F": [ 0.0013043885119259357, 0.0011966620804741979, 0.0011218151776120067, 0.0009711913880892098, 0.0007424909272231162 ], "gamma_dfa": NaN, "acc_eval": 0.1337890625, "loss_eval": 2.6415724754333496, "epoch": 36 }, { "hidden_norms": [ 370.3197326660156, 220.85414123535156, 148.2594451904297, 188.3152313232422, 446.8343505859375 ], "bp_grad_norms_per_sample_med": [ 3.53947798430454e-05, 3.362595452927053e-05, 3.218940764782019e-05, 2.885511094063986e-05, 2.269916149089113e-05 ], "bp_grad_norms_F": [ 0.001304175122641027, 0.001198453363031149, 0.0011262644547969103, 0.0009740483365021646, 0.0007447644020430744 ], "gamma_dfa": NaN, "acc_eval": 0.1279296875, "loss_eval": 2.6847548484802246, "epoch": 37 }, { "hidden_norms": [ 372.6519775390625, 219.43032836914062, 146.2524871826172, 186.9598388671875, 419.9220275878906 ], "bp_grad_norms_per_sample_med": [ 3.5350865800864995e-05, 3.369166006450541e-05, 3.231317532481626e-05, 2.9215334507171065e-05, 2.2943044314160943e-05 ], "bp_grad_norms_F": [ 0.0013154788175597787, 0.0012110902462154627, 0.00113767315633595, 0.000987510895356536, 0.0007552221650257707 ], "gamma_dfa": NaN, "acc_eval": 0.134765625, "loss_eval": 2.663112163543701, "epoch": 38 }, { "hidden_norms": [ 377.5515441894531, 217.7505340576172, 144.7539520263672, 182.63914489746094, 424.8920593261719 ], "bp_grad_norms_per_sample_med": [ 3.550875771907158e-05, 3.3909564081113786e-05, 3.234989708289504e-05, 2.9385402740444988e-05, 2.3012338715489022e-05 ], "bp_grad_norms_F": [ 0.0013136330526322126, 0.0012126904912292957, 0.001143725821748376, 0.0009956557769328356, 0.000757638190407306 ], "gamma_dfa": NaN, "acc_eval": 0.1123046875, "loss_eval": 2.6713695526123047, "epoch": 39 }, { "hidden_norms": [ 375.5976867675781, 217.32119750976562, 143.29833984375, 178.9922332763672, 416.0475769042969 ], "bp_grad_norms_per_sample_med": [ 3.6261131754145026e-05, 3.459263825789094e-05, 3.311317050247453e-05, 3.0077193514443934e-05, 2.332564690732397e-05 ], "bp_grad_norms_F": [ 0.0013422674965113401, 0.0012380937114357948, 0.0011671145912259817, 0.0010137255303561687, 0.0007670389022678137 ], "gamma_dfa": NaN, "acc_eval": 0.1171875, "loss_eval": 2.6898365020751953, "epoch": 40 }, { "hidden_norms": [ 375.6454772949219, 215.73880004882812, 143.0796356201172, 173.5657958984375, 413.10693359375 ], "bp_grad_norms_per_sample_med": [ 3.5994391510030255e-05, 3.4521792258601636e-05, 3.3360858651576564e-05, 3.016969822056126e-05, 2.3851269361330196e-05 ], "bp_grad_norms_F": [ 0.0013558906503021717, 0.0012535321293398738, 0.0011830577859655023, 0.0010295362444594502, 0.0007781152380630374 ], "gamma_dfa": NaN, "acc_eval": 0.119140625, "loss_eval": 2.6808576583862305, "epoch": 41 }, { "hidden_norms": [ 381.1890869140625, 214.87374877929688, 142.17715454101562, 172.16009521484375, 413.11871337890625 ], "bp_grad_norms_per_sample_med": [ 3.590781852835789e-05, 3.450449730735272e-05, 3.32859308400657e-05, 3.011901571881026e-05, 2.3740196411381476e-05 ], "bp_grad_norms_F": [ 0.0013439194299280643, 0.0012433268129825592, 0.0011747550452128053, 0.0010278060799464583, 0.0007790841045789421 ], "gamma_dfa": NaN, "acc_eval": 0.1083984375, "loss_eval": 2.7061455249786377, "epoch": 42 }, { "hidden_norms": [ 382.1147766113281, 212.32655334472656, 142.33558654785156, 169.52694702148438, 398.5701904296875 ], "bp_grad_norms_per_sample_med": [ 3.659713547676802e-05, 3.507183282636106e-05, 3.372716673766263e-05, 3.064091288251802e-05, 2.416563620499801e-05 ], "bp_grad_norms_F": [ 0.0013747483026236296, 0.0012707116547971964, 0.0012008449994027615, 0.0010481667704880238, 0.0007909793639555573 ], "gamma_dfa": NaN, "acc_eval": 0.107421875, "loss_eval": 2.7121200561523438, "epoch": 43 }, { "hidden_norms": [ 388.24554443359375, 211.70144653320312, 141.58709716796875, 166.8690643310547, 390.73895263671875 ], "bp_grad_norms_per_sample_med": [ 3.605844176490791e-05, 3.457901402725838e-05, 3.344014839967713e-05, 3.0472821890725754e-05, 2.386603955528699e-05 ], "bp_grad_norms_F": [ 0.0013416680740192533, 0.0012422216823324561, 0.0011764775263145566, 0.0010343515314161777, 0.0007849647663533688 ], "gamma_dfa": NaN, "acc_eval": 0.1240234375, "loss_eval": 2.6901586055755615, "epoch": 44 }, { "hidden_norms": [ 387.182861328125, 211.15060424804688, 141.0326385498047, 165.57235717773438, 375.9649963378906 ], "bp_grad_norms_per_sample_med": [ 3.6760768125532195e-05, 3.520414247759618e-05, 3.39620492013637e-05, 3.100339381489903e-05, 2.4274080715258606e-05 ], "bp_grad_norms_F": [ 0.0013679155381396413, 0.0012680977815762162, 0.001201036386191845, 0.0010586031712591648, 0.0007975373882800341 ], "gamma_dfa": NaN, "acc_eval": 0.115234375, "loss_eval": 2.7196202278137207, "epoch": 45 }, { "hidden_norms": [ 389.78302001953125, 209.2168426513672, 140.19239807128906, 162.1501007080078, 373.6092529296875 ], "bp_grad_norms_per_sample_med": [ 3.6972556699765846e-05, 3.547927553881891e-05, 3.4321546991122887e-05, 3.136819213978015e-05, 2.4795872377580963e-05 ], "bp_grad_norms_F": [ 0.001378108048811555, 0.0012792085763067007, 0.0012131200637668371, 0.0010711504146456718, 0.0008094239747151732 ], "gamma_dfa": NaN, "acc_eval": 0.1123046875, "loss_eval": 2.732020854949951, "epoch": 46 }, { "hidden_norms": [ 390.8168640136719, 207.98391723632812, 140.21983337402344, 161.1061248779297, 358.555419921875 ], "bp_grad_norms_per_sample_med": [ 3.740100146387704e-05, 3.60443300451152e-05, 3.478667713352479e-05, 3.1701372790848836e-05, 2.49275763053447e-05 ], "bp_grad_norms_F": [ 0.0013912947615608573, 0.0012947055511176586, 0.0012257345952093601, 0.00108279287815094, 0.000817548600025475 ], "gamma_dfa": NaN, "acc_eval": 0.11328125, "loss_eval": 2.734851598739624, "epoch": 47 }, { "hidden_norms": [ 392.3091735839844, 206.94676208496094, 137.84091186523438, 156.7150115966797, 363.1738586425781 ], "bp_grad_norms_per_sample_med": [ 3.7181769585004076e-05, 3.575249866116792e-05, 3.458252103882842e-05, 3.156786260660738e-05, 2.489473990863189e-05 ], "bp_grad_norms_F": [ 0.0013799670850858092, 0.0012849466875195503, 0.0012195904273539782, 0.0010820929892361164, 0.0008166414918377995 ], "gamma_dfa": NaN, "acc_eval": 0.1083984375, "loss_eval": 2.730489492416382, "epoch": 48 }, { "hidden_norms": [ 392.93621826171875, 206.63357543945312, 137.95150756835938, 156.19265747070312, 348.4825744628906 ], "bp_grad_norms_per_sample_med": [ 3.750698306248523e-05, 3.625384488259442e-05, 3.4952467103721574e-05, 3.2122828997671604e-05, 2.5343802917632274e-05 ], "bp_grad_norms_F": [ 0.0014074875507503748, 0.0013119739014655352, 0.0012457441771402955, 0.0011056199437007308, 0.0008317606407217681 ], "gamma_dfa": NaN, "acc_eval": 0.10546875, "loss_eval": 2.7619447708129883, "epoch": 49 }, { "hidden_norms": [ 394.5487976074219, 204.12411499023438, 137.66342163085938, 151.4534454345703, 343.6612854003906 ], "bp_grad_norms_per_sample_med": [ 3.779921098612249e-05, 3.6266086681280285e-05, 3.5253593523520976e-05, 3.246645428589545e-05, 2.558354208304081e-05 ], "bp_grad_norms_F": [ 0.0014083774294704199, 0.0013136735651642084, 0.0012480755103752017, 0.0011111509520560503, 0.0008380677900277078 ], "gamma_dfa": NaN, "acc_eval": 0.095703125, "loss_eval": 2.7554924488067627, "epoch": 50 }, { "hidden_norms": [ 397.6114196777344, 202.55885314941406, 136.6888427734375, 150.49545288085938, 329.96112060546875 ], "bp_grad_norms_per_sample_med": [ 3.777034726226702e-05, 3.6449018807616085e-05, 3.515862044878304e-05, 3.240678779548034e-05, 2.560876600909978e-05 ], "bp_grad_norms_F": [ 0.001405128394253552, 0.001311970641836524, 0.001248166779987514, 0.0011124340817332268, 0.0008421412203460932 ], "gamma_dfa": NaN, "acc_eval": 0.10546875, "loss_eval": 2.7597320079803467, "epoch": 51 }, { "hidden_norms": [ 397.78509521484375, 202.12451171875, 135.5238800048828, 148.92816162109375, 322.4108581542969 ], "bp_grad_norms_per_sample_med": [ 3.840518184006214e-05, 3.6834608181379735e-05, 3.5840494092553854e-05, 3.275332346674986e-05, 2.6062174583785236e-05 ], "bp_grad_norms_F": [ 0.001429337658919394, 0.00133553147315979, 0.0012706448324024677, 0.001131666824221611, 0.0008531482890248299 ], "gamma_dfa": NaN, "acc_eval": 0.099609375, "loss_eval": 2.7737417221069336, "epoch": 52 }, { "hidden_norms": [ 397.3096618652344, 199.6620635986328, 134.52984619140625, 145.349853515625, 298.2867431640625 ], "bp_grad_norms_per_sample_med": [ 3.877158087561838e-05, 3.721338725881651e-05, 3.603506775107235e-05, 3.3124437322840095e-05, 2.6345343940192834e-05 ], "bp_grad_norms_F": [ 0.0014398579951375723, 0.001346803386695683, 0.0012816074304282665, 0.001146289287135005, 0.0008667311049066484 ], "gamma_dfa": NaN, "acc_eval": 0.1025390625, "loss_eval": 2.799215316772461, "epoch": 53 }, { "hidden_norms": [ 400.7160949707031, 198.93077087402344, 134.9965057373047, 147.8721923828125, 299.2564392089844 ], "bp_grad_norms_per_sample_med": [ 3.8850699638715014e-05, 3.7408095522550866e-05, 3.61659076588694e-05, 3.348653990542516e-05, 2.6619676646078005e-05 ], "bp_grad_norms_F": [ 0.0014573318185284734, 0.0013647449668496847, 0.001298584509640932, 0.001162077416665852, 0.0008761510835029185 ], "gamma_dfa": NaN, "acc_eval": 0.08984375, "loss_eval": 2.8113207817077637, "epoch": 54 }, { "hidden_norms": [ 399.78253173828125, 198.36306762695312, 132.11000061035156, 142.8116912841797, 299.17218017578125 ], "bp_grad_norms_per_sample_med": [ 3.933380503440276e-05, 3.791782364714891e-05, 3.674212348414585e-05, 3.40558253810741e-05, 2.7044263333664276e-05 ], "bp_grad_norms_F": [ 0.001484063221141696, 0.0013903625076636672, 0.0013244440779089928, 0.0011864654952660203, 0.0008941980777308345 ], "gamma_dfa": NaN, "acc_eval": 0.0888671875, "loss_eval": 2.847215175628662, "epoch": 55 }, { "hidden_norms": [ 401.17156982421875, 196.801025390625, 134.57815551757812, 139.7723388671875, 288.41851806640625 ], "bp_grad_norms_per_sample_med": [ 3.922020914615132e-05, 3.7812937080161646e-05, 3.68127366527915e-05, 3.415128594497219e-05, 2.7148824301548302e-05 ], "bp_grad_norms_F": [ 0.0014704873319715261, 0.001381139038130641, 0.0013163810363039374, 0.001184670371003449, 0.0008946889429353178 ], "gamma_dfa": NaN, "acc_eval": 0.0908203125, "loss_eval": 2.816185712814331, "epoch": 56 }, { "hidden_norms": [ 400.9927978515625, 196.3038330078125, 132.07135009765625, 139.7966766357422, 279.3277587890625 ], "bp_grad_norms_per_sample_med": [ 3.982979615102522e-05, 3.841472425847314e-05, 3.7321347917895764e-05, 3.467328497208655e-05, 2.7518768547452055e-05 ], "bp_grad_norms_F": [ 0.0014958448009565473, 0.001403261674568057, 0.0013373151887208223, 0.0012032209197059274, 0.0009093029075302184 ], "gamma_dfa": NaN, "acc_eval": 0.09765625, "loss_eval": 2.8296005725860596, "epoch": 57 }, { "hidden_norms": [ 401.6940612792969, 195.37176513671875, 131.6783447265625, 139.06954956054688, 268.53350830078125 ], "bp_grad_norms_per_sample_med": [ 3.964872666983865e-05, 3.833413211395964e-05, 3.708717122208327e-05, 3.448158531682566e-05, 2.7542468160390854e-05 ], "bp_grad_norms_F": [ 0.0014878648798912764, 0.0013977688504382968, 0.00133328081574291, 0.0012016715481877327, 0.0009097974398173392 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 2.80366849899292, "epoch": 58 }, { "hidden_norms": [ 402.2669372558594, 195.07772827148438, 130.2777099609375, 136.1566925048828, 263.0674133300781 ], "bp_grad_norms_per_sample_med": [ 4.008352698292583e-05, 3.8822814531158656e-05, 3.763332642847672e-05, 3.510116948746145e-05, 2.7965274057351053e-05 ], "bp_grad_norms_F": [ 0.0015098530566319823, 0.0014185438631102443, 0.001352492137812078, 0.0012215198948979378, 0.0009253643220290542 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 2.833949089050293, "epoch": 59 }, { "hidden_norms": [ 404.5005798339844, 192.42762756347656, 130.96656799316406, 135.46536254882812, 255.70611572265625 ], "bp_grad_norms_per_sample_med": [ 4.0377384721068665e-05, 3.883212775690481e-05, 3.7497047742363065e-05, 3.505245331325568e-05, 2.8039796234224923e-05 ], "bp_grad_norms_F": [ 0.0015065876068547368, 0.0014162716688588262, 0.0013495896710082889, 0.0012195424642413855, 0.0009257213678210974 ], "gamma_dfa": NaN, "acc_eval": 0.103515625, "loss_eval": 2.8347878456115723, "epoch": 60 }, { "hidden_norms": [ 405.3465270996094, 191.92613220214844, 129.0675048828125, 135.35177612304688, 252.48280334472656 ], "bp_grad_norms_per_sample_med": [ 4.047132460982539e-05, 3.890526568284258e-05, 3.791163908317685e-05, 3.532003393047489e-05, 2.8360002033878118e-05 ], "bp_grad_norms_F": [ 0.001506851869635284, 0.0014191134832799435, 0.0013552922755479813, 0.0012275888584554195, 0.0009371190681122243 ], "gamma_dfa": NaN, "acc_eval": 0.0947265625, "loss_eval": 2.8487884998321533, "epoch": 61 }, { "hidden_norms": [ 405.92303466796875, 191.02706909179688, 130.1326904296875, 131.96170043945312, 243.21319580078125 ], "bp_grad_norms_per_sample_med": [ 4.0983595681609586e-05, 3.9633086998946965e-05, 3.8324356864904985e-05, 3.588865001802333e-05, 2.8768741685780697e-05 ], "bp_grad_norms_F": [ 0.001533527858555317, 0.0014434503391385078, 0.0013784898910671473, 0.001250342931598425, 0.0009516954887658358 ], "gamma_dfa": NaN, "acc_eval": 0.099609375, "loss_eval": 2.853466749191284, "epoch": 62 }, { "hidden_norms": [ 404.5056457519531, 189.7686004638672, 128.53379821777344, 131.6268768310547, 239.69944763183594 ], "bp_grad_norms_per_sample_med": [ 4.129076478420757e-05, 3.997457315563224e-05, 3.881670272676274e-05, 3.6345707485452294e-05, 2.9240014555398375e-05 ], "bp_grad_norms_F": [ 0.0015445395838469267, 0.001454798853956163, 0.0013908768305554986, 0.0012628707336261868, 0.000962753314524889 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 2.864095687866211, "epoch": 63 }, { "hidden_norms": [ 406.03680419921875, 189.29116821289062, 127.50506591796875, 131.68568420410156, 233.78379821777344 ], "bp_grad_norms_per_sample_med": [ 4.1155919461743906e-05, 4.004100264864974e-05, 3.874011599691585e-05, 3.628453123383224e-05, 2.934946860477794e-05 ], "bp_grad_norms_F": [ 0.0015430431813001633, 0.0014545356389135122, 0.0013910855632275343, 0.0012647509574890137, 0.0009666763944551349 ], "gamma_dfa": NaN, "acc_eval": 0.095703125, "loss_eval": 2.8635716438293457, "epoch": 64 }, { "hidden_norms": [ 406.0451354980469, 188.50218200683594, 126.54427337646484, 131.3389129638672, 226.51025390625 ], "bp_grad_norms_per_sample_med": [ 4.183232886134647e-05, 4.0587648982182145e-05, 3.94381677324418e-05, 3.678469511214644e-05, 2.9675620680791326e-05 ], "bp_grad_norms_F": [ 0.001558265183120966, 0.0014702302869409323, 0.0014062377158552408, 0.0012798203388229012, 0.0009780466789379716 ], "gamma_dfa": NaN, "acc_eval": 0.095703125, "loss_eval": 2.8676958084106445, "epoch": 65 }, { "hidden_norms": [ 408.6777038574219, 187.3246307373047, 127.4869155883789, 129.45443725585938, 217.5286102294922 ], "bp_grad_norms_per_sample_med": [ 4.219069887767546e-05, 4.0918450395110995e-05, 3.9726855902699754e-05, 3.7175828765612096e-05, 2.9963695851620287e-05 ], "bp_grad_norms_F": [ 0.0015777976950630546, 0.001490283408202231, 0.0014262630138546228, 0.001298666698858142, 0.0009915514383465052 ], "gamma_dfa": NaN, "acc_eval": 0.0869140625, "loss_eval": 2.8961129188537598, "epoch": 66 }, { "hidden_norms": [ 407.8295593261719, 186.51223754882812, 126.99847412109375, 128.33078002929688, 215.7896270751953 ], "bp_grad_norms_per_sample_med": [ 4.240999624016695e-05, 4.097919736523181e-05, 3.9745518733980134e-05, 3.734237179742195e-05, 3.010852560692001e-05 ], "bp_grad_norms_F": [ 0.0015762250404804945, 0.00148971623275429, 0.0014267999213188887, 0.0013026067754253745, 0.0009967804653570056 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.8922109603881836, "epoch": 67 }, { "hidden_norms": [ 408.5052490234375, 185.35150146484375, 126.04090881347656, 127.63972473144531, 211.70339965820312 ], "bp_grad_norms_per_sample_med": [ 4.2915176891256124e-05, 4.142584293731488e-05, 4.0363862353842705e-05, 3.7879472074564546e-05, 3.063846452278085e-05 ], "bp_grad_norms_F": [ 0.0015976275317370892, 0.001511436770670116, 0.0014480556128546596, 0.001321145216934383, 0.001012138556689024 ], "gamma_dfa": NaN, "acc_eval": 0.08984375, "loss_eval": 2.9307312965393066, "epoch": 68 }, { "hidden_norms": [ 408.47100830078125, 185.3424835205078, 126.64398956298828, 127.55502319335938, 211.88119506835938 ], "bp_grad_norms_per_sample_med": [ 4.3488638766575605e-05, 4.180728137725964e-05, 4.041391730424948e-05, 3.8047244743211195e-05, 3.0868024623487145e-05 ], "bp_grad_norms_F": [ 0.00161185662727803, 0.0015253758756443858, 0.0014606004115194082, 0.0013330455403774977, 0.0010200685355812311 ], "gamma_dfa": NaN, "acc_eval": 0.087890625, "loss_eval": 2.932239532470703, "epoch": 69 }, { "hidden_norms": [ 408.52923583984375, 184.1455535888672, 125.52372741699219, 125.75703430175781, 202.25552368164062 ], "bp_grad_norms_per_sample_med": [ 4.348695438238792e-05, 4.2108520574402064e-05, 4.075234028277919e-05, 3.836580435745418e-05, 3.1048515666043386e-05 ], "bp_grad_norms_F": [ 0.0016183900879696012, 0.0015315954806283116, 0.0014678208390250802, 0.001341602997854352, 0.0010267652105540037 ], "gamma_dfa": NaN, "acc_eval": 0.0869140625, "loss_eval": 2.9302639961242676, "epoch": 70 }, { "hidden_norms": [ 408.8894958496094, 183.35772705078125, 125.07991027832031, 125.64179229736328, 197.8079376220703 ], "bp_grad_norms_per_sample_med": [ 4.373578849481419e-05, 4.239315967424773e-05, 4.112703027203679e-05, 3.845592436846346e-05, 3.1269701139535755e-05 ], "bp_grad_norms_F": [ 0.0016269702464342117, 0.0015422124415636063, 0.0014783325605094433, 0.001352085149846971, 0.0010349294170737267 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 2.9367189407348633, "epoch": 71 }, { "hidden_norms": [ 408.4325256347656, 182.9261932373047, 124.68492126464844, 124.7309341430664, 192.49610900878906 ], "bp_grad_norms_per_sample_med": [ 4.388380693853833e-05, 4.263465234544128e-05, 4.1247698391089216e-05, 3.877044946420938e-05, 3.1494288123212755e-05 ], "bp_grad_norms_F": [ 0.0016377014108002186, 0.0015517075080424547, 0.0014868414727970958, 0.001360182068310678, 0.0010441095801070333 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.930757999420166, "epoch": 72 }, { "hidden_norms": [ 408.14178466796875, 182.40310668945312, 124.50841522216797, 123.8620834350586, 190.0107879638672 ], "bp_grad_norms_per_sample_med": [ 4.45740224677138e-05, 4.323892426327802e-05, 4.188392267678864e-05, 3.935809581889771e-05, 3.189874405506998e-05 ], "bp_grad_norms_F": [ 0.0016554963076487184, 0.00156887574121356, 0.0015039717545732856, 0.0013761234004050493, 0.0010567718418315053 ], "gamma_dfa": NaN, "acc_eval": 0.0869140625, "loss_eval": 2.9669477939605713, "epoch": 73 }, { "hidden_norms": [ 408.57916259765625, 181.7321014404297, 124.03689575195312, 122.9704818725586, 187.95928955078125 ], "bp_grad_norms_per_sample_med": [ 4.501524745137431e-05, 4.3535896111279726e-05, 4.2307488911319524e-05, 3.976419611717574e-05, 3.218180063413456e-05 ], "bp_grad_norms_F": [ 0.0016716192476451397, 0.001584019628353417, 0.0015181623166427016, 0.0013901714701205492, 0.0010662488639354706 ], "gamma_dfa": NaN, "acc_eval": 0.0908203125, "loss_eval": 2.9710330963134766, "epoch": 74 }, { "hidden_norms": [ 408.1520690917969, 180.9037322998047, 124.13348388671875, 123.0340576171875, 186.64889526367188 ], "bp_grad_norms_per_sample_med": [ 4.489531056606211e-05, 4.363941479823552e-05, 4.237061511958018e-05, 3.981809277320281e-05, 3.235776239307597e-05 ], "bp_grad_norms_F": [ 0.0016766563057899475, 0.0015889391070231795, 0.0015231993747875094, 0.0013958020135760307, 0.0010720851132646203 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.959228515625, "epoch": 75 }, { "hidden_norms": [ 409.3914794921875, 180.49095153808594, 123.59921264648438, 122.37818145751953, 181.8359375 ], "bp_grad_norms_per_sample_med": [ 4.522506060311571e-05, 4.3832860683323815e-05, 4.2538729758234695e-05, 3.9995622501010075e-05, 3.253304384998046e-05 ], "bp_grad_norms_F": [ 0.0016819218872115016, 0.001593844499439001, 0.0015282074455171824, 0.0014012405881658196, 0.0010784030891954899 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.961671829223633, "epoch": 76 }, { "hidden_norms": [ 407.241455078125, 180.02792358398438, 123.85694885253906, 122.00341033935547, 179.4743194580078 ], "bp_grad_norms_per_sample_med": [ 4.5559816499007866e-05, 4.4125670683570206e-05, 4.277457628631964e-05, 4.0345701563637704e-05, 3.2811487471917644e-05 ], "bp_grad_norms_F": [ 0.0016946949763223529, 0.0016066118841990829, 0.0015405946178361773, 0.0014128233306109905, 0.0010864713694900274 ], "gamma_dfa": NaN, "acc_eval": 0.09765625, "loss_eval": 2.971811294555664, "epoch": 77 }, { "hidden_norms": [ 408.3240661621094, 179.1845245361328, 123.02991485595703, 121.22331237792969, 176.96409606933594 ], "bp_grad_norms_per_sample_med": [ 4.576908759190701e-05, 4.430625631357543e-05, 4.3082043703179806e-05, 4.0411658119410276e-05, 3.2916912459768355e-05 ], "bp_grad_norms_F": [ 0.0016961582005023956, 0.0016096236649900675, 0.0015443011652678251, 0.0014174508396536112, 0.0010930649004876614 ], "gamma_dfa": NaN, "acc_eval": 0.0947265625, "loss_eval": 2.974250316619873, "epoch": 78 }, { "hidden_norms": [ 409.5758972167969, 178.83154296875, 122.89900207519531, 120.96637725830078, 176.27029418945312 ], "bp_grad_norms_per_sample_med": [ 4.575210914481431e-05, 4.45544756075833e-05, 4.321682718000375e-05, 4.0704584534978494e-05, 3.307598308310844e-05 ], "bp_grad_norms_F": [ 0.0017041281098499894, 0.001617106725461781, 0.0015517985448241234, 0.0014248047955334187, 0.0010987903224304318 ], "gamma_dfa": NaN, "acc_eval": 0.0888671875, "loss_eval": 2.9865829944610596, "epoch": 79 }, { "hidden_norms": [ 408.8537902832031, 178.98573303222656, 122.46696472167969, 121.31299591064453, 173.41905212402344 ], "bp_grad_norms_per_sample_med": [ 4.6213288442231715e-05, 4.482917211134918e-05, 4.371384784462862e-05, 4.093564712093212e-05, 3.334296343382448e-05 ], "bp_grad_norms_F": [ 0.00171999994199723, 0.001632340019568801, 0.001565982005558908, 0.0014375611208379269, 0.0011084020370617509 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.993680953979492, "epoch": 80 }, { "hidden_norms": [ 408.5456848144531, 178.0683135986328, 122.94597625732422, 119.80611419677734, 171.1206817626953 ], "bp_grad_norms_per_sample_med": [ 4.6296096115838736e-05, 4.503710806602612e-05, 4.384905696497299e-05, 4.111307498533279e-05, 3.349714825162664e-05 ], "bp_grad_norms_F": [ 0.0017213152023032308, 0.0016335739055648446, 0.0015675420872867107, 0.001440141350030899, 0.001112470985390246 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 2.994321346282959, "epoch": 81 }, { "hidden_norms": [ 409.3093566894531, 177.68714904785156, 122.89625549316406, 119.95466613769531, 168.89804077148438 ], "bp_grad_norms_per_sample_med": [ 4.6671568270539865e-05, 4.528012505033985e-05, 4.418051685206592e-05, 4.1504132241243497e-05, 3.381213900865987e-05 ], "bp_grad_norms_F": [ 0.001732644159346819, 0.0016448728274554014, 0.0015783295966684818, 0.001450547482818365, 0.0011199831496924162 ], "gamma_dfa": NaN, "acc_eval": 0.0947265625, "loss_eval": 3.004246950149536, "epoch": 82 }, { "hidden_norms": [ 408.72955322265625, 177.53179931640625, 121.72450256347656, 119.71387481689453, 168.49583435058594 ], "bp_grad_norms_per_sample_med": [ 4.686604006565176e-05, 4.567100768326782e-05, 4.437788811628707e-05, 4.169986641500145e-05, 3.4023832995444536e-05 ], "bp_grad_norms_F": [ 0.0017455043271183968, 0.0016571393935009837, 0.0015903809107840061, 0.0014616175321862102, 0.001127574942074716 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 3.015833854675293, "epoch": 83 }, { "hidden_norms": [ 409.93121337890625, 177.41183471679688, 121.63835144042969, 119.78266906738281, 166.5583953857422 ], "bp_grad_norms_per_sample_med": [ 4.7002995415823534e-05, 4.566587813314982e-05, 4.4412678107619286e-05, 4.1799670725595206e-05, 3.404032759135589e-05 ], "bp_grad_norms_F": [ 0.0017475533531978726, 0.0016598458169028163, 0.0015934593975543976, 0.0014648212818428874, 0.0011309005785733461 ], "gamma_dfa": NaN, "acc_eval": 0.095703125, "loss_eval": 3.014139413833618, "epoch": 84 }, { "hidden_norms": [ 409.67083740234375, 177.14193725585938, 121.51908111572266, 119.6811294555664, 166.031982421875 ], "bp_grad_norms_per_sample_med": [ 4.713247108156793e-05, 4.586786963045597e-05, 4.4539196096593514e-05, 4.203089338261634e-05, 3.428043783060275e-05 ], "bp_grad_norms_F": [ 0.0017551736673340201, 0.001667042262852192, 0.0016005010111257434, 0.0014717906014993787, 0.0011371106375008821 ], "gamma_dfa": NaN, "acc_eval": 0.087890625, "loss_eval": 3.0291876792907715, "epoch": 85 }, { "hidden_norms": [ 410.37042236328125, 176.73268127441406, 121.4700698852539, 119.30713653564453, 163.45822143554688 ], "bp_grad_norms_per_sample_med": [ 4.7194233047775924e-05, 4.609613824868575e-05, 4.4591557525563985e-05, 4.207295205560513e-05, 3.430316428421065e-05 ], "bp_grad_norms_F": [ 0.001759424339979887, 0.0016711216885596514, 0.0016040647169575095, 0.0014759227633476257, 0.001140325446613133 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 3.0314245223999023, "epoch": 86 }, { "hidden_norms": [ 409.8002624511719, 176.60916137695312, 121.219970703125, 118.81930541992188, 164.01478576660156 ], "bp_grad_norms_per_sample_med": [ 4.7294168325606734e-05, 4.6120272600091994e-05, 4.4749522203346714e-05, 4.225381417199969e-05, 3.438722342252731e-05 ], "bp_grad_norms_F": [ 0.0017650157678872347, 0.0016766699263826013, 0.0016095110913738608, 0.0014808655250817537, 0.0011436669155955315 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 3.030081272125244, "epoch": 87 }, { "hidden_norms": [ 409.7901306152344, 176.61012268066406, 121.13548278808594, 118.5867919921875, 162.41827392578125 ], "bp_grad_norms_per_sample_med": [ 4.7548022848786786e-05, 4.6351164201041684e-05, 4.494565655477345e-05, 4.2309966374887154e-05, 3.455657861195505e-05 ], "bp_grad_norms_F": [ 0.0017697742441669106, 0.001681560999713838, 0.00161420414224267, 0.0014853639295324683, 0.0011477968655526638 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 3.0332422256469727, "epoch": 88 }, { "hidden_norms": [ 409.9271240234375, 176.3477783203125, 120.93573760986328, 118.68280029296875, 161.79257202148438 ], "bp_grad_norms_per_sample_med": [ 4.757043279823847e-05, 4.634608922060579e-05, 4.5027496526017785e-05, 4.236193490214646e-05, 3.461442975094542e-05 ], "bp_grad_norms_F": [ 0.0017714434070512652, 0.0016832581022754312, 0.0016157239442691207, 0.0014867670834064484, 0.0011494142236188054 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 3.0295891761779785, "epoch": 89 }, { "hidden_norms": [ 409.3666076660156, 176.4572296142578, 121.02136993408203, 118.42733001708984, 161.92198181152344 ], "bp_grad_norms_per_sample_med": [ 4.7602890845155343e-05, 4.65112243546173e-05, 4.5134373067412525e-05, 4.2457497329451144e-05, 3.4702385164564475e-05 ], "bp_grad_norms_F": [ 0.0017726266523823142, 0.0016847110819071531, 0.0016171842580661178, 0.0014885812997817993, 0.001151244156062603 ], "gamma_dfa": NaN, "acc_eval": 0.09375, "loss_eval": 3.0332508087158203, "epoch": 90 }, { "hidden_norms": [ 408.93438720703125, 176.05850219726562, 121.09625244140625, 118.71532440185547, 160.93397521972656 ], "bp_grad_norms_per_sample_med": [ 4.767462087329477e-05, 4.656092278310098e-05, 4.517777415458113e-05, 4.260002606315538e-05, 3.481149542494677e-05 ], "bp_grad_norms_F": [ 0.0017778765177354217, 0.0016896515153348446, 0.0016218661330640316, 0.0014927292941138148, 0.0011542538413777947 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 3.0385818481445312, "epoch": 91 }, { "hidden_norms": [ 408.2444763183594, 176.17698669433594, 120.81340789794922, 118.79690551757812, 160.8688507080078 ], "bp_grad_norms_per_sample_med": [ 4.765141420648433e-05, 4.667821849579923e-05, 4.5252400013851e-05, 4.269158671377227e-05, 3.480418672552332e-05 ], "bp_grad_norms_F": [ 0.0017795232124626637, 0.0016910110134631395, 0.0016234440263360739, 0.0014941159170120955, 0.0011556288227438927 ], "gamma_dfa": NaN, "acc_eval": 0.0908203125, "loss_eval": 3.0389466285705566, "epoch": 92 }, { "hidden_norms": [ 408.58831787109375, 176.04327392578125, 120.86355590820312, 118.54495239257812, 160.07017517089844 ], "bp_grad_norms_per_sample_med": [ 4.780395101988688e-05, 4.6777106035733595e-05, 4.532063030637801e-05, 4.271055877325125e-05, 3.487269350443967e-05 ], "bp_grad_norms_F": [ 0.001782167237251997, 0.0016936222091317177, 0.0016259904950857162, 0.0014966638991609216, 0.0011574920499697328 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 3.0411715507507324, "epoch": 93 }, { "hidden_norms": [ 408.69635009765625, 175.86227416992188, 120.84530639648438, 118.5611572265625, 159.65382385253906 ], "bp_grad_norms_per_sample_med": [ 4.7862777137197554e-05, 4.672469003708102e-05, 4.5333617890719324e-05, 4.2781779484357685e-05, 3.488900983938947e-05 ], "bp_grad_norms_F": [ 0.001782999956049025, 0.0016942995134741068, 0.0016265579033643007, 0.001497312681749463, 0.001158081111498177 ], "gamma_dfa": NaN, "acc_eval": 0.0927734375, "loss_eval": 3.0412378311157227, "epoch": 94 }, { "hidden_norms": [ 408.5793151855469, 175.8729705810547, 120.83885192871094, 118.5599365234375, 159.589111328125 ], "bp_grad_norms_per_sample_med": [ 4.793615153175779e-05, 4.6734887291677296e-05, 4.529079524218105e-05, 4.2848438170040026e-05, 3.4947173844557256e-05 ], "bp_grad_norms_F": [ 0.0017846085829660296, 0.0016958917258307338, 0.001628118334338069, 0.0014987689210101962, 0.0011592835653573275 ], "gamma_dfa": NaN, "acc_eval": 0.0908203125, "loss_eval": 3.043121576309204, "epoch": 95 }, { "hidden_norms": [ 408.6483459472656, 175.8555908203125, 120.81853485107422, 118.52471160888672, 159.30239868164062 ], "bp_grad_norms_per_sample_med": [ 4.796134089701809e-05, 4.68125035695266e-05, 4.539822111837566e-05, 4.2882278648903593e-05, 3.495233249850571e-05 ], "bp_grad_norms_F": [ 0.0017852310556918383, 0.0016965895192697644, 0.001628802390769124, 0.0014994175871834159, 0.0011597864795476198 ], "gamma_dfa": NaN, "acc_eval": 0.0908203125, "loss_eval": 3.0433754920959473, "epoch": 96 }, { "hidden_norms": [ 408.78167724609375, 175.81280517578125, 120.72789001464844, 118.362060546875, 159.2758026123047 ], "bp_grad_norms_per_sample_med": [ 4.7979057853808627e-05, 4.6818935516057536e-05, 4.545195770333521e-05, 4.2866002331720665e-05, 3.4974782465724275e-05 ], "bp_grad_norms_F": [ 0.0017855397891253233, 0.0016968693817034364, 0.0016290779458358884, 0.001499759964644909, 0.001160072861239314 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 3.0432236194610596, "epoch": 97 }, { "hidden_norms": [ 408.695068359375, 175.82485961914062, 120.68985748291016, 118.31425476074219, 159.31414794921875 ], "bp_grad_norms_per_sample_med": [ 4.796995563083328e-05, 4.685561725636944e-05, 4.54587752756197e-05, 4.2861738620558754e-05, 3.4979620977537706e-05 ], "bp_grad_norms_F": [ 0.0017854906618595123, 0.0016968429554253817, 0.001629071426577866, 0.0014998035039752722, 0.0011602065060287714 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 3.0435032844543457, "epoch": 98 }, { "hidden_norms": [ 408.69329833984375, 175.80587768554688, 120.6858901977539, 118.34341430664062, 159.32943725585938 ], "bp_grad_norms_per_sample_med": [ 4.796809298568405e-05, 4.686374086304568e-05, 4.545971387415193e-05, 4.28554521931801e-05, 3.4983324439963326e-05 ], "bp_grad_norms_F": [ 0.0017855679616332054, 0.0016969236312434077, 0.001629148842766881, 0.0014998704427853227, 0.0011602530721575022 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 3.043445348739624, "epoch": 99 }, { "hidden_norms": [ 408.6950378417969, 175.79644775390625, 120.68733978271484, 118.34892272949219, 159.32240295410156 ], "bp_grad_norms_per_sample_med": [ 4.7968002036213875e-05, 4.6864570322213694e-05, 4.546308991848491e-05, 4.2857409425778314e-05, 3.498443402349949e-05 ], "bp_grad_norms_F": [ 0.0017855766927823424, 0.0016969360876828432, 0.0016291660722345114, 0.0014998912811279297, 0.0011602782178670168 ], "gamma_dfa": NaN, "acc_eval": 0.091796875, "loss_eval": 3.0435147285461426, "epoch": 100 } ], "dfa_log": [ { "hidden_norms": [ 8.718070030212402, 42.802223205566406, 44.22697067260742, 46.05121994018555, 46.896766662597656 ], "bp_grad_norms_per_sample_med": [ 0.0010791289387270808, 0.0002035950165009126, 0.00014324457151815295, 0.00011542177526280284, 9.846547618508339e-05 ], "bp_grad_norms_F": [ 0.0380445197224617, 0.00666962843388319, 0.0046500470489263535, 0.003719294909387827, 0.003155440790578723 ], "gamma_dfa": 0.004864378133788705, "acc_eval": 0.080078125, "loss_eval": 2.446239709854126, "epoch": 0 }, { "hidden_norms": [ 1180.2318115234375, 5768.2900390625, 5472.90234375, 6369.3427734375, 5295.2470703125 ], "bp_grad_norms_per_sample_med": [ 1.2146981589467032e-06, 8.634061714474228e-07, 8.587696811446222e-07, 8.589160529481887e-07, 8.53334995554178e-07 ], "bp_grad_norms_F": [ 6.592504360014573e-05, 4.607137088896707e-05, 4.4360855099512264e-05, 4.341698149801232e-05, 4.290258584660478e-05 ], "gamma_dfa": 0.0467059058137238, "acc_eval": 0.15625, "loss_eval": 2.2713985443115234, "epoch": 1 }, { "hidden_norms": [ 2712.02197265625, 35799.15625, 30196.22265625, 31429.328125, 21571.224609375 ], "bp_grad_norms_per_sample_med": [ 3.2316361853190756e-07, 1.6252558054929978e-07, 1.6230175958753534e-07, 1.6301386551731412e-07, 1.6222111298702657e-07 ], "bp_grad_norms_F": [ 2.881550244637765e-05, 1.2372604032862e-05, 1.1472440746729262e-05, 1.1236465070396662e-05, 1.1124561751785222e-05 ], "gamma_dfa": 0.035421818611212075, "acc_eval": 0.146484375, "loss_eval": 2.335322856903076, "epoch": 2 }, { "hidden_norms": [ 4310.83203125, 104622.7734375, 77630.2421875, 78666.21875, 48679.88671875 ], "bp_grad_norms_per_sample_med": [ 1.8400233159354684e-07, 6.495802296058173e-08, 6.498943605492968e-08, 6.491647042139448e-08, 6.464611601586512e-08 ], "bp_grad_norms_F": [ 1.769972368492745e-05, 5.158871317689773e-06, 4.676893240684876e-06, 4.603746219800087e-06, 4.549533514364157e-06 ], "gamma_dfa": 0.03363112888473552, "acc_eval": 0.150390625, "loss_eval": 2.4106125831604004, "epoch": 3 }, { "hidden_norms": [ 5880.8115234375, 227753.375, 152491.703125, 155418.390625, 88801.296875 ], "bp_grad_norms_per_sample_med": [ 1.2607929988917022e-07, 3.377261137416099e-08, 3.3712492353288326e-08, 3.3661436305010284e-08, 3.362825395925029e-08 ], "bp_grad_norms_F": [ 1.548601358081214e-05, 2.78187621916004e-06, 2.4831683731463272e-06, 2.456902620906476e-06, 2.4304001726704882e-06 ], "gamma_dfa": 0.027950844378210604, "acc_eval": 0.1494140625, "loss_eval": 2.473954677581787, "epoch": 4 }, { "hidden_norms": [ 7446.83203125, 415853.34375, 244149.921875, 253104.71875, 141041.109375 ], "bp_grad_norms_per_sample_med": [ 1.0277101125666377e-07, 2.1167430475088622e-08, 2.113832486827505e-08, 2.1176427722480184e-08, 2.102850160667913e-08 ], "bp_grad_norms_F": [ 1.4487833141174633e-05, 2.0795134787476854e-06, 1.5597894389429712e-06, 1.522601451142691e-06, 1.5034931948321173e-06 ], "gamma_dfa": 0.02746052150905598, "acc_eval": 0.1435546875, "loss_eval": 2.5455238819122314, "epoch": 5 }, { "hidden_norms": [ 8986.072265625, 683627.0, 382622.5625, 394341.96875, 225869.703125 ], "bp_grad_norms_per_sample_med": [ 8.362774650549909e-08, 1.4089099664715832e-08, 1.4079772014952141e-08, 1.4096787737116756e-08, 1.4042676355074946e-08 ], "bp_grad_norms_F": [ 1.094696290238062e-05, 1.43898739679571e-06, 1.0249204933643341e-06, 1.0037305173682398e-06, 9.89082195701485e-07 ], "gamma_dfa": 0.022385360905900598, "acc_eval": 0.1416015625, "loss_eval": 2.617079973220825, "epoch": 6 }, { "hidden_norms": [ 10599.609375, 1064012.5, 545495.875, 573164.9375, 330028.71875 ], "bp_grad_norms_per_sample_med": [ 7.213265718064577e-08, 1.0183534016050544e-08, 1.0178969667151705e-08, 1.0194342259239875e-08, 1.0160833951999848e-08 ], "bp_grad_norms_F": [ 1.0159021258004941e-05, 8.805947686596483e-07, 7.233961696329061e-07, 7.142662639125774e-07, 7.038501053102664e-07 ], "gamma_dfa": 0.014009941252879798, "acc_eval": 0.1337890625, "loss_eval": 2.7312068939208984, "epoch": 7 }, { "hidden_norms": [ 12143.3994140625, 1557775.25, 759262.3125, 792826.0, 460775.59375 ], "bp_grad_norms_per_sample_med": [ 6.697734988847515e-08, 7.604014307105444e-09, 7.596973716772482e-09, 7.606048235686558e-09, 7.604833207608408e-09 ], "bp_grad_norms_F": [ 9.400837370776571e-06, 6.404222290257167e-07, 5.235326625552261e-07, 5.169007977201545e-07, 5.090913077765435e-07 ], "gamma_dfa": 0.011664194520562887, "acc_eval": 0.1328125, "loss_eval": 2.825345516204834, "epoch": 8 }, { "hidden_norms": [ 13694.29296875, 2172737.5, 997486.0625, 1070732.625, 629918.4375 ], "bp_grad_norms_per_sample_med": [ 6.409224795334012e-08, 6.097121918458015e-09, 6.086279480399526e-09, 6.08825212466968e-09, 6.0656004663428575e-09 ], "bp_grad_norms_F": [ 9.614421287551522e-06, 5.113795964462042e-07, 4.071621901857725e-07, 4.02141125732669e-07, 3.9655543560002116e-07 ], "gamma_dfa": 0.008997007156722248, "acc_eval": 0.1298828125, "loss_eval": 2.988190174102783, "epoch": 9 }, { "hidden_norms": [ 15223.474609375, 2927110.5, 1275342.625, 1378191.375, 828821.8125 ], "bp_grad_norms_per_sample_med": [ 6.029451782296746e-08, 5.071707498416345e-09, 5.069247244193775e-09, 5.075359243988942e-09, 5.0706532306321606e-09 ], "bp_grad_norms_F": [ 9.640240023145452e-06, 4.242011186761374e-07, 3.2627585255795566e-07, 3.2204775379796047e-07, 3.1740532335788885e-07 ], "gamma_dfa": 0.0051322957733646035, "acc_eval": 0.125, "loss_eval": 3.152592658996582, "epoch": 10 }, { "hidden_norms": [ 16733.46484375, 3849004.0, 1605019.5, 1758574.0, 1046866.9375 ], "bp_grad_norms_per_sample_med": [ 5.804990976798763e-08, 4.271067943761864e-09, 4.260845898329535e-09, 4.262723063419571e-09, 4.251643481723022e-09 ], "bp_grad_norms_F": [ 9.824444532569032e-06, 3.8355952369784063e-07, 2.739863020906341e-07, 2.699064225453185e-07, 2.6583589374240546e-07 ], "gamma_dfa": 0.002556616673246026, "acc_eval": 0.125, "loss_eval": 3.3216772079467773, "epoch": 11 }, { "hidden_norms": [ 18226.0703125, 4895676.0, 1964835.75, 2174918.0, 1297900.0 ], "bp_grad_norms_per_sample_med": [ 5.8149943527041614e-08, 3.753563682096228e-09, 3.750809440816738e-09, 3.756827737788626e-09, 3.745073584582315e-09 ], "bp_grad_norms_F": [ 1.0199929420195986e-05, 3.2010626682676957e-07, 2.3428944473380398e-07, 2.3066610310706892e-07, 2.272569474826014e-07 ], "gamma_dfa": -0.001056009205058217, "acc_eval": 0.1162109375, "loss_eval": 3.5638060569763184, "epoch": 12 }, { "hidden_norms": [ 19695.107421875, 6176501.5, 2397138.0, 2692062.25, 1632551.125 ], "bp_grad_norms_per_sample_med": [ 5.818218085096305e-08, 3.2458047360961473e-09, 3.240681722971317e-09, 3.251705793516635e-09, 3.2418265849543104e-09 ], "bp_grad_norms_F": [ 1.0194554306508508e-05, 2.884790433199669e-07, 2.0161056113465747e-07, 1.9845649035232782e-07, 1.9566277842386626e-07 ], "gamma_dfa": -0.003356708213686943, "acc_eval": 0.11328125, "loss_eval": 3.7695584297180176, "epoch": 13 }, { "hidden_norms": [ 21182.841796875, 7649758.0, 2859185.75, 3238327.25, 2017791.0 ], "bp_grad_norms_per_sample_med": [ 5.6009717752658617e-08, 2.8617739289416022e-09, 2.86194334897516e-09, 2.864514181410982e-09, 2.8607307633876644e-09 ], "bp_grad_norms_F": [ 9.991773367801215e-06, 2.805488747981144e-07, 1.7382579642344353e-07, 1.7105583083321108e-07, 1.6860903429005702e-07 ], "gamma_dfa": -0.004406693275086582, "acc_eval": 0.1103515625, "loss_eval": 3.9298348426818848, "epoch": 14 }, { "hidden_norms": [ 22575.759765625, 9260891.0, 3426286.0, 3904244.75, 2469897.0 ], "bp_grad_norms_per_sample_med": [ 5.523341073399024e-08, 2.458340642164103e-09, 2.4571535917061738e-09, 2.4605368853514165e-09, 2.455863956640769e-09 ], "bp_grad_norms_F": [ 9.669157407188322e-06, 2.321831686913356e-07, 1.4871888254219812e-07, 1.466667072236305e-07, 1.44689224157446e-07 ], "gamma_dfa": -0.005493569537065923, "acc_eval": 0.11328125, "loss_eval": 4.065067291259766, "epoch": 15 }, { "hidden_norms": [ 23971.93359375, 11148851.0, 3986279.5, 4682323.5, 2980997.5 ], "bp_grad_norms_per_sample_med": [ 5.2560817920266345e-08, 2.1839356989517e-09, 2.1809569705766307e-09, 2.1860839805043497e-09, 2.177982905138265e-09 ], "bp_grad_norms_F": [ 9.612061148800422e-06, 2.2171894897837774e-07, 1.2985647401819733e-07, 1.2793493908702658e-07, 1.2610371413757093e-07 ], "gamma_dfa": -0.0057282960042357445, "acc_eval": 0.1103515625, "loss_eval": 4.23506498336792, "epoch": 16 }, { "hidden_norms": [ 25387.59765625, 13199074.0, 4584581.0, 5421912.0, 3520717.25 ], "bp_grad_norms_per_sample_med": [ 5.063454011633439e-08, 1.9527632844074105e-09, 1.9520551841623046e-09, 1.956988127105319e-09, 1.9527153227727467e-09 ], "bp_grad_norms_F": [ 9.531939213047735e-06, 1.855236746450828e-07, 1.1443902536711903e-07, 1.1294694246544168e-07, 1.1146746459189671e-07 ], "gamma_dfa": -0.00637711986200884, "acc_eval": 0.1123046875, "loss_eval": 4.372166633605957, "epoch": 17 }, { "hidden_norms": [ 26803.72265625, 15607512.0, 5231978.5, 6327852.0, 4171921.5 ], "bp_grad_norms_per_sample_med": [ 5.073666287103151e-08, 1.7431257548494727e-09, 1.7403234409130164e-09, 1.7429053755790846e-09, 1.737441190918787e-09 ], "bp_grad_norms_F": [ 9.275222510041203e-06, 1.6788693812941347e-07, 1.0197032906944514e-07, 1.0054727539454689e-07, 9.927033062240298e-08 ], "gamma_dfa": -0.006377041107043624, "acc_eval": 0.1142578125, "loss_eval": 4.511043071746826, "epoch": 18 }, { "hidden_norms": [ 28166.5859375, 18256806.0, 6062269.0, 7361214.0, 4908964.5 ], "bp_grad_norms_per_sample_med": [ 4.8937458529962896e-08, 1.5624438409744812e-09, 1.5615452264583496e-09, 1.5637011685498692e-09, 1.559517959215384e-09 ], "bp_grad_norms_F": [ 9.249049981008284e-06, 1.5261937846844376e-07, 9.117609778286351e-08, 8.977448828773049e-08, 8.863072764597746e-08 ], "gamma_dfa": -0.007660938150365837, "acc_eval": 0.1171875, "loss_eval": 4.64661979675293, "epoch": 19 }, { "hidden_norms": [ 29548.751953125, 21145650.0, 6936910.0, 8491332.0, 5632708.0 ], "bp_grad_norms_per_sample_med": [ 4.774140904828528e-08, 1.397353122101208e-09, 1.3845558033409588e-09, 1.3843480806130515e-09, 1.3776775276141962e-09 ], "bp_grad_norms_F": [ 9.035198672791012e-06, 1.426667637360879e-07, 8.229534387282911e-08, 8.094935566305139e-08, 7.995085837819715e-08 ], "gamma_dfa": -0.00677196380274836, "acc_eval": 0.111328125, "loss_eval": 4.76383113861084, "epoch": 20 }, { "hidden_norms": [ 30869.275390625, 24201464.0, 7880455.0, 9702563.0, 6424945.5 ], "bp_grad_norms_per_sample_med": [ 4.703911571368735e-08, 1.2679121086378586e-09, 1.2570423590929636e-09, 1.2592289433399628e-09, 1.2545631200566731e-09 ], "bp_grad_norms_F": [ 8.886428986443207e-06, 1.178441522142748e-07, 7.369149557234778e-08, 7.258120149344904e-08, 7.175417238158843e-08 ], "gamma_dfa": -0.008610141419922002, "acc_eval": 0.1162109375, "loss_eval": 4.926914691925049, "epoch": 21 }, { "hidden_norms": [ 32181.666015625, 27506424.0, 8773789.0, 11014517.0, 7322481.5 ], "bp_grad_norms_per_sample_med": [ 4.4904634677322974e-08, 1.1420530077188573e-09, 1.121353787603141e-09, 1.124021098419803e-09, 1.120450510150306e-09 ], "bp_grad_norms_F": [ 8.90475439518923e-06, 1.1447492909155699e-07, 6.648813410947696e-08, 6.533218765980564e-08, 6.45067217419637e-08 ], "gamma_dfa": -0.007374132976110559, "acc_eval": 0.111328125, "loss_eval": 5.004192352294922, "epoch": 22 }, { "hidden_norms": [ 33471.7265625, 31266642.0, 9769161.0, 12538190.0, 8328704.0 ], "bp_grad_norms_per_sample_med": [ 4.517446683394155e-08, 1.0276371975592724e-09, 1.005762251260478e-09, 1.0072189748910887e-09, 1.0049648890841922e-09 ], "bp_grad_norms_F": [ 8.657435500936117e-06, 1.0238768766157591e-07, 6.021300436032107e-08, 5.9172805322305067e-08, 5.8442100936417773e-08 ], "gamma_dfa": -0.006727739999405458, "acc_eval": 0.1123046875, "loss_eval": 5.116036415100098, "epoch": 23 }, { "hidden_norms": [ 34792.7890625, 35134068.0, 11038143.0, 14059113.0, 9444097.0 ], "bp_grad_norms_per_sample_med": [ 4.4753964090205045e-08, 9.320837435211615e-10, 9.107828935484008e-10, 9.128516276213361e-10, 9.105118325969386e-10 ], "bp_grad_norms_F": [ 8.577152584621217e-06, 9.559200009334745e-08, 5.512932332862874e-08, 5.411101611230151e-08, 5.343352782460897e-08 ], "gamma_dfa": -0.00556181388310506, "acc_eval": 0.1142578125, "loss_eval": 5.2026848793029785, "epoch": 24 }, { "hidden_norms": [ 36056.9921875, 39258876.0, 12277943.0, 15686179.0, 10635754.0 ], "bp_grad_norms_per_sample_med": [ 4.2437520164639864e-08, 8.431049747237296e-10, 8.279052998716452e-10, 8.256172967513464e-10, 8.249605998322806e-10 ], "bp_grad_norms_F": [ 8.401701961702202e-06, 9.383651189409647e-08, 5.072890729707069e-08, 4.9743736241225633e-08, 4.90946696629635e-08 ], "gamma_dfa": -0.004373190506157698, "acc_eval": 0.115234375, "loss_eval": 5.283636569976807, "epoch": 25 }, { "hidden_norms": [ 37332.3203125, 43838448.0, 13573116.0, 17373072.0, 11853122.0 ], "bp_grad_norms_per_sample_med": [ 3.96461210527832e-08, 7.721222550216567e-10, 7.523985323665272e-10, 7.522342748700339e-10, 7.507660604311184e-10 ], "bp_grad_norms_F": [ 8.241736395575572e-06, 8.553880093131738e-08, 4.659301566789509e-08, 4.568136446891913e-08, 4.507716511170656e-08 ], "gamma_dfa": -0.003043898326723138, "acc_eval": 0.1123046875, "loss_eval": 5.340336322784424, "epoch": 26 }, { "hidden_norms": [ 38604.234375, 48637388.0, 14943648.0, 19237954.0, 13168041.0 ], "bp_grad_norms_per_sample_med": [ 3.845103080379886e-08, 7.063521434425013e-10, 6.949120723298563e-10, 6.971247468179342e-10, 6.954581355245182e-10 ], "bp_grad_norms_F": [ 8.12488178780768e-06, 8.518332350604396e-08, 4.348786220020884e-08, 4.2559751278758995e-08, 4.1998429622935873e-08 ], "gamma_dfa": -0.0021704566534026526, "acc_eval": 0.1103515625, "loss_eval": 5.403829574584961, "epoch": 27 }, { "hidden_norms": [ 39856.5078125, 53569880.0, 16230254.0, 21087022.0, 14556169.0 ], "bp_grad_norms_per_sample_med": [ 3.739526022172868e-08, 6.497330451438188e-10, 6.402843810704439e-10, 6.384167083872683e-10, 6.366632776533265e-10 ], "bp_grad_norms_F": [ 8.042790796025656e-06, 7.930053413929272e-08, 4.0553047142566356e-08, 3.9663138551304655e-08, 3.909939749746627e-08 ], "gamma_dfa": 0.00027063591551268473, "acc_eval": 0.11328125, "loss_eval": 5.486921310424805, "epoch": 28 }, { "hidden_norms": [ 41114.66015625, 59315272.0, 17822804.0, 22986032.0, 16084622.0 ], "bp_grad_norms_per_sample_med": [ 3.655359392951141e-08, 6.013742281929524e-10, 5.905386180060646e-10, 5.911486300469448e-10, 5.910953393417628e-10 ], "bp_grad_norms_F": [ 7.960659786476754e-06, 8.031720000190035e-08, 3.805743276075191e-08, 3.7164745947393385e-08, 3.6596219388229656e-08 ], "gamma_dfa": 0.0034554791564005427, "acc_eval": 0.1142578125, "loss_eval": 5.604689598083496, "epoch": 29 }, { "hidden_norms": [ 42325.58984375, 64740044.0, 19249378.0, 25010146.0, 17657480.0 ], "bp_grad_norms_per_sample_med": [ 3.541291704323157e-08, 5.539400049769938e-10, 5.454215967759524e-10, 5.459841467825299e-10, 5.440591865912836e-10 ], "bp_grad_norms_F": [ 7.836213626433164e-06, 7.777267541086985e-08, 3.578357521405451e-08, 3.4922344127608085e-08, 3.437838813624694e-08 ], "gamma_dfa": 0.003963275059504667, "acc_eval": 0.115234375, "loss_eval": 5.663756370544434, "epoch": 30 }, { "hidden_norms": [ 43534.375, 70424152.0, 20966526.0, 27032410.0, 19126838.0 ], "bp_grad_norms_per_sample_med": [ 3.4974387830288833e-08, 5.135932235056373e-10, 5.051635221242634e-10, 5.056056129326691e-10, 5.03480979130444e-10 ], "bp_grad_norms_F": [ 7.886262210377026e-06, 8.217509162022907e-08, 3.401517645329477e-08, 3.309881080326704e-08, 3.255568614690674e-08 ], "gamma_dfa": 0.006612789164137212, "acc_eval": 0.1162109375, "loss_eval": 5.706640243530273, "epoch": 31 }, { "hidden_norms": [ 44720.9453125, 76344112.0, 22771320.0, 29203482.0, 20864830.0 ], "bp_grad_norms_per_sample_med": [ 3.4229628909088206e-08, 4.800634334500842e-10, 4.701866673784139e-10, 4.693791466614528e-10, 4.668225250803459e-10 ], "bp_grad_norms_F": [ 7.781368367432151e-06, 7.414258362814508e-08, 3.207212984079888e-08, 3.1193785332561674e-08, 3.0666903683140845e-08 ], "gamma_dfa": 0.008515000299667008, "acc_eval": 0.1162109375, "loss_eval": 5.720961093902588, "epoch": 32 }, { "hidden_norms": [ 45875.8046875, 82383720.0, 24638848.0, 31558806.0, 22520176.0 ], "bp_grad_norms_per_sample_med": [ 3.390868030805905e-08, 4.458567681719927e-10, 4.385545260277013e-10, 4.3886239087242984e-10, 4.3707018559935307e-10 ], "bp_grad_norms_F": [ 7.905513484729454e-06, 7.275451707755565e-08, 3.047262708832932e-08, 2.960254974482268e-08, 2.9090815090171418e-08 ], "gamma_dfa": 0.01025733859205502, "acc_eval": 0.1142578125, "loss_eval": 5.7539262771606445, "epoch": 33 }, { "hidden_norms": [ 47003.1328125, 89200944.0, 26495704.0, 33934388.0, 24310298.0 ], "bp_grad_norms_per_sample_med": [ 3.3027241386207606e-08, 4.1779490977944533e-10, 4.123023311652929e-10, 4.1292305685836084e-10, 4.1066355871421933e-10 ], "bp_grad_norms_F": [ 8.257205990958028e-06, 7.720848316239426e-08, 2.8986395506080953e-08, 2.8067159263400754e-08, 2.7556911419424068e-08 ], "gamma_dfa": 0.012584943462570664, "acc_eval": 0.11328125, "loss_eval": 5.796531677246094, "epoch": 34 }, { "hidden_norms": [ 48090.08984375, 95793720.0, 28464040.0, 36264388.0, 26293806.0 ], "bp_grad_norms_per_sample_med": [ 3.217191490989535e-08, 3.894292666117849e-10, 3.8594555329396485e-10, 3.8626962739485293e-10, 3.8498901289152343e-10 ], "bp_grad_norms_F": [ 8.125247404677793e-06, 7.330743301281473e-08, 2.7641750222073824e-08, 2.6769551908500944e-08, 2.6268399011541987e-08 ], "gamma_dfa": 0.015375214185041841, "acc_eval": 0.1181640625, "loss_eval": 5.804059982299805, "epoch": 35 }, { "hidden_norms": [ 49138.04296875, 102879768.0, 30344818.0, 38660032.0, 28092164.0 ], "bp_grad_norms_per_sample_med": [ 3.081565580487222e-08, 3.644603230323895e-10, 3.576897944501667e-10, 3.568374207230107e-10, 3.5416741761551407e-10 ], "bp_grad_norms_F": [ 8.033912308746949e-06, 7.398465839969504e-08, 2.61401691403762e-08, 2.530256892896432e-08, 2.481599992165684e-08 ], "gamma_dfa": 0.01655786213814281, "acc_eval": 0.1162109375, "loss_eval": 5.779043197631836, "epoch": 36 }, { "hidden_norms": [ 50205.23828125, 109785504.0, 32500932.0, 40993492.0, 30124936.0 ], "bp_grad_norms_per_sample_med": [ 3.087046351879508e-08, 3.450236207847013e-10, 3.3626229578587186e-10, 3.3652211572920976e-10, 3.357169819917516e-10 ], "bp_grad_norms_F": [ 8.317977517435793e-06, 6.930265783466893e-08, 2.4881831706125013e-08, 2.413608513052168e-08, 2.36848762824593e-08 ], "gamma_dfa": 0.01839016478334088, "acc_eval": 0.1162109375, "loss_eval": 5.815016746520996, "epoch": 37 }, { "hidden_norms": [ 51234.28125, 116882832.0, 34622344.0, 43672052.0, 32010828.0 ], "bp_grad_norms_per_sample_med": [ 3.011625793192252e-08, 3.242739410325157e-10, 3.1924299315200244e-10, 3.1952127055312474e-10, 3.181244712102682e-10 ], "bp_grad_norms_F": [ 8.41012479213532e-06, 7.246134714478103e-08, 2.3759820777513596e-08, 2.3049024022725462e-08, 2.2618014128283903e-08 ], "gamma_dfa": 0.019554060958398622, "acc_eval": 0.1142578125, "loss_eval": 5.829615116119385, "epoch": 38 }, { "hidden_norms": [ 52247.84375, 124228312.0, 36552372.0, 46094684.0, 33968656.0 ], "bp_grad_norms_per_sample_med": [ 3.024800321327348e-08, 3.052329222708039e-10, 3.0248267779420246e-10, 3.022799510699059e-10, 3.012357030485191e-10 ], "bp_grad_norms_F": [ 7.947497579152696e-06, 6.409469932577849e-08, 2.2781945219207955e-08, 2.209960925370069e-08, 2.1678969730487552e-08 ], "gamma_dfa": 0.022201491628948133, "acc_eval": 0.1142578125, "loss_eval": 5.778614044189453, "epoch": 39 }, { "hidden_norms": [ 53254.6640625, 131932448.0, 38786720.0, 48743312.0, 36026440.0 ], "bp_grad_norms_per_sample_med": [ 2.9781913823967443e-08, 2.8849589384094543e-10, 2.856256064998064e-10, 2.8570401600092055e-10, 2.844837143634038e-10 ], "bp_grad_norms_F": [ 7.602731329825474e-06, 6.632863147615353e-08, 2.174161650714268e-08, 2.107603691570148e-08, 2.067151072537854e-08 ], "gamma_dfa": 0.02325869471678743, "acc_eval": 0.119140625, "loss_eval": 5.798803329467773, "epoch": 40 }, { "hidden_norms": [ 54228.43359375, 139390368.0, 41071128.0, 51348924.0, 38183484.0 ], "bp_grad_norms_per_sample_med": [ 2.9682835744893055e-08, 2.752674477246586e-10, 2.7137878055860654e-10, 2.716726288376492e-10, 2.71538042051489e-10 ], "bp_grad_norms_F": [ 7.424123396049254e-06, 6.37739248077196e-08, 2.099002749389456e-08, 2.0336601735948534e-08, 1.9947020035715468e-08 ], "gamma_dfa": 0.024572641068516532, "acc_eval": 0.119140625, "loss_eval": 5.8440093994140625, "epoch": 41 }, { "hidden_norms": [ 55136.65625, 147294320.0, 43301224.0, 54132172.0, 40002916.0 ], "bp_grad_norms_per_sample_med": [ 3.0416718033166035e-08, 2.623444794735974e-10, 2.586598435438958e-10, 2.587878522586351e-10, 2.5755084176459775e-10 ], "bp_grad_norms_F": [ 7.195616944954963e-06, 5.543640568816954e-08, 2.0126753597082825e-08, 1.9496084746606357e-08, 1.9124053451946565e-08 ], "gamma_dfa": 0.026229552553559188, "acc_eval": 0.1201171875, "loss_eval": 5.841940879821777, "epoch": 42 }, { "hidden_norms": [ 56057.48828125, 155058496.0, 45581136.0, 56721952.0, 42172944.0 ], "bp_grad_norms_per_sample_med": [ 2.9346542973485157e-08, 2.4918875296542353e-10, 2.4687848987348104e-10, 2.470146309718757e-10, 2.4589502656269246e-10 ], "bp_grad_norms_F": [ 7.236937562993262e-06, 4.957384902581907e-08, 1.9364815528888357e-08, 1.8756255215635065e-08, 1.840485097659439e-08 ], "gamma_dfa": 0.027025546743971063, "acc_eval": 0.12109375, "loss_eval": 5.79724645614624, "epoch": 43 }, { "hidden_norms": [ 56951.0546875, 163286592.0, 47715684.0, 59381272.0, 44453996.0 ], "bp_grad_norms_per_sample_med": [ 2.9479124918907473e-08, 2.39016806347081e-10, 2.3503707313743405e-10, 2.33648544956111e-10, 2.335798499064623e-10 ], "bp_grad_norms_F": [ 7.3719347710721195e-06, 5.521000900898798e-08, 1.8681236113593513e-08, 1.8048309513574168e-08, 1.7682033615074033e-08 ], "gamma_dfa": 0.02818910058704205, "acc_eval": 0.1181640625, "loss_eval": 5.779097080230713, "epoch": 44 }, { "hidden_norms": [ 57889.91015625, 171572336.0, 49962976.0, 62099764.0, 46403104.0 ], "bp_grad_norms_per_sample_med": [ 3.00151405951965e-08, 2.294373580014053e-10, 2.2455036441382248e-10, 2.2508651886798958e-10, 2.2402991961545382e-10 ], "bp_grad_norms_F": [ 7.484923116862774e-06, 5.0286196540128e-08, 1.8117480848900414e-08, 1.7483015923858147e-08, 1.7114837547183015e-08 ], "gamma_dfa": 0.029963871067593573, "acc_eval": 0.1220703125, "loss_eval": 5.8359575271606445, "epoch": 45 }, { "hidden_norms": [ 58731.421875, 180056896.0, 52137220.0, 64717056.0, 48647116.0 ], "bp_grad_norms_per_sample_med": [ 2.929727926925807e-08, 2.1976008512947232e-10, 2.159663420320257e-10, 2.163312862180078e-10, 2.1587925891353166e-10 ], "bp_grad_norms_F": [ 7.681007446080912e-06, 5.031828109736125e-08, 1.7532725493651924e-08, 1.6936246183263393e-08, 1.659478598980968e-08 ], "gamma_dfa": 0.03088831547938753, "acc_eval": 0.1220703125, "loss_eval": 5.786240100860596, "epoch": 46 }, { "hidden_norms": [ 59567.96875, 187949040.0, 54233264.0, 67384816.0, 50735356.0 ], "bp_grad_norms_per_sample_med": [ 2.870891080419824e-08, 2.1069677946794485e-10, 2.057157916235397e-10, 2.0573617809382938e-10, 2.051469827346608e-10 ], "bp_grad_norms_F": [ 7.31024283595616e-06, 4.820083177037304e-08, 1.691453910268592e-08, 1.6327849294839325e-08, 1.5993451896179067e-08 ], "gamma_dfa": 0.03192764806590276, "acc_eval": 0.119140625, "loss_eval": 5.707631587982178, "epoch": 47 }, { "hidden_norms": [ 60402.91796875, 196285488.0, 56440304.0, 70085304.0, 52941472.0 ], "bp_grad_norms_per_sample_med": [ 2.8424729237030988e-08, 2.033633955678127e-10, 1.9889993818633656e-10, 1.9922237470826332e-10, 1.9868894030050654e-10 ], "bp_grad_norms_F": [ 7.644263860129286e-06, 4.852574519986774e-08, 1.6383141954179337e-08, 1.581754283108694e-08, 1.548989914113008e-08 ], "gamma_dfa": 0.033413520381145645, "acc_eval": 0.1220703125, "loss_eval": 5.704823017120361, "epoch": 48 }, { "hidden_norms": [ 61196.53515625, 204414672.0, 58842936.0, 72912304.0, 55068312.0 ], "bp_grad_norms_per_sample_med": [ 2.859230185947581e-08, 1.9821513874695995e-10, 1.9266777062654228e-10, 1.9288849684162557e-10, 1.9265547490654455e-10 ], "bp_grad_norms_F": [ 7.879517397668678e-06, 4.184777324667266e-08, 1.6105406785982268e-08, 1.550557016116727e-08, 1.5175970702330233e-08 ], "gamma_dfa": 0.034091180186806014, "acc_eval": 0.1201171875, "loss_eval": 5.725862979888916, "epoch": 49 }, { "hidden_norms": [ 61914.14453125, 212112608.0, 61176224.0, 75542504.0, 57474876.0 ], "bp_grad_norms_per_sample_med": [ 2.8669807861092522e-08, 1.8937640344773854e-10, 1.8534798695846177e-10, 1.855716413867725e-10, 1.852704378801917e-10 ], "bp_grad_norms_F": [ 8.087788955890574e-06, 4.2019124180114886e-08, 1.5675068354426003e-08, 1.5084628657291432e-08, 1.4754542476680399e-08 ], "gamma_dfa": 0.034466555964172585, "acc_eval": 0.1201171875, "loss_eval": 5.820840358734131, "epoch": 50 }, { "hidden_norms": [ 62603.82421875, 219453520.0, 63197896.0, 78229512.0, 59644488.0 ], "bp_grad_norms_per_sample_med": [ 2.9210220020559063e-08, 1.8399998191753753e-10, 1.7923225403837506e-10, 1.792543474765651e-10, 1.785920855645884e-10 ], "bp_grad_norms_F": [ 8.000329216883983e-06, 4.107307916001446e-08, 1.5165383615567407e-08, 1.4602372644390016e-08, 1.4272954373950597e-08 ], "gamma_dfa": 0.035090556057184585, "acc_eval": 0.12109375, "loss_eval": 5.784890174865723, "epoch": 51 }, { "hidden_norms": [ 63365.48828125, 227326704.0, 65434160.0, 80771200.0, 61832948.0 ], "bp_grad_norms_per_sample_med": [ 2.9006677948473225e-08, 1.7990454959093682e-10, 1.7418685938075384e-10, 1.7404670760168273e-10, 1.7386522777051994e-10 ], "bp_grad_norms_F": [ 8.04007868282497e-06, 3.7175201583750095e-08, 1.4899267597456856e-08, 1.4325389763314433e-08, 1.4007627946455159e-08 ], "gamma_dfa": 0.035336821872988367, "acc_eval": 0.12109375, "loss_eval": 5.837845802307129, "epoch": 52 }, { "hidden_norms": [ 64122.77734375, 235505280.0, 67571832.0, 83154408.0, 63815212.0 ], "bp_grad_norms_per_sample_med": [ 2.8882961800036355e-08, 1.752420292211454e-10, 1.6966168747689636e-10, 1.6997936391760504e-10, 1.6931231416883463e-10 ], "bp_grad_norms_F": [ 7.732651283731684e-06, 3.6642365586203596e-08, 1.4491905453439813e-08, 1.39411024946412e-08, 1.3628048911584756e-08 ], "gamma_dfa": 0.035559086416469654, "acc_eval": 0.12109375, "loss_eval": 5.813376426696777, "epoch": 53 }, { "hidden_norms": [ 64808.83203125, 243721104.0, 69766352.0, 85766896.0, 65980356.0 ], "bp_grad_norms_per_sample_med": [ 2.8568885923618836e-08, 1.6757319143412275e-10, 1.6364704036320177e-10, 1.6374304689925623e-10, 1.6309503747535814e-10 ], "bp_grad_norms_F": [ 7.502960215788335e-06, 3.409801507814336e-08, 1.4090593580817767e-08, 1.3566921808205734e-08, 1.3258036446472943e-08 ], "gamma_dfa": 0.03633021883433685, "acc_eval": 0.12109375, "loss_eval": 5.748073101043701, "epoch": 54 }, { "hidden_norms": [ 65405.05078125, 251434864.0, 71765544.0, 88222840.0, 68040816.0 ], "bp_grad_norms_per_sample_med": [ 2.8620791070466112e-08, 1.6591342189009595e-10, 1.611620559227589e-10, 1.6055762275257734e-10, 1.6039196359951546e-10 ], "bp_grad_norms_F": [ 7.535967142757727e-06, 3.341937571121889e-08, 1.3891366279494832e-08, 1.3369996665346662e-08, 1.3064806125839823e-08 ], "gamma_dfa": 0.037189101487456355, "acc_eval": 0.1220703125, "loss_eval": 5.769567966461182, "epoch": 55 }, { "hidden_norms": [ 65975.4296875, 259364544.0, 73868528.0, 90804584.0, 70148048.0 ], "bp_grad_norms_per_sample_med": [ 2.8815582808761064e-08, 1.6121720625150715e-10, 1.5669744668489471e-10, 1.568625784820199e-10, 1.56342438994983e-10 ], "bp_grad_norms_F": [ 7.530327820859384e-06, 2.989135694519973e-08, 1.3588412173248798e-08, 1.308291253110383e-08, 1.2791012693469384e-08 ], "gamma_dfa": 0.037349180958699435, "acc_eval": 0.1201171875, "loss_eval": 5.802239418029785, "epoch": 56 }, { "hidden_norms": [ 66535.546875, 267235600.0, 75921592.0, 93206176.0, 72113992.0 ], "bp_grad_norms_per_sample_med": [ 2.8679746577608967e-08, 1.5684299692342307e-10, 1.530628263024525e-10, 1.5322397517447683e-10, 1.5271124642612932e-10 ], "bp_grad_norms_F": [ 7.578343684144784e-06, 2.8776035776445497e-08, 1.3372356555407805e-08, 1.2855631226216246e-08, 1.2555028128247159e-08 ], "gamma_dfa": 0.03780493976228172, "acc_eval": 0.1201171875, "loss_eval": 5.850732803344727, "epoch": 57 }, { "hidden_norms": [ 67107.3125, 274158304.0, 77594136.0, 95315520.0, 73880288.0 ], "bp_grad_norms_per_sample_med": [ 2.9038343285492374e-08, 1.5442255807407435e-10, 1.5004263109741345e-10, 1.5028490951696227e-10, 1.4968959405337046e-10 ], "bp_grad_norms_F": [ 7.555737283837516e-06, 3.160908335075874e-08, 1.3153115929753767e-08, 1.2644002289619038e-08, 1.2345022781801163e-08 ], "gamma_dfa": 0.03859367490440491, "acc_eval": 0.12109375, "loss_eval": 5.83157205581665, "epoch": 58 }, { "hidden_norms": [ 67633.5703125, 281346784.0, 79395712.0, 97521760.0, 75716480.0 ], "bp_grad_norms_per_sample_med": [ 2.8924493022941533e-08, 1.5015137744267548e-10, 1.4681762749990668e-10, 1.469668414744163e-10, 1.4640397227871915e-10 ], "bp_grad_norms_F": [ 7.076869223965332e-06, 3.03394500633658e-08, 1.2924256331814377e-08, 1.2421836004250508e-08, 1.2128483106721433e-08 ], "gamma_dfa": 0.03882967439312779, "acc_eval": 0.1201171875, "loss_eval": 5.850924491882324, "epoch": 59 }, { "hidden_norms": [ 68127.2578125, 288068512.0, 81019736.0, 99671120.0, 77532304.0 ], "bp_grad_norms_per_sample_med": [ 2.900766915558961e-08, 1.4631622302641034e-10, 1.434221075236053e-10, 1.4353812582967862e-10, 1.428595158836643e-10 ], "bp_grad_norms_F": [ 7.026245839369949e-06, 3.037761331370348e-08, 1.2673269544904997e-08, 1.216829925709817e-08, 1.1867063776094255e-08 ], "gamma_dfa": 0.039077571367670316, "acc_eval": 0.119140625, "loss_eval": 5.843035697937012, "epoch": 60 }, { "hidden_norms": [ 68607.2890625, 295220896.0, 83038584.0, 101714504.0, 79438864.0 ], "bp_grad_norms_per_sample_med": [ 2.889952988027744e-08, 1.4436063455747217e-10, 1.410637162635453e-10, 1.4117192137508283e-10, 1.405108668306454e-10 ], "bp_grad_norms_F": [ 6.8223289417801425e-06, 2.9571756599011678e-08, 1.237319757763089e-08, 1.1902468344260342e-08, 1.1619527562345411e-08 ], "gamma_dfa": 0.0394883609842509, "acc_eval": 0.119140625, "loss_eval": 5.8329925537109375, "epoch": 61 }, { "hidden_norms": [ 69038.0703125, 302174528.0, 84795640.0, 103621440.0, 81134560.0 ], "bp_grad_norms_per_sample_med": [ 2.8758867287592693e-08, 1.4096314393530207e-10, 1.380290187702471e-10, 1.3813312993438132e-10, 1.3748156779680443e-10 ], "bp_grad_norms_F": [ 6.821945589763345e-06, 2.9822015079616904e-08, 1.2211526900784975e-08, 1.1739270888710962e-08, 1.1454956982959175e-08 ], "gamma_dfa": 0.03950453496872797, "acc_eval": 0.1201171875, "loss_eval": 5.862898826599121, "epoch": 62 }, { "hidden_norms": [ 69486.8671875, 308758272.0, 86559352.0, 105690288.0, 82830320.0 ], "bp_grad_norms_per_sample_med": [ 2.880081950706881e-08, 1.381648684350978e-10, 1.3562810596834396e-10, 1.3572509782733277e-10, 1.3508719143295878e-10 ], "bp_grad_norms_F": [ 6.841747108410345e-06, 3.094388745239485e-08, 1.2084786504829026e-08, 1.1623659368353856e-08, 1.1344519990075241e-08 ], "gamma_dfa": 0.03953796969653922, "acc_eval": 0.1181640625, "loss_eval": 5.886589527130127, "epoch": 63 }, { "hidden_norms": [ 69910.8515625, 314931680.0, 87987448.0, 107443096.0, 84227784.0 ], "bp_grad_norms_per_sample_med": [ 2.8549854036441502e-08, 1.3562842515746354e-10, 1.3309958690754797e-10, 1.3318925129457426e-10, 1.32547681164219e-10 ], "bp_grad_norms_F": [ 6.486627626145491e-06, 3.26463052147119e-08, 1.1863860116534397e-08, 1.1407089495207856e-08, 1.112555558790973e-08 ], "gamma_dfa": 0.040154138219804736, "acc_eval": 0.12109375, "loss_eval": 5.841930389404297, "epoch": 64 }, { "hidden_norms": [ 70309.921875, 320869664.0, 89479256.0, 109445496.0, 85720672.0 ], "bp_grad_norms_per_sample_med": [ 2.8119913508817262e-08, 1.333930049751686e-10, 1.311449004948173e-10, 1.3122899988893266e-10, 1.306234981290899e-10 ], "bp_grad_norms_F": [ 6.1845657910453156e-06, 3.1657755528158305e-08, 1.1685694190077811e-08, 1.1245842479468138e-08, 1.0970555130995763e-08 ], "gamma_dfa": 0.04057217295485316, "acc_eval": 0.1181640625, "loss_eval": 5.787144184112549, "epoch": 65 }, { "hidden_norms": [ 70717.453125, 326733312.0, 90990512.0, 111385000.0, 87145456.0 ], "bp_grad_norms_per_sample_med": [ 2.868856441295975e-08, 1.3173599711091555e-10, 1.290058199154842e-10, 1.2908775437470155e-10, 1.284874151519233e-10 ], "bp_grad_norms_F": [ 6.056342499505263e-06, 3.0463933597957293e-08, 1.1565422397552538e-08, 1.1122933685214775e-08, 1.0847451825668486e-08 ], "gamma_dfa": 0.040889364270697115, "acc_eval": 0.119140625, "loss_eval": 5.847908020019531, "epoch": 66 }, { "hidden_norms": [ 71084.71875, 332338880.0, 92455056.0, 113026960.0, 88541256.0 ], "bp_grad_norms_per_sample_med": [ 2.7999890406249506e-08, 1.2975863439290691e-10, 1.2677238425684578e-10, 1.268507521245965e-10, 1.2626712175833887e-10 ], "bp_grad_norms_F": [ 5.962062004982727e-06, 2.9298774961716845e-08, 1.14416129903816e-08, 1.1010567568803253e-08, 1.0736493472052189e-08 ], "gamma_dfa": 0.040890415915782796, "acc_eval": 0.1201171875, "loss_eval": 5.816187381744385, "epoch": 67 }, { "hidden_norms": [ 71436.84375, 337832864.0, 93879264.0, 114665400.0, 89926616.0 ], "bp_grad_norms_per_sample_med": [ 2.7683153547286565e-08, 1.2797991832957933e-10, 1.2511817970572991e-10, 1.2518648617731998e-10, 1.246210634686662e-10 ], "bp_grad_norms_F": [ 5.7771489991864655e-06, 2.8285153774731953e-08, 1.1245044895247247e-08, 1.0827025498372223e-08, 1.0562406060898866e-08 ], "gamma_dfa": 0.04072478835223592, "acc_eval": 0.1201171875, "loss_eval": 5.783463478088379, "epoch": 68 }, { "hidden_norms": [ 71769.5546875, 342918304.0, 95263584.0, 116254568.0, 91446520.0 ], "bp_grad_norms_per_sample_med": [ 2.775840357571724e-08, 1.2646382552272684e-10, 1.2334086529897093e-10, 1.2337944554907665e-10, 1.2288142725580542e-10 ], "bp_grad_norms_F": [ 5.667419827659614e-06, 2.6888709925287912e-08, 1.1133559851828068e-08, 1.0716635578944533e-08, 1.0457153365450722e-08 ], "gamma_dfa": 0.040744281255683745, "acc_eval": 0.1201171875, "loss_eval": 5.804702281951904, "epoch": 69 }, { "hidden_norms": [ 72080.078125, 347772576.0, 96482160.0, 117685240.0, 92638296.0 ], "bp_grad_norms_per_sample_med": [ 2.8613341029881667e-08, 1.2489977108121053e-10, 1.2201274712797527e-10, 1.220573642157774e-10, 1.2148008987633574e-10 ], "bp_grad_norms_F": [ 5.642392352456227e-06, 2.7134319680044428e-08, 1.1023663759601732e-08, 1.0605543110386861e-08, 1.034114660569685e-08 ], "gamma_dfa": 0.04128229359048419, "acc_eval": 0.1201171875, "loss_eval": 5.805394172668457, "epoch": 70 }, { "hidden_norms": [ 72369.9921875, 352377056.0, 97691240.0, 119151816.0, 93761800.0 ], "bp_grad_norms_per_sample_med": [ 2.8514245187238885e-08, 1.2353804090814435e-10, 1.2041069530344117e-10, 1.2046977304613904e-10, 1.1990240744719216e-10 ], "bp_grad_norms_F": [ 5.6565527302154806e-06, 2.8678897479039733e-08, 1.0947891482260275e-08, 1.0533200978102286e-08, 1.0270048811378274e-08 ], "gamma_dfa": 0.04154024633317022, "acc_eval": 0.119140625, "loss_eval": 5.7999067306518555, "epoch": 71 }, { "hidden_norms": [ 72651.671875, 356846048.0, 98782024.0, 120475080.0, 94848032.0 ], "bp_grad_norms_per_sample_med": [ 2.8226885717685946e-08, 1.221410056428951e-10, 1.1935313848354667e-10, 1.193777160457543e-10, 1.1868718508001308e-10 ], "bp_grad_norms_F": [ 5.597235940513201e-06, 2.7164126947809564e-08, 1.078571720825039e-08, 1.038548358422986e-08, 1.0128220928606879e-08 ], "gamma_dfa": 0.041652156607597135, "acc_eval": 0.119140625, "loss_eval": 5.782708168029785, "epoch": 72 }, { "hidden_norms": [ 72915.9765625, 361214752.0, 99899064.0, 121794264.0, 95956256.0 ], "bp_grad_norms_per_sample_med": [ 2.8156543763202535e-08, 1.208296795951469e-10, 1.1789087761560069e-10, 1.1794409893184366e-10, 1.1745009131924888e-10 ], "bp_grad_norms_F": [ 5.609212166746147e-06, 2.767807316672588e-08, 1.074356958952194e-08, 1.0335670985739398e-08, 1.007653693818611e-08 ], "gamma_dfa": 0.041388919182281825, "acc_eval": 0.1171875, "loss_eval": 5.816926956176758, "epoch": 73 }, { "hidden_norms": [ 73160.8984375, 365176576.0, 100896352.0, 123055840.0, 96952304.0 ], "bp_grad_norms_per_sample_med": [ 2.8052935974187676e-08, 1.2002213112261018e-10, 1.1708690961231838e-10, 1.1711043246265262e-10, 1.1664859356219637e-10 ], "bp_grad_norms_F": [ 5.528850579139544e-06, 2.6534554109503006e-08, 1.062906651583262e-08, 1.0228863978056779e-08, 9.976772297193293e-09 ], "gamma_dfa": 0.04158145491965115, "acc_eval": 0.1201171875, "loss_eval": 5.83203125, "epoch": 74 }, { "hidden_norms": [ 73388.9921875, 369039872.0, 101870976.0, 124229664.0, 97872176.0 ], "bp_grad_norms_per_sample_med": [ 2.811547972214612e-08, 1.1867723470615488e-10, 1.160038107239636e-10, 1.1605346544873996e-10, 1.1549688982981365e-10 ], "bp_grad_norms_F": [ 5.516625151358312e-06, 2.6522718243882082e-08, 1.0559543461852172e-08, 1.0160210450749219e-08, 9.905477327265544e-09 ], "gamma_dfa": 0.04162494709453313, "acc_eval": 0.1181640625, "loss_eval": 5.825821876525879, "epoch": 75 }, { "hidden_norms": [ 73607.875, 372436096.0, 102747608.0, 125356400.0, 98735744.0 ], "bp_grad_norms_per_sample_med": [ 2.8296041065800637e-08, 1.1797214594100325e-10, 1.1553259737784316e-10, 1.1555564144449804e-10, 1.148080935875484e-10 ], "bp_grad_norms_F": [ 5.4743991313443985e-06, 2.5615005228019072e-08, 1.0501097769122225e-08, 1.0109610926178902e-08, 9.859975946824306e-09 ], "gamma_dfa": 0.04183118613582337, "acc_eval": 0.1171875, "loss_eval": 5.838399887084961, "epoch": 76 }, { "hidden_norms": [ 73806.21875, 375504928.0, 103559744.0, 126298048.0, 99592752.0 ], "bp_grad_norms_per_sample_med": [ 2.8072012270285995e-08, 1.16896228807839e-10, 1.1455134063531602e-10, 1.1459744958530749e-10, 1.1405828365118609e-10 ], "bp_grad_norms_F": [ 5.35501703780028e-06, 2.4375134799470288e-08, 1.0415713624922773e-08, 1.0033582853452572e-08, 9.78571357279634e-09 ], "gamma_dfa": 0.04175542373559438, "acc_eval": 0.1181640625, "loss_eval": 5.806183815002441, "epoch": 77 }, { "hidden_norms": [ 73982.1328125, 378528768.0, 104296416.0, 127198352.0, 100364600.0 ], "bp_grad_norms_per_sample_med": [ 2.802979714999765e-08, 1.1618311174244056e-10, 1.1359845702996196e-10, 1.1364404556291063e-10, 1.1310929276531212e-10 ], "bp_grad_norms_F": [ 5.359067017707275e-06, 2.4563517442288685e-08, 1.0355730495348325e-08, 9.969440384338668e-09, 9.722052496385913e-09 ], "gamma_dfa": 0.041852476922940696, "acc_eval": 0.1171875, "loss_eval": 5.812763690948486, "epoch": 78 }, { "hidden_norms": [ 74143.3515625, 381338400.0, 104995776.0, 128103664.0, 101143248.0 ], "bp_grad_norms_per_sample_med": [ 2.803018084307496e-08, 1.1504715929921971e-10, 1.1309976566398205e-10, 1.1314182923882754e-10, 1.1259981835820554e-10 ], "bp_grad_norms_F": [ 5.305423201207304e-06, 2.479905347740896e-08, 1.0304642472647174e-08, 9.922130672634921e-09, 9.675199308389892e-09 ], "gamma_dfa": 0.04194222000660375, "acc_eval": 0.1201171875, "loss_eval": 5.790335655212402, "epoch": 79 }, { "hidden_norms": [ 74296.140625, 383779872.0, 105624680.0, 128832568.0, 101739872.0 ], "bp_grad_norms_per_sample_med": [ 2.8086292402917934e-08, 1.1405020677868194e-10, 1.1259575216637785e-10, 1.126363308179279e-10, 1.121035694828798e-10 ], "bp_grad_norms_F": [ 5.285005499899853e-06, 2.497140805246545e-08, 1.0247953596831394e-08, 9.865908978667903e-09, 9.618767116137406e-09 ], "gamma_dfa": 0.042092169023817405, "acc_eval": 0.1201171875, "loss_eval": 5.78256893157959, "epoch": 80 }, { "hidden_norms": [ 74432.171875, 386197824.0, 106270032.0, 129540264.0, 102336408.0 ], "bp_grad_norms_per_sample_med": [ 2.8129701235002358e-08, 1.1369888364143321e-10, 1.1195557675369727e-10, 1.1199620397750465e-10, 1.1146324141453334e-10 ], "bp_grad_norms_F": [ 5.2314603635750245e-06, 2.418116018532146e-08, 1.0211192780218425e-08, 9.833079239740528e-09, 9.588974059226985e-09 ], "gamma_dfa": 0.0422149248624919, "acc_eval": 0.1201171875, "loss_eval": 5.794626235961914, "epoch": 81 }, { "hidden_norms": [ 74557.1328125, 388309664.0, 106804240.0, 130160096.0, 102871888.0 ], "bp_grad_norms_per_sample_med": [ 2.8006962082827158e-08, 1.1333335658836319e-10, 1.1151064099879093e-10, 1.1155010942731636e-10, 1.1102004732199688e-10 ], "bp_grad_norms_F": [ 5.231111572356895e-06, 2.3960881279094792e-08, 1.0185694065967255e-08, 9.808036161018663e-09, 9.561717639883227e-09 ], "gamma_dfa": 0.042091405965038575, "acc_eval": 0.1201171875, "loss_eval": 5.809223175048828, "epoch": 82 }, { "hidden_norms": [ 74670.6484375, 390046144.0, 107241528.0, 130709072.0, 103311792.0 ], "bp_grad_norms_per_sample_med": [ 2.80954566278524e-08, 1.1238011909942003e-10, 1.1107993691528151e-10, 1.1111822573184327e-10, 1.1058326476742764e-10 ], "bp_grad_norms_F": [ 5.195881840336369e-06, 2.3944403793052516e-08, 1.0142765738407888e-08, 9.765725117460988e-09, 9.519601995577887e-09 ], "gamma_dfa": 0.042151874920818955, "acc_eval": 0.1201171875, "loss_eval": 5.789272785186768, "epoch": 83 }, { "hidden_norms": [ 74771.78125, 391740192.0, 107714400.0, 131203208.0, 103730008.0 ], "bp_grad_norms_per_sample_med": [ 2.8205375812717648e-08, 1.1187289983283222e-10, 1.1065893340544974e-10, 1.106964936381516e-10, 1.1018032319842774e-10 ], "bp_grad_norms_F": [ 5.16868840350071e-06, 2.363896278723132e-08, 1.0106472991822102e-08, 9.731052408312735e-09, 9.487330032698083e-09 ], "gamma_dfa": 0.042111018407013034, "acc_eval": 0.1201171875, "loss_eval": 5.778679847717285, "epoch": 84 }, { "hidden_norms": [ 74860.828125, 393210464.0, 108154200.0, 131674336.0, 104148832.0 ], "bp_grad_norms_per_sample_med": [ 2.8289822040505896e-08, 1.1139363043088935e-10, 1.1020819673523974e-10, 1.1024554186223057e-10, 1.0972771996575759e-10 ], "bp_grad_norms_F": [ 5.15709007231635e-06, 2.3636799184600932e-08, 1.008097960664145e-08, 9.703811088002112e-09, 9.460902283819905e-09 ], "gamma_dfa": 0.04205825741155422, "acc_eval": 0.1201171875, "loss_eval": 5.787901878356934, "epoch": 85 }, { "hidden_norms": [ 74942.4453125, 394569024.0, 108544648.0, 132082208.0, 104483976.0 ], "bp_grad_norms_per_sample_med": [ 2.8258760664812144e-08, 1.1120066673031559e-10, 1.0991466070642275e-10, 1.0995130500512929e-10, 1.0943435047039429e-10 ], "bp_grad_norms_F": [ 5.150290235178545e-06, 2.3486826705720887e-08, 1.0058711197302728e-08, 9.684677060306512e-09, 9.442134185633222e-09 ], "gamma_dfa": 0.042173042878857814, "acc_eval": 0.119140625, "loss_eval": 5.789056301116943, "epoch": 86 }, { "hidden_norms": [ 75009.5703125, 395748704.0, 108812392.0, 132420432.0, 104755352.0 ], "bp_grad_norms_per_sample_med": [ 2.825358436098213e-08, 1.1081059680950744e-10, 1.0968410901757153e-10, 1.0972003861020596e-10, 1.0920536697156535e-10 ], "bp_grad_norms_F": [ 5.127661552251084e-06, 2.3339271848499266e-08, 1.002943950112467e-08, 9.659677502327213e-09, 9.417544966083824e-09 ], "gamma_dfa": 0.04217808429893921, "acc_eval": 0.1201171875, "loss_eval": 5.776318550109863, "epoch": 87 }, { "hidden_norms": [ 75066.4921875, 396774016.0, 109070288.0, 132708432.0, 105002960.0 ], "bp_grad_norms_per_sample_med": [ 2.824552858271545e-08, 1.1050411280466577e-10, 1.0939484040850544e-10, 1.0943065897883741e-10, 1.0891805513058017e-10 ], "bp_grad_norms_F": [ 5.1081005949527025e-06, 2.2895029871961015e-08, 1.0016128371148625e-08, 9.644456788748812e-09, 9.40405175953174e-09 ], "gamma_dfa": 0.04221886159211863, "acc_eval": 0.1201171875, "loss_eval": 5.782362937927246, "epoch": 88 }, { "hidden_norms": [ 75117.3984375, 397629600.0, 109292216.0, 132974672.0, 105237816.0 ], "bp_grad_norms_per_sample_med": [ 2.8004475183251998e-08, 1.1032175173397718e-10, 1.092313739459172e-10, 1.092670676161589e-10, 1.0875097350426799e-10 ], "bp_grad_norms_F": [ 5.101501756143989e-06, 2.2761090789913396e-08, 9.993788907536327e-09, 9.627679986579096e-09, 9.387123967030675e-09 ], "gamma_dfa": 0.04218835258870968, "acc_eval": 0.119140625, "loss_eval": 5.786335468292236, "epoch": 89 }, { "hidden_norms": [ 75159.3515625, 398356864.0, 109470496.0, 133184088.0, 105416456.0 ], "bp_grad_norms_per_sample_med": [ 2.806424248547046e-08, 1.1018109341565108e-10, 1.0910816694575942e-10, 1.0914344428236689e-10, 1.0862655219767703e-10 ], "bp_grad_norms_F": [ 5.100384441902861e-06, 2.2749302885927136e-08, 9.977647152936697e-09, 9.612988627338837e-09, 9.37321864569185e-09 ], "gamma_dfa": 0.04216382784579764, "acc_eval": 0.1201171875, "loss_eval": 5.787578582763672, "epoch": 90 }, { "hidden_norms": [ 75196.53125, 398958272.0, 109628448.0, 133366784.0, 105577720.0 ], "bp_grad_norms_per_sample_med": [ 2.8093891657476888e-08, 1.0998777583148822e-10, 1.0895360308404989e-10, 1.0898840857587189e-10, 1.084766096393075e-10 ], "bp_grad_norms_F": [ 5.099497684568632e-06, 2.276015820257271e-08, 9.975322790012342e-09, 9.609090412254773e-09, 9.369199638342707e-09 ], "gamma_dfa": 0.0421357955710846, "acc_eval": 0.1201171875, "loss_eval": 5.788777828216553, "epoch": 91 }, { "hidden_norms": [ 75225.75, 399436800.0, 109753008.0, 133503392.0, 105709880.0 ], "bp_grad_norms_per_sample_med": [ 2.7958691362073296e-08, 1.098953844591577e-10, 1.0885654877501594e-10, 1.0889117385559643e-10, 1.0837702263399862e-10 ], "bp_grad_norms_F": [ 5.099244390294189e-06, 2.2776946551061883e-08, 9.965032354841696e-09, 9.599201433729831e-09, 9.359114372387012e-09 ], "gamma_dfa": 0.04213721772248391, "acc_eval": 0.1201171875, "loss_eval": 5.787423133850098, "epoch": 92 }, { "hidden_norms": [ 75247.3671875, 399815808.0, 109848648.0, 133619136.0, 105800656.0 ], "bp_grad_norms_per_sample_med": [ 2.813173693994031e-08, 1.0978142006567992e-10, 1.0878217771015386e-10, 1.0881660156281114e-10, 1.0830317198617934e-10 ], "bp_grad_norms_F": [ 5.097780103824334e-06, 2.278613919770578e-08, 9.958157853873217e-09, 9.592699079519207e-09, 9.35304633742362e-09 ], "gamma_dfa": 0.042139860528550344, "acc_eval": 0.1201171875, "loss_eval": 5.78769588470459, "epoch": 93 }, { "hidden_norms": [ 75264.9921875, 400121888.0, 109927240.0, 133712496.0, 105877656.0 ], "bp_grad_norms_per_sample_med": [ 2.8044253141956688e-08, 1.0970312158686824e-10, 1.0871267774881233e-10, 1.0874703221253057e-10, 1.0823512919255762e-10 ], "bp_grad_norms_F": [ 5.0932972044392955e-06, 2.2714601755069452e-08, 9.954023383329513e-09, 9.589306237955952e-09, 9.350141105812781e-09 ], "gamma_dfa": 0.04215262952493504, "acc_eval": 0.1201171875, "loss_eval": 5.787428379058838, "epoch": 94 }, { "hidden_norms": [ 75277.7421875, 400340192.0, 109981456.0, 133783368.0, 105935424.0 ], "bp_grad_norms_per_sample_med": [ 2.8024039977481152e-08, 1.0965856001021734e-10, 1.0866757493843693e-10, 1.0870188776879175e-10, 1.0818954065960895e-10 ], "bp_grad_norms_F": [ 5.093556865176652e-06, 2.269677956689975e-08, 9.948016632677081e-09, 9.583557947223653e-09, 9.344440776715146e-09 ], "gamma_dfa": 0.04216338234982686, "acc_eval": 0.1201171875, "loss_eval": 5.787187099456787, "epoch": 95 }, { "hidden_norms": [ 75285.703125, 400477120.0, 110015360.0, 133823992.0, 105968568.0 ], "bp_grad_norms_per_sample_med": [ 2.7959323745108122e-08, 1.096286394997037e-10, 1.0863549643191917e-10, 1.0866971211775933e-10, 1.0815728868074359e-10 ], "bp_grad_norms_F": [ 5.094433618069161e-06, 2.2707608238192734e-08, 9.945019030510593e-09, 9.580433335543148e-09, 9.341129647566504e-09 ], "gamma_dfa": 0.04217854590388015, "acc_eval": 0.1201171875, "loss_eval": 5.785982608795166, "epoch": 96 }, { "hidden_norms": [ 75289.953125, 400549248.0, 110035048.0, 133846800.0, 105987544.0 ], "bp_grad_norms_per_sample_med": [ 2.7980583183762064e-08, 1.0960886365207756e-10, 1.0861883614765588e-10, 1.0865301020013263e-10, 1.0814063533537421e-10 ], "bp_grad_norms_F": [ 5.094651896797586e-06, 2.2699452983943047e-08, 9.943881273954958e-09, 9.579290249916994e-09, 9.340033635396594e-09 ], "gamma_dfa": 0.04217962139227893, "acc_eval": 0.1201171875, "loss_eval": 5.78618860244751, "epoch": 97 }, { "hidden_norms": [ 75293.8203125, 400615232.0, 110052384.0, 133866488.0, 106003008.0 ], "bp_grad_norms_per_sample_med": [ 2.800710419137431e-08, 1.0960048146824164e-10, 1.0860957966318807e-10, 1.0864373983787701e-10, 1.0813145517873934e-10 ], "bp_grad_norms_F": [ 5.094465905131074e-06, 2.2699449431229368e-08, 9.942947798435853e-09, 9.578524640119213e-09, 9.339320428125575e-09 ], "gamma_dfa": 0.04218013053832692, "acc_eval": 0.1201171875, "loss_eval": 5.786159515380859, "epoch": 98 }, { "hidden_norms": [ 75295.7109375, 400646048.0, 110060248.0, 133875320.0, 106009248.0 ], "bp_grad_norms_per_sample_med": [ 2.8009079500179723e-08, 1.0959386176345731e-10, 1.0860166238524371e-10, 1.0863580868214484e-10, 1.0812370443424868e-10 ], "bp_grad_norms_F": [ 5.094112111692084e-06, 2.26939054215336e-08, 9.942577428034838e-09, 9.578169368751333e-09, 9.33901134203552e-09 ], "gamma_dfa": 0.042181356100627454, "acc_eval": 0.1201171875, "loss_eval": 5.786299705505371, "epoch": 99 }, { "hidden_norms": [ 75295.7421875, 400646208.0, 110060504.0, 133875616.0, 106009536.0 ], "bp_grad_norms_per_sample_med": [ 2.8005374019812734e-08, 1.0959412544142566e-10, 1.0860218280228651e-10, 1.0863632909918763e-10, 1.0812418321792805e-10 ], "bp_grad_norms_F": [ 5.0940698201884516e-06, 2.269248788877576e-08, 9.942581868926936e-09, 9.57817469782185e-09, 9.339016671106037e-09 ], "gamma_dfa": 0.042181452532531694, "acc_eval": 0.1201171875, "loss_eval": 5.786318302154541, "epoch": 100 } ] }