{ "fa_log": [ { "hidden_norms": [ 11.269571304321289, 11.290447235107422, 11.313605308532715, 11.351215362548828, 11.398087501525879 ], "bp_grad_per_sample_l2_med": [ 0.00028353024390526116, 0.0002828188880812377, 0.00028162598027847707, 0.0002799496578518301, 0.0002791006409097463 ], "bp_grad_F": [ 0.012684082612395287, 0.01264861598610878, 0.012589854188263416, 0.012511610053479671, 0.012471316382288933 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.08450000733137131, "loss_eval": 2.4790313243865967, "epoch": 0 }, { "hidden_norms": [ 11.269571304321289, 11.457883834838867, 11.697802543640137, 12.001762390136719, 12.303658485412598 ], "bp_grad_per_sample_l2_med": [ 0.0004113642207812518, 0.00037613665335811675, 0.0003495849668979645, 0.0003221812949050218, 0.00025295966770499945 ], "bp_grad_F": [ 0.018967075273394585, 0.017186719924211502, 0.015851320698857307, 0.01445167325437069, 0.011211601085960865 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5270000100135803, "loss_eval": 1.4865981340408325, "epoch": 1 }, { "hidden_norms": [ 11.269571304321289, 11.734084129333496, 12.481009483337402, 13.659913063049316, 15.730950355529785 ], "bp_grad_per_sample_l2_med": [ 0.0007782558677718043, 0.0006171928835101426, 0.0004891889402642846, 0.00038687532651238143, 0.000231728219659999 ], "bp_grad_F": [ 0.04103676602244377, 0.03172670304775238, 0.024926593527197838, 0.019472092390060425, 0.011657902970910072 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6360000371932983, "loss_eval": 0.965207040309906, "epoch": 2 }, { "hidden_norms": [ 11.269571304321289, 11.973358154296875, 13.411399841308594, 16.07562255859375, 20.911983489990234 ], "bp_grad_per_sample_l2_med": [ 0.0008172825910151005, 0.0005784342647530138, 0.000417369301430881, 0.0003010776126757264, 0.000168764207046479 ], "bp_grad_F": [ 0.05745441094040871, 0.04039904102683067, 0.028755735605955124, 0.020857004448771477, 0.011488317511975765 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.687000036239624, "loss_eval": 0.8154960870742798, "epoch": 3 }, { "hidden_norms": [ 11.269571304321289, 12.203580856323242, 14.659997940063477, 19.929065704345703, 27.998876571655273 ], "bp_grad_per_sample_l2_med": [ 0.0007437548483721912, 0.00048129685455933213, 0.00031908220262266695, 0.00022696926316712052, 0.00012886490731034428 ], "bp_grad_F": [ 0.06721046566963196, 0.043338593095541, 0.028462719172239304, 0.019943350926041603, 0.01114331278949976 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.703000009059906, "loss_eval": 0.7722610831260681, "epoch": 4 }, { "hidden_norms": [ 11.269571304321289, 12.476441383361816, 16.378177642822266, 25.748563766479492, 36.580970764160156 ], "bp_grad_per_sample_l2_med": [ 0.0007116686902008951, 0.00042677627061493695, 0.0002665013598743826, 0.00019125515245832503, 0.0001178958555101417 ], "bp_grad_F": [ 0.06977967172861099, 0.04175141453742981, 0.02600390836596489, 0.018256530165672302, 0.010964884422719479 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7070000171661377, "loss_eval": 0.7697932720184326, "epoch": 5 }, { "hidden_norms": [ 11.269571304321289, 12.808075904846191, 19.022871017456055, 33.50295639038086, 45.75634002685547 ], "bp_grad_per_sample_l2_med": [ 0.000760514521971345, 0.000416931085055694, 0.0002524603623896837, 0.00018262627418152988, 0.0001200677506858483 ], "bp_grad_F": [ 0.0695224478840828, 0.03927718475461006, 0.023749928921461105, 0.01698874868452549, 0.011118472553789616 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7035000324249268, "loss_eval": 0.7977719902992249, "epoch": 6 }, { "hidden_norms": [ 11.269571304321289, 13.191008567810059, 22.44864273071289, 42.65863800048828, 54.38147735595703 ], "bp_grad_per_sample_l2_med": [ 0.0007628297316841781, 0.0003877072886098176, 0.00022262487618718296, 0.00016918807523325086, 0.0001183631393359974 ], "bp_grad_F": [ 0.06797165423631668, 0.03639831766486168, 0.02157149650156498, 0.015874147415161133, 0.011150078848004341 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.70250004529953, "loss_eval": 0.8099735975265503, "epoch": 7 }, { "hidden_norms": [ 11.269571304321289, 13.587474822998047, 26.61025619506836, 51.025230407714844, 61.79695129394531 ], "bp_grad_per_sample_l2_med": [ 0.0007774661062285304, 0.00037008023355156183, 0.00019806883938144892, 0.0001550534798298031, 0.00011658846779027954 ], "bp_grad_F": [ 0.06822231411933899, 0.03484996780753136, 0.02039053477346897, 0.015457017347216606, 0.011438230983912945 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6920000314712524, "loss_eval": 0.8282882571220398, "epoch": 8 }, { "hidden_norms": [ 11.269571304321289, 14.02984619140625, 31.27604866027832, 59.14579391479492, 68.8819580078125 ], "bp_grad_per_sample_l2_med": [ 0.000821497815195471, 0.000388532382203266, 0.0002036481600953266, 0.0001647671015234664, 0.00012798182433471084 ], "bp_grad_F": [ 0.06896942853927612, 0.03378934785723686, 0.019570810720324516, 0.015211639925837517, 0.01168233621865511 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6785000562667847, "loss_eval": 0.8751994967460632, "epoch": 9 }, { "hidden_norms": [ 11.269571304321289, 14.566975593566895, 37.15107345581055, 66.83728790283203, 76.04595184326172 ], "bp_grad_per_sample_l2_med": [ 0.0008561373106203973, 0.00037220801459625363, 0.00018477423873264343, 0.0001600280374987051, 0.00012663347297348082 ], "bp_grad_F": [ 0.06949204951524734, 0.033161722123622894, 0.019245225936174393, 0.015247669070959091, 0.012057062238454819 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6585000157356262, "loss_eval": 0.9142682552337646, "epoch": 10 }, { "hidden_norms": [ 11.269571304321289, 15.22678279876709, 44.73517990112305, 74.21520233154297, 82.72914123535156 ], "bp_grad_per_sample_l2_med": [ 0.0008647029753774405, 0.0003551499976310879, 0.00016902851348277181, 0.00014951576304156333, 0.0001220703707076609 ], "bp_grad_F": [ 0.06799578666687012, 0.03190648928284645, 0.018390726298093796, 0.015047998167574406, 0.01216125674545765 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6635000109672546, "loss_eval": 0.9312959313392639, "epoch": 11 }, { "hidden_norms": [ 11.269571304321289, 15.982205390930176, 53.03363037109375, 81.01543426513672, 88.02293395996094 ], "bp_grad_per_sample_l2_med": [ 0.0008814894827082753, 0.0003609499253798276, 0.00016691464406903833, 0.00015374798385892063, 0.00012832213542424142 ], "bp_grad_F": [ 0.06737235933542252, 0.030633311718702316, 0.017514588311314583, 0.014722960069775581, 0.012166885659098625 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6665000319480896, "loss_eval": 0.9171096086502075, "epoch": 12 }, { "hidden_norms": [ 11.269571304321289, 17.348485946655273, 65.39360046386719, 94.1773452758789, 97.79885864257812 ], "bp_grad_per_sample_l2_med": [ 0.0008671359973959625, 0.0003543675411492586, 0.00017760474293027073, 0.00016833240806590766, 0.0001419015898136422 ], "bp_grad_F": [ 0.06303472071886063, 0.027784455567598343, 0.016537917777895927, 0.01453208364546299, 0.012470746412873268 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6520000100135803, "loss_eval": 0.9543019533157349, "epoch": 13 }, { "hidden_norms": [ 11.269571304321289, 19.79836082458496, 82.84272003173828, 118.11077880859375, 117.29456329345703 ], "bp_grad_per_sample_l2_med": [ 0.000835613114759326, 0.00034002913162112236, 0.00017855060286819935, 0.00017689696687739342, 0.0001562273973831907 ], "bp_grad_F": [ 0.05830768123269081, 0.025488071143627167, 0.01599927246570587, 0.014500983990728855, 0.012853534892201424 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6320000290870667, "loss_eval": 0.9986603260040283, "epoch": 14 }, { "hidden_norms": [ 11.269571304321289, 24.028667449951172, 104.24053192138672, 151.45233154296875, 148.85594177246094 ], "bp_grad_per_sample_l2_med": [ 0.0008604780305176973, 0.0003412840305827558, 0.00020471647439990193, 0.00020128543837927282, 0.00018673941667657346 ], "bp_grad_F": [ 0.05637207254767418, 0.023704711347818375, 0.016045723110437393, 0.015071108937263489, 0.013779145665466785 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6110000014305115, "loss_eval": 1.08339262008667, "epoch": 15 }, { "hidden_norms": [ 11.269571304321289, 31.199304580688477, 135.36643981933594, 190.8426971435547, 189.1505126953125 ], "bp_grad_per_sample_l2_med": [ 0.000760686700232327, 0.0002976131218019873, 0.00019266465096734464, 0.0001927861594595015, 0.0001783591287676245 ], "bp_grad_F": [ 0.04442710801959038, 0.020077738910913467, 0.0149933947250247, 0.014391067437827587, 0.01344863511621952 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6480000019073486, "loss_eval": 1.0371382236480713, "epoch": 16 }, { "hidden_norms": [ 11.269571304321289, 41.846805572509766, 170.3418731689453, 225.09695434570312, 224.6548614501953 ], "bp_grad_per_sample_l2_med": [ 0.0007461759960278869, 0.00026667246129363775, 0.00018387376621831208, 0.00018445710884407163, 0.00017204758478328586 ], "bp_grad_F": [ 0.039136338979005814, 0.018771812319755554, 0.015547079034149647, 0.01513050775974989, 0.01431551855057478 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6200000047683716, "loss_eval": 1.1162669658660889, "epoch": 17 }, { "hidden_norms": [ 11.269571304321289, 57.18465042114258, 206.83914184570312, 262.21197509765625, 260.03485107421875 ], "bp_grad_per_sample_l2_med": [ 0.0007871078560128808, 0.00029353986610658467, 0.00022458977764472365, 0.00022484370856545866, 0.00021257037587929517 ], "bp_grad_F": [ 0.03888345882296562, 0.01824026368558407, 0.015890181064605713, 0.015627194195985794, 0.014916189946234226 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5615000128746033, "loss_eval": 1.2106062173843384, "epoch": 18 }, { "hidden_norms": [ 11.269571304321289, 75.66644287109375, 241.24891662597656, 298.0739440917969, 293.95281982421875 ], "bp_grad_per_sample_l2_med": [ 0.000782749499194324, 0.0002943766303360462, 0.00024086510529741645, 0.00024184907670132816, 0.0002289286785526201 ], "bp_grad_F": [ 0.03717740252614021, 0.01794801466166973, 0.016123440116643906, 0.0158899687230587, 0.015260584652423859 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5680000185966492, "loss_eval": 1.1780248880386353, "epoch": 19 }, { "hidden_norms": [ 11.269571304321289, 97.68470764160156, 276.2217712402344, 334.56146240234375, 329.1627502441406 ], "bp_grad_per_sample_l2_med": [ 0.0007400053436867893, 0.00028874175040982664, 0.00024344309349544346, 0.0002433314366498962, 0.00023140427947510034 ], "bp_grad_F": [ 0.03569746017456055, 0.0169936865568161, 0.015504195354878902, 0.015339999459683895, 0.014785589650273323 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5745000243186951, "loss_eval": 1.1848244667053223, "epoch": 20 }, { "hidden_norms": [ 11.269571304321289, 123.06426239013672, 312.8515625, 373.4215087890625, 366.50213623046875 ], "bp_grad_per_sample_l2_med": [ 0.0007171913748607039, 0.00026914477348327637, 0.00023370776034425944, 0.00023370303097181022, 0.0002235924475826323 ], "bp_grad_F": [ 0.03427436947822571, 0.016933348029851913, 0.015780098736286163, 0.015659287571907043, 0.015169495716691017 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5715000033378601, "loss_eval": 1.2063732147216797, "epoch": 21 }, { "hidden_norms": [ 11.269571304321289, 153.3316650390625, 353.62042236328125, 417.3258361816406, 408.16680908203125 ], "bp_grad_per_sample_l2_med": [ 0.0007328973151743412, 0.000268118514213711, 0.00024018273688852787, 0.00024114495317917317, 0.0002314754092367366 ], "bp_grad_F": [ 0.033994678407907486, 0.016857070848345757, 0.01595945656299591, 0.01587284542620182, 0.015459166839718819 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5450000166893005, "loss_eval": 1.2801684141159058, "epoch": 22 }, { "hidden_norms": [ 11.269571304321289, 187.16934204101562, 397.18280029296875, 464.5965881347656, 453.26629638671875 ], "bp_grad_per_sample_l2_med": [ 0.0007429302204400301, 0.0002756037574727088, 0.0002533047809265554, 0.0002549285418353975, 0.00024467214825563133 ], "bp_grad_F": [ 0.03400976210832596, 0.017134130001068115, 0.016380103304982185, 0.016292234882712364, 0.015935255214571953 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5055000185966492, "loss_eval": 1.4238585233688354, "epoch": 23 }, { "hidden_norms": [ 11.269571304321289, 221.9723663330078, 441.26580810546875, 512.8148193359375, 498.7379455566406 ], "bp_grad_per_sample_l2_med": [ 0.0006891476223245263, 0.00027131737442687154, 0.0002505357551854104, 0.000251909252256155, 0.0002428782609058544 ], "bp_grad_F": [ 0.032484397292137146, 0.01684476062655449, 0.01627412810921669, 0.016195174306631088, 0.015904447063803673 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5290000438690186, "loss_eval": 1.3381338119506836, "epoch": 24 }, { "hidden_norms": [ 11.269571304321289, 256.86456298828125, 485.2987060546875, 561.24755859375, 544.2046508789062 ], "bp_grad_per_sample_l2_med": [ 0.0007065363461151719, 0.0002826322161126882, 0.00026495553902350366, 0.0002664696949068457, 0.0002584822941571474 ], "bp_grad_F": [ 0.032581742852926254, 0.017135880887508392, 0.01663898676633835, 0.01656418852508068, 0.016318844631314278 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.468500018119812, "loss_eval": 1.4673320055007935, "epoch": 25 }, { "hidden_norms": [ 11.269571304321289, 290.3281555175781, 528.4644165039062, 609.61181640625, 589.482421875 ], "bp_grad_per_sample_l2_med": [ 0.0007876601885072887, 0.000328866473864764, 0.0003142827481497079, 0.0003149702097289264, 0.00030780391534790397 ], "bp_grad_F": [ 0.0356873981654644, 0.01825507916510105, 0.01779749058187008, 0.017760321497917175, 0.0175130907446146 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35200002789497375, "loss_eval": 1.82278311252594, "epoch": 26 }, { "hidden_norms": [ 11.269571304321289, 324.2997131347656, 572.9197387695312, 659.7073364257812, 635.6883544921875 ], "bp_grad_per_sample_l2_med": [ 0.0006818437832407653, 0.000307896378217265, 0.0002974055823870003, 0.000297438440611586, 0.0002942352439276874 ], "bp_grad_F": [ 0.03148573637008667, 0.017155593261122704, 0.016821201890707016, 0.01674988865852356, 0.016609078273177147 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4540000259876251, "loss_eval": 1.4913204908370972, "epoch": 27 }, { "hidden_norms": [ 11.269571304321289, 357.986572265625, 616.8123168945312, 709.2523193359375, 681.3218994140625 ], "bp_grad_per_sample_l2_med": [ 0.0006822228315286338, 0.00030397844966501, 0.0002927799359895289, 0.0002928805770352483, 0.0002893624478019774 ], "bp_grad_F": [ 0.03142063319683075, 0.017380017787218094, 0.017113016918301582, 0.017052780836820602, 0.01693262904882431 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.42250001430511475, "loss_eval": 1.574558138847351, "epoch": 28 }, { "hidden_norms": [ 11.269571304321289, 391.00396728515625, 660.1432495117188, 758.46875, 726.479248046875 ], "bp_grad_per_sample_l2_med": [ 0.0006576834712177515, 0.00029913688194938004, 0.0002909695322159678, 0.00029160548001527786, 0.0002882194530684501 ], "bp_grad_F": [ 0.03063797578215599, 0.01751694455742836, 0.017304742708802223, 0.017256034538149834, 0.017157413065433502 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.41700002551078796, "loss_eval": 1.5943682193756104, "epoch": 29 }, { "hidden_norms": [ 11.269571304321289, 423.0135803222656, 702.8653564453125, 807.1064453125, 771.0443115234375 ], "bp_grad_per_sample_l2_med": [ 0.0007106211851350963, 0.00032867168192751706, 0.0003195058961864561, 0.0003205789253115654, 0.00031724729342386127 ], "bp_grad_F": [ 0.032083574682474136, 0.018385307863354683, 0.01818086951971054, 0.018159352242946625, 0.01808425784111023 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3240000009536743, "loss_eval": 1.9495495557785034, "epoch": 30 }, { "hidden_norms": [ 11.269571304321289, 453.1861267089844, 743.7100219726562, 853.8812255859375, 813.7102661132812 ], "bp_grad_per_sample_l2_med": [ 0.0006489204824902117, 0.0002889770839828998, 0.00028184326947666705, 0.00028282302082516253, 0.00027834190404973924 ], "bp_grad_F": [ 0.029847772791981697, 0.017620669677853584, 0.017466910183429718, 0.01743420958518982, 0.017375603318214417 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3970000147819519, "loss_eval": 1.6998002529144287, "epoch": 31 }, { "hidden_norms": [ 11.269571304321289, 480.8240661621094, 781.491943359375, 897.1333618164062, 853.1820678710938 ], "bp_grad_per_sample_l2_med": [ 0.0006337798549793661, 0.0003062748000957072, 0.0003002039447892457, 0.00030039221746847034, 0.0002973877126350999 ], "bp_grad_F": [ 0.029168229550123215, 0.017783651128411293, 0.017649564892053604, 0.017613932490348816, 0.01756826601922512 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3865000307559967, "loss_eval": 1.7693381309509277, "epoch": 32 }, { "hidden_norms": [ 11.269571304321289, 505.9931945800781, 816.3653564453125, 937.6511840820312, 890.0263061523438 ], "bp_grad_per_sample_l2_med": [ 0.0006363698630593717, 0.000327500601997599, 0.0003217202320229262, 0.0003208804700989276, 0.0003201036306563765 ], "bp_grad_F": [ 0.029376372694969177, 0.018225492909550667, 0.01810493879020214, 0.01805899664759636, 0.018048716709017754 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3400000035762787, "loss_eval": 1.777511477470398, "epoch": 33 }, { "hidden_norms": [ 11.269571304321289, 530.9385375976562, 850.9844970703125, 977.412841796875, 926.3417358398438 ], "bp_grad_per_sample_l2_med": [ 0.0006240232032723725, 0.00032233193633146584, 0.00031883586780168116, 0.0003202730731572956, 0.0003188494883943349 ], "bp_grad_F": [ 0.028516914695501328, 0.018217962235212326, 0.018127964809536934, 0.018103662878274918, 0.018076416105031967 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.36250001192092896, "loss_eval": 1.7461223602294922, "epoch": 34 }, { "hidden_norms": [ 11.269571304321289, 555.9691162109375, 885.6592407226562, 1017.6103515625, 962.8530883789062 ], "bp_grad_per_sample_l2_med": [ 0.0005949487676844001, 0.0003172095457557589, 0.00031312211649492383, 0.0003130651020910591, 0.0003118007443845272 ], "bp_grad_F": [ 0.027917204424738884, 0.018052855506539345, 0.017963001504540443, 0.01793370023369789, 0.017934400588274002 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3775000274181366, "loss_eval": 1.7961357831954956, "epoch": 35 }, { "hidden_norms": [ 11.269571304321289, 580.1717529296875, 919.149169921875, 1056.32470703125, 998.1345825195312 ], "bp_grad_per_sample_l2_med": [ 0.0006010148790664971, 0.0003237369528505951, 0.00031987245893105865, 0.00031991174910217524, 0.0003188104019500315 ], "bp_grad_F": [ 0.027771273627877235, 0.017915818840265274, 0.017828019335865974, 0.017802555114030838, 0.017808666452765465 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.37400001287460327, "loss_eval": 1.8124159574508667, "epoch": 36 }, { "hidden_norms": [ 11.269571304321289, 602.5966186523438, 950.484619140625, 1092.6507568359375, 1031.02294921875 ], "bp_grad_per_sample_l2_med": [ 0.0005852986359968781, 0.0003249783185310662, 0.00032142180134542286, 0.0003207105037290603, 0.00032108003506436944 ], "bp_grad_F": [ 0.02701820805668831, 0.01796947605907917, 0.017892232164740562, 0.017859354615211487, 0.01788966730237007 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34950003027915955, "loss_eval": 1.7797815799713135, "epoch": 37 }, { "hidden_norms": [ 11.269571304321289, 624.4447021484375, 981.1150512695312, 1127.90234375, 1063.09228515625 ], "bp_grad_per_sample_l2_med": [ 0.0005775236058980227, 0.0003046133788302541, 0.00030120721203275025, 0.00030136521672829986, 0.00029937425279058516 ], "bp_grad_F": [ 0.026447290554642677, 0.017799606546759605, 0.017730647698044777, 0.017701666802167892, 0.017717311158776283 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3630000054836273, "loss_eval": 1.7884948253631592, "epoch": 38 }, { "hidden_norms": [ 11.269571304321289, 644.9402465820312, 1010.1371459960938, 1161.7808837890625, 1093.9410400390625 ], "bp_grad_per_sample_l2_med": [ 0.000567529525142163, 0.00032071411260403693, 0.0003186226240359247, 0.0003186469548381865, 0.000316357531119138 ], "bp_grad_F": [ 0.02652687579393387, 0.018418341875076294, 0.018360882997512817, 0.018340308219194412, 0.018352536484599113 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3375000059604645, "loss_eval": 1.894034743309021, "epoch": 39 }, { "hidden_norms": [ 11.269571304321289, 664.6719970703125, 1038.15478515625, 1194.3914794921875, 1123.5455322265625 ], "bp_grad_per_sample_l2_med": [ 0.0005615526461042464, 0.0003110080724582076, 0.00030868081375956535, 0.00030884178704582155, 0.0003081669274251908 ], "bp_grad_F": [ 0.025895435363054276, 0.01783018186688423, 0.017772147431969643, 0.017754852771759033, 0.01777641288936138 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3395000100135803, "loss_eval": 1.9033000469207764, "epoch": 40 }, { "hidden_norms": [ 11.269571304321289, 683.78173828125, 1065.281005859375, 1225.9638671875, 1152.131591796875 ], "bp_grad_per_sample_l2_med": [ 0.0005448339506983757, 0.0003069988451898098, 0.0003048715298064053, 0.0003052430984098464, 0.00030476890970021486 ], "bp_grad_F": [ 0.025077223777770996, 0.017541181296110153, 0.017490437254309654, 0.01747160218656063, 0.017498185858130455 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3840000033378601, "loss_eval": 1.7054094076156616, "epoch": 41 }, { "hidden_norms": [ 11.269571304321289, 701.634033203125, 1090.699462890625, 1255.5677490234375, 1178.950927734375 ], "bp_grad_per_sample_l2_med": [ 0.0005554261151701212, 0.0003436058177612722, 0.0003414751263335347, 0.0003412873193155974, 0.0003412757650949061 ], "bp_grad_F": [ 0.025991667062044144, 0.018797792494297028, 0.01875895820558071, 0.018737811595201492, 0.01877579651772976 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.2985000014305115, "loss_eval": 1.9454095363616943, "epoch": 42 }, { "hidden_norms": [ 11.269571304321289, 718.1909790039062, 1114.3717041015625, 1283.2196044921875, 1204.0418701171875 ], "bp_grad_per_sample_l2_med": [ 0.0005466453148983419, 0.00032576482044532895, 0.00032447546254843473, 0.0003244927211198956, 0.0003245829720981419 ], "bp_grad_F": [ 0.025174839422106743, 0.01795799843966961, 0.01791331358253956, 0.017896415665745735, 0.017930971458554268 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3190000057220459, "loss_eval": 1.9117376804351807, "epoch": 43 }, { "hidden_norms": [ 11.269571304321289, 734.4074096679688, 1137.696044921875, 1310.3448486328125, 1228.5693359375 ], "bp_grad_per_sample_l2_med": [ 0.0005316757597029209, 0.00032565969740971923, 0.00032383095822297037, 0.00032448669662699103, 0.0003247321583330631 ], "bp_grad_F": [ 0.024759862571954727, 0.01794862188398838, 0.01790694147348404, 0.017891528084874153, 0.017931628972291946 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3320000171661377, "loss_eval": 1.8898653984069824, "epoch": 44 }, { "hidden_norms": [ 11.269571304321289, 749.4878540039062, 1159.565185546875, 1335.8013916015625, 1251.6041259765625 ], "bp_grad_per_sample_l2_med": [ 0.0005168311763554811, 0.00031509375548921525, 0.0003133788122795522, 0.0003133984573651105, 0.0003139932523481548 ], "bp_grad_F": [ 0.0242743082344532, 0.01778865046799183, 0.0177480336278677, 0.017732009291648865, 0.01776931621134281 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3360000252723694, "loss_eval": 1.809171199798584, "epoch": 45 }, { "hidden_norms": [ 11.269571304321289, 763.5787353515625, 1180.0230712890625, 1359.6865234375, 1273.1715087890625 ], "bp_grad_per_sample_l2_med": [ 0.0005242779734544456, 0.0003271555178798735, 0.00032485066913068295, 0.0003253788163419813, 0.00032494115293957293 ], "bp_grad_F": [ 0.024425320327281952, 0.01821528747677803, 0.018175508826971054, 0.018160372972488403, 0.01819770224392414 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3290000259876251, "loss_eval": 1.8727153539657593, "epoch": 46 }, { "hidden_norms": [ 11.269571304321289, 777.29833984375, 1199.8975830078125, 1382.7962646484375, 1294.0777587890625 ], "bp_grad_per_sample_l2_med": [ 0.0005091701750643551, 0.0003165322996210307, 0.00031451781978830695, 0.00031486450461670756, 0.00031427579233422875 ], "bp_grad_F": [ 0.023803148418664932, 0.017688797786831856, 0.017653871327638626, 0.01764090545475483, 0.017672821879386902 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3570000231266022, "loss_eval": 1.7817366123199463, "epoch": 47 }, { "hidden_norms": [ 11.269571304321289, 789.7103881835938, 1218.070556640625, 1403.869384765625, 1313.1611328125 ], "bp_grad_per_sample_l2_med": [ 0.000508163939230144, 0.00031658579246141016, 0.0003145384253002703, 0.0003149410185869783, 0.000314467353746295 ], "bp_grad_F": [ 0.023785017430782318, 0.017845386639237404, 0.01781085878610611, 0.017796490341424942, 0.017827292904257774 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3255000114440918, "loss_eval": 1.9139658212661743, "epoch": 48 }, { "hidden_norms": [ 11.269571304321289, 801.9373779296875, 1235.8994140625, 1424.5323486328125, 1331.8375244140625 ], "bp_grad_per_sample_l2_med": [ 0.0004862714558839798, 0.0002926513261627406, 0.0002908864407800138, 0.0002910781477112323, 0.0002900509862229228 ], "bp_grad_F": [ 0.023361189290881157, 0.01766069605946541, 0.01763027161359787, 0.017619280144572258, 0.017652587965130806 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.36100003123283386, "loss_eval": 1.8068753480911255, "epoch": 49 }, { "hidden_norms": [ 11.269571304321289, 813.853515625, 1253.337890625, 1444.873779296875, 1350.2630615234375 ], "bp_grad_per_sample_l2_med": [ 0.00048765321844257414, 0.000307347479974851, 0.00030599997262470424, 0.000306078844005242, 0.000305346620734781 ], "bp_grad_F": [ 0.023688213899731636, 0.01818004995584488, 0.018153388053178787, 0.018142297863960266, 0.018173247575759888 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3360000252723694, "loss_eval": 1.8813791275024414, "epoch": 50 }, { "hidden_norms": [ 11.269571304321289, 824.7192993164062, 1269.39208984375, 1463.5384521484375, 1367.15625 ], "bp_grad_per_sample_l2_med": [ 0.0004835445433855057, 0.0003096247965004295, 0.0003079361922573298, 0.00030804326524958014, 0.0003073872940149158 ], "bp_grad_F": [ 0.02330639213323593, 0.01797325722873211, 0.0179448202252388, 0.017932146787643433, 0.0179706122726202 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34150001406669617, "loss_eval": 1.8429521322250366, "epoch": 51 }, { "hidden_norms": [ 11.269571304321289, 834.9524536132812, 1284.4827880859375, 1481.0673828125, 1383.0155029296875 ], "bp_grad_per_sample_l2_med": [ 0.00047791830729693174, 0.0003027814091183245, 0.0003019821015186608, 0.0003020255535375327, 0.0003012260131072253 ], "bp_grad_F": [ 0.02303098328411579, 0.01771283708512783, 0.01768432930111885, 0.017673376947641373, 0.01770668476819992 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34850001335144043, "loss_eval": 1.8080617189407349, "epoch": 52 }, { "hidden_norms": [ 11.269571304321289, 844.5447998046875, 1298.628662109375, 1497.57373046875, 1397.9241943359375 ], "bp_grad_per_sample_l2_med": [ 0.000483115843962878, 0.0003182529762852937, 0.00031743990257382393, 0.0003175203746650368, 0.0003175794845446944 ], "bp_grad_F": [ 0.02306683361530304, 0.01790531352162361, 0.017880147323012352, 0.017869742587208748, 0.017903709784150124 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.33100003004074097, "loss_eval": 1.8166543245315552, "epoch": 53 }, { "hidden_norms": [ 11.269571304321289, 853.7017822265625, 1312.1446533203125, 1513.2933349609375, 1412.1080322265625 ], "bp_grad_per_sample_l2_med": [ 0.00047640595585107803, 0.00031948628020472825, 0.00031817753915674984, 0.00031873476109467447, 0.0003185000387020409 ], "bp_grad_F": [ 0.022898783907294273, 0.017956143245100975, 0.017929796129465103, 0.017917128279805183, 0.017962384968996048 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.33800002932548523, "loss_eval": 1.8004838228225708, "epoch": 54 }, { "hidden_norms": [ 11.269571304321289, 862.0558471679688, 1324.4920654296875, 1527.697509765625, 1425.1290283203125 ], "bp_grad_per_sample_l2_med": [ 0.0004698090488091111, 0.00029860963695682585, 0.0002971645735669881, 0.0002974079397972673, 0.00029624722083099186 ], "bp_grad_F": [ 0.022676818072795868, 0.01772218942642212, 0.017698047682642937, 0.017688868567347527, 0.01772254891693592 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3530000150203705, "loss_eval": 1.8075289726257324, "epoch": 55 }, { "hidden_norms": [ 11.269571304321289, 869.9756469726562, 1336.185791015625, 1541.3792724609375, 1437.4677734375 ], "bp_grad_per_sample_l2_med": [ 0.0004706987820100039, 0.0003098493325524032, 0.0003085599164478481, 0.0003086493816226721, 0.0003082384937442839 ], "bp_grad_F": [ 0.022675253450870514, 0.01779225468635559, 0.017767589539289474, 0.017757505178451538, 0.017791779711842537 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34150001406669617, "loss_eval": 1.827038288116455, "epoch": 56 }, { "hidden_norms": [ 11.269571304321289, 877.3834838867188, 1347.156982421875, 1554.1087646484375, 1448.9537353515625 ], "bp_grad_per_sample_l2_med": [ 0.000473314750706777, 0.00030716857872903347, 0.0003054763947147876, 0.0003060955787077546, 0.0003047685313504189 ], "bp_grad_F": [ 0.02272479608654976, 0.01781822182238102, 0.017794664949178696, 0.01778644695878029, 0.01781868003308773 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.32450002431869507, "loss_eval": 1.8790045976638794, "epoch": 57 }, { "hidden_norms": [ 11.269571304321289, 884.1793212890625, 1357.25146484375, 1565.88232421875, 1459.538818359375 ], "bp_grad_per_sample_l2_med": [ 0.00046717250370420516, 0.00030950061045587063, 0.000308411312289536, 0.00030838610837236047, 0.00030820758547633886 ], "bp_grad_F": [ 0.02260792814195156, 0.017898347228765488, 0.017876161262392998, 0.017865851521492004, 0.01790330745279789 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3225000202655792, "loss_eval": 1.8583427667617798, "epoch": 58 }, { "hidden_norms": [ 11.269571304321289, 890.4108276367188, 1366.517333984375, 1576.69921875, 1469.300537109375 ], "bp_grad_per_sample_l2_med": [ 0.0004612848279066384, 0.00030920191784389317, 0.0003086488868575543, 0.0003085103817284107, 0.0003084034251514822 ], "bp_grad_F": [ 0.022702287882566452, 0.018074622377753258, 0.01805359311401844, 0.018043993040919304, 0.018074078485369682 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.33250001072883606, "loss_eval": 1.8819878101348877, "epoch": 59 }, { "hidden_norms": [ 11.269571304321289, 896.1082763671875, 1374.973388671875, 1586.524169921875, 1478.1490478515625 ], "bp_grad_per_sample_l2_med": [ 0.00046731752809137106, 0.0003127296222373843, 0.00031115938327275217, 0.0003112337435595691, 0.00031117399339564145 ], "bp_grad_F": [ 0.022609086707234383, 0.018025977537035942, 0.01800408773124218, 0.017995676025748253, 0.018028175458312035 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3150000274181366, "loss_eval": 1.8731034994125366, "epoch": 60 }, { "hidden_norms": [ 11.269571304321289, 901.4246826171875, 1382.871337890625, 1595.7164306640625, 1486.465576171875 ], "bp_grad_per_sample_l2_med": [ 0.0004559764638543129, 0.00029873938183300197, 0.00029821961652487516, 0.0002982193836942315, 0.0002976148098241538 ], "bp_grad_F": [ 0.022443631663918495, 0.017807144671678543, 0.01778426393866539, 0.017775312066078186, 0.017809107899665833 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3190000057220459, "loss_eval": 1.9132741689682007, "epoch": 61 }, { "hidden_norms": [ 11.269571304321289, 906.219970703125, 1389.97998046875, 1603.95458984375, 1493.869384765625 ], "bp_grad_per_sample_l2_med": [ 0.00045692393905483186, 0.000307796144625172, 0.0003068537334911525, 0.0003067644138354808, 0.0003064550110138953 ], "bp_grad_F": [ 0.022245025262236595, 0.017795003950595856, 0.0177734587341547, 0.017764581367373466, 0.017800522968173027 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3270000219345093, "loss_eval": 1.8190391063690186, "epoch": 62 }, { "hidden_norms": [ 11.269571304321289, 910.5570678710938, 1396.3927001953125, 1611.4957275390625, 1500.6524658203125 ], "bp_grad_per_sample_l2_med": [ 0.00045115925604477525, 0.00029847086989320815, 0.0002977230178657919, 0.0002977572148665786, 0.0002975583774968982 ], "bp_grad_F": [ 0.02203645370900631, 0.017681924626231194, 0.01766141690313816, 0.017652763053774834, 0.0176865067332983 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35500001907348633, "loss_eval": 1.7965762615203857, "epoch": 63 }, { "hidden_norms": [ 11.269571304321289, 914.5003662109375, 1402.2757568359375, 1618.2999267578125, 1506.7991943359375 ], "bp_grad_per_sample_l2_med": [ 0.0004569143056869507, 0.00029972344054840505, 0.0002987241605296731, 0.0002987434563692659, 0.00029907189309597015 ], "bp_grad_F": [ 0.022272884845733643, 0.01781252957880497, 0.017791228368878365, 0.017782466486096382, 0.017818717285990715 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.328000009059906, "loss_eval": 1.8610442876815796, "epoch": 64 }, { "hidden_norms": [ 11.269571304321289, 918.0006103515625, 1407.5118408203125, 1624.3853759765625, 1512.30029296875 ], "bp_grad_per_sample_l2_med": [ 0.00045414711348712444, 0.00030931030050851405, 0.0003081976028624922, 0.0003081892791669816, 0.0003081847680732608 ], "bp_grad_F": [ 0.022085461765527725, 0.01779778115451336, 0.017776912078261375, 0.017768092453479767, 0.01780613884329796 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34300002455711365, "loss_eval": 1.804802417755127, "epoch": 65 }, { "hidden_norms": [ 11.269571304321289, 921.121826171875, 1412.175537109375, 1629.830810546875, 1517.2005615234375 ], "bp_grad_per_sample_l2_med": [ 0.0004531690792646259, 0.00031135816243477166, 0.00031044447678141296, 0.00031072759884409606, 0.0003106470685452223 ], "bp_grad_F": [ 0.022044293582439423, 0.017750630155205727, 0.017730476334691048, 0.017722314223647118, 0.017757223919034004 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34150001406669617, "loss_eval": 1.8111987113952637, "epoch": 66 }, { "hidden_norms": [ 11.269571304321289, 923.8903198242188, 1416.300048828125, 1634.646484375, 1521.5411376953125 ], "bp_grad_per_sample_l2_med": [ 0.0004468595434445888, 0.0003022409218829125, 0.00030127677018754184, 0.00030117464484646916, 0.00030144210904836655 ], "bp_grad_F": [ 0.02193099819123745, 0.017699316143989563, 0.017679594457149506, 0.017671333625912666, 0.017706507816910744 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3525000214576721, "loss_eval": 1.797281265258789, "epoch": 67 }, { "hidden_norms": [ 11.269571304321289, 926.2950439453125, 1419.8856201171875, 1638.8184814453125, 1525.284423828125 ], "bp_grad_per_sample_l2_med": [ 0.00044905568938702345, 0.00030229080584831536, 0.00030173707637004554, 0.0003015522670466453, 0.0003012538072653115 ], "bp_grad_F": [ 0.021881939843297005, 0.017657367512583733, 0.017637958750128746, 0.017629873007535934, 0.01766354590654373 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34800001978874207, "loss_eval": 1.8036439418792725, "epoch": 68 }, { "hidden_norms": [ 11.269571304321289, 928.36181640625, 1422.943359375, 1642.3917236328125, 1528.47705078125 ], "bp_grad_per_sample_l2_med": [ 0.0004465414967853576, 0.00030299098580144346, 0.00030190899269655347, 0.00030191292171366513, 0.000301982625387609 ], "bp_grad_F": [ 0.02188783325254917, 0.01768629439175129, 0.01766696758568287, 0.017658723518252373, 0.017692700028419495 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.359000027179718, "loss_eval": 1.7996938228607178, "epoch": 69 }, { "hidden_norms": [ 11.269571304321289, 930.1182861328125, 1425.561279296875, 1645.422607421875, 1531.2088623046875 ], "bp_grad_per_sample_l2_med": [ 0.0004439539334271103, 0.00030093194800429046, 0.00030001465347595513, 0.0003001568838953972, 0.0002998457639478147 ], "bp_grad_F": [ 0.021926432847976685, 0.01775786094367504, 0.017738472670316696, 0.01773017831146717, 0.01776653714478016 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35200002789497375, "loss_eval": 1.8030681610107422, "epoch": 70 }, { "hidden_norms": [ 11.269571304321289, 931.579345703125, 1427.7337646484375, 1647.9693603515625, 1533.509033203125 ], "bp_grad_per_sample_l2_med": [ 0.00044511700980365276, 0.00030080872238613665, 0.00030003004940226674, 0.0003000932920258492, 0.00029993904172442853 ], "bp_grad_F": [ 0.021828416734933853, 0.017681054770946503, 0.017661932855844498, 0.017653752118349075, 0.017688728868961334 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35200002789497375, "loss_eval": 1.7960853576660156, "epoch": 71 }, { "hidden_norms": [ 11.269571304321289, 932.7696533203125, 1429.520751953125, 1650.0577392578125, 1535.389892578125 ], "bp_grad_per_sample_l2_med": [ 0.0004446738166734576, 0.0003006414044648409, 0.00030009649344719946, 0.0003001675067935139, 0.00029965140856802464 ], "bp_grad_F": [ 0.021837500855326653, 0.01768680103123188, 0.017667656764388084, 0.017659684643149376, 0.017694275826215744 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35450002551078796, "loss_eval": 1.8004000186920166, "epoch": 72 }, { "hidden_norms": [ 11.269571304321289, 933.7157592773438, 1430.9381103515625, 1651.7154541015625, 1536.879638671875 ], "bp_grad_per_sample_l2_med": [ 0.00044473307207226753, 0.00030047594918869436, 0.0002997968113049865, 0.00029963525594212115, 0.00029955641366541386 ], "bp_grad_F": [ 0.0217889491468668, 0.01765742339193821, 0.01763851009309292, 0.01763063855469227, 0.017664924263954163 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3555000126361847, "loss_eval": 1.7942780256271362, "epoch": 73 }, { "hidden_norms": [ 11.269571304321289, 934.4593505859375, 1432.0382080078125, 1652.9989013671875, 1538.0234375 ], "bp_grad_per_sample_l2_med": [ 0.0004453740257304162, 0.0003002033627126366, 0.00029949398594908416, 0.00029964259010739625, 0.0002993734087795019 ], "bp_grad_F": [ 0.021799130365252495, 0.017666727304458618, 0.0176478810608387, 0.017639974132180214, 0.017674267292022705 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.34550002217292786, "loss_eval": 1.800949215888977, "epoch": 74 }, { "hidden_norms": [ 11.269571304321289, 934.9984741210938, 1432.84814453125, 1653.939697265625, 1538.8624267578125 ], "bp_grad_per_sample_l2_med": [ 0.00044546957360580564, 0.0003038236463908106, 0.000302964064758271, 0.00030298702768050134, 0.00030283271917141974 ], "bp_grad_F": [ 0.021853182464838028, 0.017717286944389343, 0.017698239535093307, 0.017690137028694153, 0.01772582344710827 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35600000619888306, "loss_eval": 1.800832986831665, "epoch": 75 }, { "hidden_norms": [ 11.269571304321289, 935.3856201171875, 1433.427490234375, 1654.6126708984375, 1539.4669189453125 ], "bp_grad_per_sample_l2_med": [ 0.00044487748527899384, 0.00030164900817908347, 0.00030081532895565033, 0.00030082385637797415, 0.000300481216982007 ], "bp_grad_F": [ 0.02177177555859089, 0.017657004296779633, 0.017638202756643295, 0.017630264163017273, 0.01766461506485939 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3490000069141388, "loss_eval": 1.794891119003296, "epoch": 76 }, { "hidden_norms": [ 11.269571304321289, 935.636474609375, 1433.79345703125, 1655.038330078125, 1539.8505859375 ], "bp_grad_per_sample_l2_med": [ 0.0004437313473317772, 0.00030232034623622894, 0.0003012971137650311, 0.00030129036167636514, 0.00030084658646956086 ], "bp_grad_F": [ 0.021787401288747787, 0.0176764614880085, 0.017657602205872536, 0.017649594694375992, 0.017684470862150192 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35350000858306885, "loss_eval": 1.7952260971069336, "epoch": 77 }, { "hidden_norms": [ 11.269571304321289, 935.7716064453125, 1433.996826171875, 1655.2738037109375, 1540.06298828125 ], "bp_grad_per_sample_l2_med": [ 0.00044510490261018276, 0.0003025131591130048, 0.00030167156364768744, 0.0003019055584445596, 0.00030186952790245414 ], "bp_grad_F": [ 0.02179691381752491, 0.017687244340777397, 0.017668338492512703, 0.017660312354564667, 0.01769554615020752 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35200002789497375, "loss_eval": 1.7945536375045776, "epoch": 78 }, { "hidden_norms": [ 11.269571304321289, 935.8350830078125, 1434.09326171875, 1655.3861083984375, 1540.164794921875 ], "bp_grad_per_sample_l2_med": [ 0.00044426857493817806, 0.0003006447514053434, 0.0002995560353156179, 0.0002996143593918532, 0.0002996891853399575 ], "bp_grad_F": [ 0.02177303098142147, 0.017660290002822876, 0.017641469836235046, 0.017633574083447456, 0.01766815222799778 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.35850000381469727, "loss_eval": 1.7939436435699463, "epoch": 79 }, { "hidden_norms": [ 11.269571304321289, 935.8506469726562, 1434.11669921875, 1655.4130859375, 1540.189208984375 ], "bp_grad_per_sample_l2_med": [ 0.00044382456690073013, 0.0003010118380188942, 0.0003002960584126413, 0.00030042475555092096, 0.00029991925111971796 ], "bp_grad_F": [ 0.021775126457214355, 0.01766343042254448, 0.017644599080085754, 0.017636677250266075, 0.017671329900622368 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3595000207424164, "loss_eval": 1.7936068773269653, "epoch": 80 } ], "seed": 42, "alpha": 1.0, "depth": 4, "d_hidden": 128 }