{ "fa_log": [ { "hidden_norms": [ 11.269571304321289, 11.290447235107422, 11.313605308532715, 11.351215362548828, 11.398087501525879 ], "bp_grad_per_sample_l2_med": [ 0.00028353024390526116, 0.0002828188880812377, 0.00028162598027847707, 0.0002799496578518301, 0.0002791006409097463 ], "bp_grad_F": [ 0.012684082612395287, 0.01264861598610878, 0.012589854188263416, 0.012511610053479671, 0.012471316382288933 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.08450000733137131, "loss_eval": 2.4790313243865967, "epoch": 0 }, { "hidden_norms": [ 11.269571304321289, 11.460872650146484, 11.70040512084961, 12.004783630371094, 12.311223030090332 ], "bp_grad_per_sample_l2_med": [ 0.0004118149809073657, 0.0003761148836929351, 0.00034950554254464805, 0.00032246875343844295, 0.0002528287877794355 ], "bp_grad_F": [ 0.018988799303770065, 0.017196672037243843, 0.015853216871619225, 0.014456234872341156, 0.011207858100533485 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5265000462532043, "loss_eval": 1.4851115942001343, "epoch": 1 }, { "hidden_norms": [ 11.269571304321289, 11.751569747924805, 12.541290283203125, 13.77841567993164, 15.976567268371582 ], "bp_grad_per_sample_l2_med": [ 0.0007904200465418398, 0.0006201046635396779, 0.0004867047828156501, 0.0003823215956799686, 0.00022867691586725414 ], "bp_grad_F": [ 0.041881538927555084, 0.03210915997624397, 0.025059428066015244, 0.01950555481016636, 0.011618814431130886 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6350000500679016, "loss_eval": 0.959205687046051, "epoch": 2 }, { "hidden_norms": [ 11.269571304321289, 12.018173217773438, 13.625839233398438, 16.65739631652832, 22.032325744628906 ], "bp_grad_per_sample_l2_med": [ 0.0008111135102808475, 0.0005643682088702917, 0.0004009789554402232, 0.00029031067970208824, 0.00016489777772221714 ], "bp_grad_F": [ 0.059235598891973495, 0.040808264166116714, 0.02855612151324749, 0.020608671009540558, 0.011410079896450043 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6855000257492065, "loss_eval": 0.818859875202179, "epoch": 3 }, { "hidden_norms": [ 11.269571304321289, 12.308274269104004, 15.27676010131836, 21.78426170349121, 30.742971420288086 ], "bp_grad_per_sample_l2_med": [ 0.0007430269033648074, 0.000469190941657871, 0.00030379975214600563, 0.00021638885664287955, 0.00012503107427619398 ], "bp_grad_F": [ 0.06859903037548065, 0.04267093911767006, 0.027331173419952393, 0.01921078749001026, 0.01109629962593317 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6940000057220459, "loss_eval": 0.7901937365531921, "epoch": 4 }, { "hidden_norms": [ 11.269571304321289, 12.659590721130371, 17.736019134521484, 29.108901977539062, 40.405487060546875 ], "bp_grad_per_sample_l2_med": [ 0.0007397185545414686, 0.0004240924317855388, 0.00025522997020743787, 0.00018211310089100152, 0.00011715881555574015 ], "bp_grad_F": [ 0.07044756412506104, 0.040140341967344284, 0.024354523047804832, 0.017343631014227867, 0.01095715630799532 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6975000500679016, "loss_eval": 0.8005170822143555, "epoch": 5 }, { "hidden_norms": [ 11.269571304321289, 13.09460735321045, 21.214082717895508, 38.0382194519043, 49.941673278808594 ], "bp_grad_per_sample_l2_med": [ 0.0007781236781738698, 0.00040500680916011333, 0.00022763953893445432, 0.00017000116349663585, 0.0001182492560474202 ], "bp_grad_F": [ 0.0692453384399414, 0.037047095596790314, 0.021944386884570122, 0.016124187037348747, 0.011101995594799519 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6925000548362732, "loss_eval": 0.8182728290557861, "epoch": 6 }, { "hidden_norms": [ 11.269571304321289, 13.613083839416504, 25.80984878540039, 47.72332763671875, 58.812931060791016 ], "bp_grad_per_sample_l2_med": [ 0.0007534404867328703, 0.00035873899469152093, 0.00019843837071675807, 0.00015793486090842634, 0.00011804765381384641 ], "bp_grad_F": [ 0.06768736243247986, 0.034021928906440735, 0.019909236580133438, 0.015198245644569397, 0.011175908148288727 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6945000290870667, "loss_eval": 0.8370131254196167, "epoch": 7 }, { "hidden_norms": [ 11.269571304321289, 14.181544303894043, 31.215173721313477, 57.29954147338867, 67.44005584716797 ], "bp_grad_per_sample_l2_med": [ 0.0008308067917823792, 0.0003639743954408914, 0.00018776576325763017, 0.00015568821982014924, 0.00012153007264714688 ], "bp_grad_F": [ 0.0664583221077919, 0.03186826407909393, 0.018696729093790054, 0.014834162779152393, 0.011486423201858997 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6775000095367432, "loss_eval": 0.8666528463363647, "epoch": 8 }, { "hidden_norms": [ 11.269571304321289, 14.879924774169922, 37.906219482421875, 67.32949829101562, 75.90506744384766 ], "bp_grad_per_sample_l2_med": [ 0.000856662227306515, 0.0003640915092546493, 0.0001897388428915292, 0.00016743727610446513, 0.00013579493679571897 ], "bp_grad_F": [ 0.06490001082420349, 0.0302249975502491, 0.018041465431451797, 0.014820784330368042, 0.011990511789917946 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6565000414848328, "loss_eval": 0.9446665048599243, "epoch": 9 }, { "hidden_norms": [ 11.269571304321289, 15.732318878173828, 45.59952163696289, 76.33224487304688, 84.44403076171875 ], "bp_grad_per_sample_l2_med": [ 0.0008764212252572179, 0.00035432647564448416, 0.00017862815002445132, 0.00016163433610927314, 0.0001364263880532235 ], "bp_grad_F": [ 0.06546498835086823, 0.02990337274968624, 0.01799662783741951, 0.015155031345784664, 0.012622621841728687 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6390000581741333, "loss_eval": 1.0291955471038818, "epoch": 10 }, { "hidden_norms": [ 11.269571304321289, 16.836196899414062, 55.33602523803711, 84.32881164550781, 92.9534912109375 ], "bp_grad_per_sample_l2_med": [ 0.000854950922075659, 0.00036200409522280097, 0.00018266236293129623, 0.0001705951290205121, 0.00014654053666163236 ], "bp_grad_F": [ 0.06433594971895218, 0.0289771668612957, 0.017391620203852654, 0.015173865482211113, 0.012928354553878307 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6330000162124634, "loss_eval": 1.076339840888977, "epoch": 11 }, { "hidden_norms": [ 11.269571304321289, 19.05539894104004, 69.66182708740234, 97.1963119506836, 102.74567413330078 ], "bp_grad_per_sample_l2_med": [ 0.0008397337514907122, 0.00034183592651970685, 0.00018204437219537795, 0.00017718512390274554, 0.0001551504828967154 ], "bp_grad_F": [ 0.062221452593803406, 0.027522921562194824, 0.01681770198047161, 0.01498384214937687, 0.013089192099869251 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.643500030040741, "loss_eval": 1.0531169176101685, "epoch": 12 }, { "hidden_norms": [ 11.269571304321289, 23.65813636779785, 86.25741577148438, 120.24312591552734, 124.2949447631836 ], "bp_grad_per_sample_l2_med": [ 0.0008297308231703937, 0.0003140757908113301, 0.00017996964743360877, 0.00017669204680714756, 0.00015717324276920408 ], "bp_grad_F": [ 0.06484393030405045, 0.028613954782485962, 0.01715104468166828, 0.01567785255610943, 0.014462707564234734 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6255000233650208, "loss_eval": 1.3249526023864746, "epoch": 13 }, { "hidden_norms": [ 11.269571304321289, 30.92644500732422, 102.1397705078125, 147.9296417236328, 157.7542266845703 ], "bp_grad_per_sample_l2_med": [ 0.0008446995634585619, 0.000312876160023734, 0.00019047399109695107, 0.00018901094153989106, 0.00017103466961998492 ], "bp_grad_F": [ 0.063303142786026, 0.02876628190279007, 0.01635562814772129, 0.015436392277479172, 0.014697290025651455 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6045000553131104, "loss_eval": 1.394450306892395, "epoch": 14 }, { "hidden_norms": [ 11.269571304321289, 40.05237579345703, 123.65401458740234, 173.33119201660156, 188.9973907470703 ], "bp_grad_per_sample_l2_med": [ 0.0008657039143145084, 0.0003323613782413304, 0.0002161249576602131, 0.0002138354757335037, 0.00019650986359920353 ], "bp_grad_F": [ 0.054496586322784424, 0.025836922228336334, 0.0159344132989645, 0.015238149091601372, 0.014629158191382885 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5950000286102295, "loss_eval": 1.1977143287658691, "epoch": 15 }, { "hidden_norms": [ 11.269571304321289, 50.589420318603516, 147.02255249023438, 197.975830078125, 217.0601806640625 ], "bp_grad_per_sample_l2_med": [ 0.0008191568194888532, 0.00030697352485731244, 0.00021884859597776085, 0.00021713844034820795, 0.00020184220920782536 ], "bp_grad_F": [ 0.04439451918005943, 0.021627753973007202, 0.015079431235790253, 0.0144795598462224, 0.014037052169442177 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6115000247955322, "loss_eval": 1.1207692623138428, "epoch": 16 }, { "hidden_norms": [ 11.269571304321289, 61.36143112182617, 169.08056640625, 221.02748107910156, 240.8756561279297 ], "bp_grad_per_sample_l2_med": [ 0.0007864299113862216, 0.0002859561063814908, 0.0002155074180336669, 0.00021533406106755137, 0.00020066267461515963 ], "bp_grad_F": [ 0.04005742073059082, 0.01873522810637951, 0.014609597623348236, 0.014084910042583942, 0.013653460890054703 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6175000071525574, "loss_eval": 1.059693694114685, "epoch": 17 }, { "hidden_norms": [ 11.269571304321289, 72.36003875732422, 188.58563232421875, 241.86294555664062, 258.58087158203125 ], "bp_grad_per_sample_l2_med": [ 0.0007837018347345293, 0.0002863232512027025, 0.00022506402456201613, 0.00022481133055407554, 0.00021070068760309368 ], "bp_grad_F": [ 0.039807844907045364, 0.01775156892836094, 0.01470963191241026, 0.014359688386321068, 0.01395167876034975 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6025000214576721, "loss_eval": 1.1027324199676514, "epoch": 18 }, { "hidden_norms": [ 11.269571304321289, 81.18446350097656, 200.67935180664062, 257.0839538574219, 267.81317138671875 ], "bp_grad_per_sample_l2_med": [ 0.00082020164700225, 0.0003102799819316715, 0.0002470446634106338, 0.0002463961427565664, 0.00023495900677517056 ], "bp_grad_F": [ 0.041444260627031326, 0.01803578995168209, 0.014944672584533691, 0.014712288975715637, 0.014517528004944324 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5820000171661377, "loss_eval": 1.146970272064209, "epoch": 19 }, { "hidden_norms": [ 11.269571304321289, 91.12315368652344, 208.71234130859375, 269.7666931152344, 278.79949951171875 ], "bp_grad_per_sample_l2_med": [ 0.0008638632134534419, 0.0003278621006757021, 0.00026185397291556, 0.00026034258189611137, 0.0002510476915631443 ], "bp_grad_F": [ 0.04429177567362785, 0.018727537244558334, 0.015489915385842323, 0.01529665943235159, 0.015330186113715172 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5394999980926514, "loss_eval": 1.2919961214065552, "epoch": 20 }, { "hidden_norms": [ 11.269571304321289, 104.20027160644531, 224.12327575683594, 292.86212158203125, 302.2417297363281 ], "bp_grad_per_sample_l2_med": [ 0.0008091026684269309, 0.0002788364654406905, 0.0002307023387402296, 0.0002291825512656942, 0.0002224020572612062 ], "bp_grad_F": [ 0.043314289301633835, 0.018204446882009506, 0.01538326870650053, 0.015148352831602097, 0.015248478390276432 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5615000128746033, "loss_eval": 1.3774936199188232, "epoch": 21 }, { "hidden_norms": [ 11.269571304321289, 119.46916198730469, 246.84373474121094, 322.8492736816406, 331.5632019042969 ], "bp_grad_per_sample_l2_med": [ 0.0007946055266074836, 0.0002993302186951041, 0.0002581049920991063, 0.00025690835900604725, 0.00025083290529437363 ], "bp_grad_F": [ 0.04004265367984772, 0.017564039677381516, 0.015413369052112103, 0.01514766737818718, 0.015221393667161465 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5430000424385071, "loss_eval": 1.3054314851760864, "epoch": 22 }, { "hidden_norms": [ 11.269571304321289, 136.81655883789062, 275.0496826171875, 359.30596923828125, 365.4009704589844 ], "bp_grad_per_sample_l2_med": [ 0.0007907089893706143, 0.00031880626920610666, 0.00028100365307182074, 0.0002786303812172264, 0.00027127860812470317 ], "bp_grad_F": [ 0.03825194016098976, 0.017261793836951256, 0.01555734220892191, 0.01527914684265852, 0.015313600189983845 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5270000100135803, "loss_eval": 1.3047609329223633, "epoch": 23 }, { "hidden_norms": [ 11.269571304321289, 154.3377227783203, 303.1491394042969, 395.8551330566406, 398.4109191894531 ], "bp_grad_per_sample_l2_med": [ 0.0007455120794475079, 0.0002850848250091076, 0.00025729817571118474, 0.00025698516401462257, 0.0002516870736144483 ], "bp_grad_F": [ 0.03626802936196327, 0.01676987297832966, 0.015425236895680428, 0.015152523294091225, 0.015204805880784988 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5555000305175781, "loss_eval": 1.2945412397384644, "epoch": 24 }, { "hidden_norms": [ 11.269571304321289, 172.51333618164062, 332.53106689453125, 434.6177978515625, 432.9015197753906 ], "bp_grad_per_sample_l2_med": [ 0.0007499566418118775, 0.00028473397833295166, 0.0002601774758659303, 0.0002574811805970967, 0.00025375629775226116 ], "bp_grad_F": [ 0.035628896206617355, 0.016559967771172523, 0.015500359237194061, 0.015283019281923771, 0.01530501153320074 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5250000357627869, "loss_eval": 1.348174810409546, "epoch": 25 }, { "hidden_norms": [ 11.269571304321289, 191.6818084716797, 362.3817138671875, 473.73529052734375, 468.3863830566406 ], "bp_grad_per_sample_l2_med": [ 0.00077909289393574, 0.0003061260504182428, 0.0002848915464710444, 0.000283668254269287, 0.00027828654856421053 ], "bp_grad_F": [ 0.03710347041487694, 0.01679745502769947, 0.01587643474340439, 0.01569107361137867, 0.015713181346654892 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.48750001192092896, "loss_eval": 1.513879418373108, "epoch": 26 }, { "hidden_norms": [ 11.269571304321289, 212.49392700195312, 393.7915954589844, 515.7852172851562, 507.1173095703125 ], "bp_grad_per_sample_l2_med": [ 0.0007443951326422393, 0.000309632858261466, 0.00028767462936230004, 0.0002863617264665663, 0.00028263547574169934 ], "bp_grad_F": [ 0.034536320716142654, 0.01654498465359211, 0.015813451260328293, 0.015621310099959373, 0.0156637541949749 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5090000033378601, "loss_eval": 1.345898151397705, "epoch": 27 }, { "hidden_norms": [ 11.269571304321289, 231.91209411621094, 422.3776550292969, 553.1364135742188, 540.5762329101562 ], "bp_grad_per_sample_l2_med": [ 0.0007372196414507926, 0.0002908413589466363, 0.00027582875918596983, 0.0002760514325927943, 0.00027193804271519184 ], "bp_grad_F": [ 0.034806184470653534, 0.01654907502233982, 0.01595865748822689, 0.01580234244465828, 0.01584061235189438 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4970000088214874, "loss_eval": 1.4695581197738647, "epoch": 28 }, { "hidden_norms": [ 11.269571304321289, 251.87222290039062, 452.5732116699219, 591.4275512695312, 574.1845703125 ], "bp_grad_per_sample_l2_med": [ 0.0007362416945397854, 0.0002964947489090264, 0.0002815316547639668, 0.0002831071906257421, 0.0002781452494673431 ], "bp_grad_F": [ 0.034162748605012894, 0.016219308599829674, 0.01574064791202545, 0.015600688755512238, 0.015627028420567513 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.48100003600120544, "loss_eval": 1.4220975637435913, "epoch": 29 }, { "hidden_norms": [ 11.269571304321289, 272.3019104003906, 483.1678161621094, 631.2042846679688, 609.8804931640625 ], "bp_grad_per_sample_l2_med": [ 0.0007130270241759717, 0.0003075756540056318, 0.00029428518610075116, 0.00029221284785307944, 0.0002892380871344358 ], "bp_grad_F": [ 0.033144623041152954, 0.01614796556532383, 0.015754450112581253, 0.015617748722434044, 0.015651794150471687 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.49550002813339233, "loss_eval": 1.398095726966858, "epoch": 30 }, { "hidden_norms": [ 11.269571304321289, 293.1174621582031, 513.9456176757812, 671.4954223632812, 646.9434204101562 ], "bp_grad_per_sample_l2_med": [ 0.0007292498485185206, 0.0003146968665532768, 0.0003013227542396635, 0.000301573658362031, 0.00029794115107506514 ], "bp_grad_F": [ 0.033789947628974915, 0.016436096280813217, 0.016089752316474915, 0.015960095450282097, 0.0159769207239151 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4570000171661377, "loss_eval": 1.5174756050109863, "epoch": 31 }, { "hidden_norms": [ 11.269571304321289, 312.291748046875, 542.6367797851562, 708.0426025390625, 679.9037475585938 ], "bp_grad_per_sample_l2_med": [ 0.0007159899105317891, 0.0003197023761458695, 0.00030903122387826443, 0.0003080730966757983, 0.00030512994271703064 ], "bp_grad_F": [ 0.03305007144808769, 0.016458848491311073, 0.0161746796220541, 0.01604822278022766, 0.016068853437900543 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.45350003242492676, "loss_eval": 1.4785963296890259, "epoch": 32 }, { "hidden_norms": [ 11.269571304321289, 330.2493896484375, 569.4765625, 741.90380859375, 710.49609375 ], "bp_grad_per_sample_l2_med": [ 0.0007181349792517722, 0.0003215835604351014, 0.00031238331575877964, 0.00031264303834177554, 0.0003104021889157593 ], "bp_grad_F": [ 0.0329170823097229, 0.016988366842269897, 0.01674317568540573, 0.01661907136440277, 0.01665792241692543 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4320000112056732, "loss_eval": 1.545434594154358, "epoch": 33 }, { "hidden_norms": [ 11.269571304321289, 348.3463439941406, 596.8388061523438, 776.8276977539062, 742.1928100585938 ], "bp_grad_per_sample_l2_med": [ 0.0006930733215995133, 0.0003099350433330983, 0.0003020780859515071, 0.0003008935309480876, 0.00029881703085266054 ], "bp_grad_F": [ 0.03210154175758362, 0.0165875144302845, 0.016380906105041504, 0.016269827261567116, 0.01630542054772377 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.46150001883506775, "loss_eval": 1.4990708827972412, "epoch": 34 }, { "hidden_norms": [ 11.269571304321289, 367.8572998046875, 624.6773071289062, 813.023193359375, 774.825439453125 ], "bp_grad_per_sample_l2_med": [ 0.0006842412985861301, 0.00032654378446750343, 0.00031924000359140337, 0.0003176531463395804, 0.00031533741275779903 ], "bp_grad_F": [ 0.03194142132997513, 0.016769496724009514, 0.01658361405134201, 0.016465021297335625, 0.016491062939167023 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4345000088214874, "loss_eval": 1.5226876735687256, "epoch": 35 }, { "hidden_norms": [ 11.269571304321289, 386.9555969238281, 652.0831298828125, 847.6653442382812, 805.962158203125 ], "bp_grad_per_sample_l2_med": [ 0.0007009130204096437, 0.00033408711897209287, 0.00032650009961798787, 0.00032573731732554734, 0.00032366803498007357 ], "bp_grad_F": [ 0.032547831535339355, 0.01727951131761074, 0.017110776156187057, 0.017009133473038673, 0.017040319740772247 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4025000333786011, "loss_eval": 1.6661202907562256, "epoch": 36 }, { "hidden_norms": [ 11.269571304321289, 405.57061767578125, 678.9530639648438, 881.5497436523438, 835.913330078125 ], "bp_grad_per_sample_l2_med": [ 0.0006714131450280547, 0.00031647825380787253, 0.0003093808190897107, 0.00030856815283186734, 0.00030731584411114454 ], "bp_grad_F": [ 0.030830882489681244, 0.016467954963445663, 0.016322584822773933, 0.016228536143898964, 0.01625511236488819 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.44850000739097595, "loss_eval": 1.5340722799301147, "epoch": 37 }, { "hidden_norms": [ 11.269571304321289, 423.3720703125, 705.0136108398438, 914.5001831054688, 865.4478759765625 ], "bp_grad_per_sample_l2_med": [ 0.0006793327047489583, 0.0003244458057451993, 0.0003182501532137394, 0.00031923994538374245, 0.00031612347811460495 ], "bp_grad_F": [ 0.03101767599582672, 0.01673293113708496, 0.01659614033997059, 0.016509832814335823, 0.01653491146862507 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.42000001668930054, "loss_eval": 1.6198900938034058, "epoch": 38 }, { "hidden_norms": [ 11.269571304321289, 440.53741455078125, 729.8703002929688, 945.1349487304688, 892.7785034179688 ], "bp_grad_per_sample_l2_med": [ 0.0006624915986321867, 0.00031068388489075005, 0.00030363586847670376, 0.00030243129003793, 0.00030108148348517716 ], "bp_grad_F": [ 0.030339404940605164, 0.01675509847700596, 0.016639690846204758, 0.01655009388923645, 0.016594169661402702 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4280000329017639, "loss_eval": 1.6058467626571655, "epoch": 39 }, { "hidden_norms": [ 11.269571304321289, 457.5261535644531, 754.3056640625, 975.5144653320312, 919.8758544921875 ], "bp_grad_per_sample_l2_med": [ 0.0006706257117912173, 0.0003283233381807804, 0.00032177154207602143, 0.0003207549743819982, 0.0003196784819010645 ], "bp_grad_F": [ 0.03072393499314785, 0.016925832256674767, 0.01681169681251049, 0.01673683524131775, 0.016768047586083412 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.39000001549720764, "loss_eval": 1.7052431106567383, "epoch": 40 }, { "hidden_norms": [ 11.269571304321289, 474.70233154296875, 778.4963989257812, 1005.5798950195312, 947.08251953125 ], "bp_grad_per_sample_l2_med": [ 0.0006340838735923171, 0.00030884164152666926, 0.000303937413264066, 0.00030318956123664975, 0.0003018545394297689 ], "bp_grad_F": [ 0.02923908829689026, 0.016514884307980537, 0.016419367864727974, 0.016349095851182938, 0.0163878221064806 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4390000104904175, "loss_eval": 1.564381718635559, "epoch": 41 }, { "hidden_norms": [ 11.269571304321289, 489.3309631347656, 799.4293823242188, 1031.868408203125, 970.6136474609375 ], "bp_grad_per_sample_l2_med": [ 0.0006363792927004397, 0.00032453436870127916, 0.000319232844049111, 0.0003183995431754738, 0.00031706615118309855 ], "bp_grad_F": [ 0.02950570173561573, 0.016813522204756737, 0.016721611842513084, 0.016652515158057213, 0.016693497076630592 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.42100003361701965, "loss_eval": 1.605594515800476, "epoch": 42 }, { "hidden_norms": [ 11.269571304321289, 502.8161315917969, 819.462890625, 1056.7576904296875, 992.5881958007812 ], "bp_grad_per_sample_l2_med": [ 0.0006477028946392238, 0.00033125586924143136, 0.0003257581265643239, 0.000326100125676021, 0.00032460023066960275 ], "bp_grad_F": [ 0.029688136652112007, 0.01694806106388569, 0.01685865968465805, 0.016797136515378952, 0.016836510971188545 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3830000162124634, "loss_eval": 1.673546552658081, "epoch": 43 }, { "hidden_norms": [ 11.269571304321289, 517.00634765625, 839.9920654296875, 1082.26025390625, 1015.0608520507812 ], "bp_grad_per_sample_l2_med": [ 0.0006337560480460525, 0.0003340205585118383, 0.00032972541521303356, 0.00032889688736759126, 0.0003277511859778315 ], "bp_grad_F": [ 0.029322637245059013, 0.01695762574672699, 0.016879092901945114, 0.01681896671652794, 0.016858574002981186 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.38350000977516174, "loss_eval": 1.6975816488265991, "epoch": 44 }, { "hidden_norms": [ 11.269571304321289, 529.66064453125, 858.3285522460938, 1104.83544921875, 1035.074951171875 ], "bp_grad_per_sample_l2_med": [ 0.0006231985753402114, 0.00033350964076817036, 0.00032944625127129257, 0.00032876565819606185, 0.00032806835952214897 ], "bp_grad_F": [ 0.029069310054183006, 0.016890447586774826, 0.016818689182400703, 0.016763897612690926, 0.016804050654172897 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3930000066757202, "loss_eval": 1.676193356513977, "epoch": 45 }, { "hidden_norms": [ 11.269571304321289, 541.9931030273438, 875.95556640625, 1126.6197509765625, 1054.3516845703125 ], "bp_grad_per_sample_l2_med": [ 0.0006226357654668391, 0.00032438969356007874, 0.0003203299711458385, 0.0003203903906978667, 0.00031863307231105864 ], "bp_grad_F": [ 0.028472919017076492, 0.016746005043387413, 0.016683315858244896, 0.016633223742246628, 0.016673142090439796 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4165000319480896, "loss_eval": 1.6569225788116455, "epoch": 46 }, { "hidden_norms": [ 11.269571304321289, 555.5247802734375, 895.108642578125, 1150.2750244140625, 1075.3402099609375 ], "bp_grad_per_sample_l2_med": [ 0.0006058313883841038, 0.00031499756732955575, 0.00031102998764254153, 0.0003108317614533007, 0.00030999473528936505 ], "bp_grad_F": [ 0.028057299554347992, 0.016642672941088676, 0.016584018245339394, 0.016536688432097435, 0.016577772796154022 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.41850000619888306, "loss_eval": 1.622230887413025, "epoch": 47 }, { "hidden_norms": [ 11.269571304321289, 566.745361328125, 911.0077514648438, 1169.5748291015625, 1092.4599609375 ], "bp_grad_per_sample_l2_med": [ 0.000616180885117501, 0.0003297157527413219, 0.00032601068960502744, 0.0003262106911279261, 0.00032522634137421846 ], "bp_grad_F": [ 0.02835526503622532, 0.016961509361863136, 0.016903148964047432, 0.01685917004942894, 0.01690032333135605 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.39250001311302185, "loss_eval": 1.714435338973999, "epoch": 48 }, { "hidden_norms": [ 11.269571304321289, 578.6380004882812, 927.9735107421875, 1190.5294189453125, 1111.001220703125 ], "bp_grad_per_sample_l2_med": [ 0.0006051660166122019, 0.0003138712199870497, 0.0003094248822890222, 0.000309422001009807, 0.0003081281029153615 ], "bp_grad_F": [ 0.027995921671390533, 0.016778133809566498, 0.016729604452848434, 0.01668645441532135, 0.016727875918149948 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.40450000762939453, "loss_eval": 1.6801645755767822, "epoch": 49 }, { "hidden_norms": [ 11.269571304321289, 591.34326171875, 945.9314575195312, 1212.5030517578125, 1130.69580078125 ], "bp_grad_per_sample_l2_med": [ 0.000600961095187813, 0.00032534165075048804, 0.0003221939841751009, 0.00032207692856900394, 0.00032122948323376477 ], "bp_grad_F": [ 0.027977745980024338, 0.017148323357105255, 0.017105158418416977, 0.017058631405234337, 0.01710781268775463 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3930000066757202, "loss_eval": 1.7086997032165527, "epoch": 50 }, { "hidden_norms": [ 11.269571304321289, 602.791015625, 962.1253051757812, 1232.407958984375, 1148.6063232421875 ], "bp_grad_per_sample_l2_med": [ 0.0005954196094535291, 0.00032203743467107415, 0.0003193309239577502, 0.00031976529862731695, 0.00031836770358495414 ], "bp_grad_F": [ 0.027640262618660927, 0.016875414177775383, 0.01683391071856022, 0.016794128343462944, 0.016835639253258705 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.38750001788139343, "loss_eval": 1.7161617279052734, "epoch": 51 }, { "hidden_norms": [ 11.269571304321289, 613.0055541992188, 976.7833251953125, 1250.490966796875, 1164.8575439453125 ], "bp_grad_per_sample_l2_med": [ 0.0005885999999009073, 0.00031236460199579597, 0.00030869650072418153, 0.00030896696262061596, 0.0003076815919484943 ], "bp_grad_F": [ 0.027101732790470123, 0.01670675352215767, 0.016670193523168564, 0.01663014106452465, 0.016672657802700996 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.41100001335144043, "loss_eval": 1.6481956243515015, "epoch": 52 }, { "hidden_norms": [ 11.269571304321289, 622.8380126953125, 990.931640625, 1267.7691650390625, 1180.291015625 ], "bp_grad_per_sample_l2_med": [ 0.000587237358558923, 0.0003190709976479411, 0.0003160224005114287, 0.00031612091697752476, 0.00031501890043728054 ], "bp_grad_F": [ 0.027042290195822716, 0.016803324222564697, 0.016769535839557648, 0.016731148585677147, 0.016775181517004967 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.40450000762939453, "loss_eval": 1.6591061353683472, "epoch": 53 }, { "hidden_norms": [ 11.269571304321289, 632.4323120117188, 1004.666259765625, 1284.4637451171875, 1195.189697265625 ], "bp_grad_per_sample_l2_med": [ 0.0005885775317437947, 0.0003397047985345125, 0.0003383393050171435, 0.00033765248372219503, 0.00033701834036037326 ], "bp_grad_F": [ 0.027301670983433723, 0.017337650060653687, 0.017313728109002113, 0.017269184812903404, 0.0173148512840271 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3565000295639038, "loss_eval": 1.7250425815582275, "epoch": 54 }, { "hidden_norms": [ 11.269571304321289, 639.983154296875, 1015.8214721679688, 1297.94091796875, 1207.160400390625 ], "bp_grad_per_sample_l2_med": [ 0.0005771536380052567, 0.00031455705175176263, 0.0003114652936346829, 0.0003115544968750328, 0.00031060961191542447 ], "bp_grad_F": [ 0.026900731027126312, 0.01682351529598236, 0.01679442636668682, 0.016759345307946205, 0.016801798716187477 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.398000031709671, "loss_eval": 1.6931191682815552, "epoch": 55 }, { "hidden_norms": [ 11.269571304321289, 648.44189453125, 1027.905517578125, 1312.5484619140625, 1220.3349609375 ], "bp_grad_per_sample_l2_med": [ 0.0005807234556414187, 0.0003243165265303105, 0.00032131426269188523, 0.0003215263714082539, 0.0003202861698810011 ], "bp_grad_F": [ 0.02689860761165619, 0.016972798854112625, 0.016945669427514076, 0.016909556463360786, 0.01695423573255539 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3850000202655792, "loss_eval": 1.713501214981079, "epoch": 56 }, { "hidden_norms": [ 11.269571304321289, 656.1256103515625, 1038.9337158203125, 1326.0384521484375, 1232.491455078125 ], "bp_grad_per_sample_l2_med": [ 0.0005809550639241934, 0.0003213974996469915, 0.0003191177383996546, 0.0003187706752214581, 0.0003176441532559693 ], "bp_grad_F": [ 0.026944397017359734, 0.016979368403553963, 0.01695428043603897, 0.01692255586385727, 0.016963332891464233 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3800000250339508, "loss_eval": 1.7483241558074951, "epoch": 57 }, { "hidden_norms": [ 11.269571304321289, 663.1458740234375, 1049.1085205078125, 1338.4049072265625, 1243.709228515625 ], "bp_grad_per_sample_l2_med": [ 0.0005775660974904895, 0.00032701215241104364, 0.000323877960909158, 0.00032368660322390497, 0.00032316104625351727 ], "bp_grad_F": [ 0.026842813938856125, 0.017009008675813675, 0.016984863206744194, 0.016950154677033424, 0.016992947086691856 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.36650002002716064, "loss_eval": 1.7447302341461182, "epoch": 58 }, { "hidden_norms": [ 11.269571304321289, 669.32080078125, 1058.1265869140625, 1349.383544921875, 1253.68603515625 ], "bp_grad_per_sample_l2_med": [ 0.0005691531114280224, 0.0003169954870827496, 0.0003141614724881947, 0.00031412398675456643, 0.00031352281803265214 ], "bp_grad_F": [ 0.026560034602880478, 0.01695145107805729, 0.016930771991610527, 0.016894754022359848, 0.016942735761404037 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3830000162124634, "loss_eval": 1.7227482795715332, "epoch": 59 }, { "hidden_norms": [ 11.269571304321289, 675.035888671875, 1066.407958984375, 1359.420654296875, 1262.8460693359375 ], "bp_grad_per_sample_l2_med": [ 0.000574529985897243, 0.000330567971104756, 0.0003291864413768053, 0.0003286501159891486, 0.00032822080538608134 ], "bp_grad_F": [ 0.02670128643512726, 0.017140112817287445, 0.017120162025094032, 0.01708981581032276, 0.017130881547927856 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.37800002098083496, "loss_eval": 1.7512460947036743, "epoch": 60 }, { "hidden_norms": [ 11.269571304321289, 680.7155151367188, 1074.5833740234375, 1369.3917236328125, 1271.9488525390625 ], "bp_grad_per_sample_l2_med": [ 0.0005727651296183467, 0.00031855711131356657, 0.0003159786283504218, 0.00031576541368849576, 0.0003150397096760571 ], "bp_grad_F": [ 0.02646380476653576, 0.016906103119254112, 0.016886914148926735, 0.016857335343956947, 0.016896924003958702 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.39100003242492676, "loss_eval": 1.7765766382217407, "epoch": 61 }, { "hidden_norms": [ 11.269571304321289, 685.6483154296875, 1081.7335205078125, 1378.0848388671875, 1279.824462890625 ], "bp_grad_per_sample_l2_med": [ 0.0005669392994605005, 0.00032193740480579436, 0.0003195095050614327, 0.00031930883415043354, 0.00031847937498241663 ], "bp_grad_F": [ 0.02628612145781517, 0.01694479025900364, 0.016926957294344902, 0.016897274181246758, 0.016937877982854843 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.38200002908706665, "loss_eval": 1.6996668577194214, "epoch": 62 }, { "hidden_norms": [ 11.269571304321289, 690.3829345703125, 1088.4320068359375, 1386.209228515625, 1287.180908203125 ], "bp_grad_per_sample_l2_med": [ 0.0005609798245131969, 0.0003164574736729264, 0.00031414616387337446, 0.0003141844645142555, 0.0003133733116555959 ], "bp_grad_F": [ 0.025919275358319283, 0.01681407354772091, 0.016797930002212524, 0.01676807552576065, 0.016810856759548187 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4035000205039978, "loss_eval": 1.6783148050308228, "epoch": 63 }, { "hidden_norms": [ 11.269571304321289, 694.658935546875, 1094.5535888671875, 1393.6761474609375, 1293.9659423828125 ], "bp_grad_per_sample_l2_med": [ 0.0005624280893243849, 0.00031574408058077097, 0.0003139691543765366, 0.00031461575417779386, 0.00031346286414191127 ], "bp_grad_F": [ 0.02617610991001129, 0.016873449087142944, 0.016857409849762917, 0.01682792603969574, 0.016867902129888535 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3830000162124634, "loss_eval": 1.7127265930175781, "epoch": 64 }, { "hidden_norms": [ 11.269571304321289, 698.4141235351562, 1099.921875, 1400.2060546875, 1299.92919921875 ], "bp_grad_per_sample_l2_med": [ 0.0005497613456100225, 0.00031591873266734183, 0.00031333384686149657, 0.00031392619712278247, 0.00031339324777945876 ], "bp_grad_F": [ 0.025806115940213203, 0.016780776903033257, 0.016766363754868507, 0.016736920922994614, 0.01677793264389038 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4165000319480896, "loss_eval": 1.6823266744613647, "epoch": 65 }, { "hidden_norms": [ 11.269571304321289, 701.8402099609375, 1104.8636474609375, 1406.2545166015625, 1305.4110107421875 ], "bp_grad_per_sample_l2_med": [ 0.0005536439130082726, 0.0003222717496100813, 0.0003193898010067642, 0.0003197654150426388, 0.00031906200456433 ], "bp_grad_F": [ 0.02591872774064541, 0.016899071633815765, 0.01688431203365326, 0.01685412786900997, 0.016896730288863182 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3895000219345093, "loss_eval": 1.6973413228988647, "epoch": 66 }, { "hidden_norms": [ 11.269571304321289, 704.84814453125, 1109.2054443359375, 1411.5528564453125, 1310.220458984375 ], "bp_grad_per_sample_l2_med": [ 0.0005509129259735346, 0.0003127358213532716, 0.00031018650042824447, 0.00031017058063298464, 0.0003093581763096154 ], "bp_grad_F": [ 0.02567744068801403, 0.01674523949623108, 0.01673281565308571, 0.016704324632883072, 0.01674455776810646 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.40400001406669617, "loss_eval": 1.6765486001968384, "epoch": 67 }, { "hidden_norms": [ 11.269571304321289, 707.4666137695312, 1112.9517822265625, 1416.120361328125, 1314.365478515625 ], "bp_grad_per_sample_l2_med": [ 0.0005525590386241674, 0.0003146192757412791, 0.000312337331706658, 0.0003126179799437523, 0.00031193779432214797 ], "bp_grad_F": [ 0.025625307112932205, 0.016738714650273323, 0.01672603376209736, 0.016697421669960022, 0.016738519072532654 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.406000018119812, "loss_eval": 1.681616187095642, "epoch": 68 }, { "hidden_norms": [ 11.269571304321289, 709.6942749023438, 1116.1553955078125, 1420.0328369140625, 1317.9129638671875 ], "bp_grad_per_sample_l2_med": [ 0.0005520040867850184, 0.0003149699477944523, 0.0003132218262180686, 0.00031297295936383307, 0.0003122398047707975 ], "bp_grad_F": [ 0.02563839592039585, 0.01678294688463211, 0.016770213842391968, 0.01674121432006359, 0.01678287237882614 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3985000252723694, "loss_eval": 1.6824655532836914, "epoch": 69 }, { "hidden_norms": [ 11.269571304321289, 711.4514770507812, 1118.6820068359375, 1423.118408203125, 1320.7220458984375 ], "bp_grad_per_sample_l2_med": [ 0.0005478749517351389, 0.0003126654773950577, 0.00031092006247490644, 0.0003107163356617093, 0.00030992255778983235 ], "bp_grad_F": [ 0.025653105229139328, 0.016804352402687073, 0.01679334044456482, 0.016765642911195755, 0.016805216670036316 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3970000147819519, "loss_eval": 1.6816198825836182, "epoch": 70 }, { "hidden_norms": [ 11.269571304321289, 712.941162109375, 1120.8258056640625, 1425.7293701171875, 1323.110595703125 ], "bp_grad_per_sample_l2_med": [ 0.0005502297426573932, 0.00031594440224580467, 0.00031323955045081675, 0.0003133862919639796, 0.00031268122256733477 ], "bp_grad_F": [ 0.025557825341820717, 0.01675795204937458, 0.01674625650048256, 0.01671820878982544, 0.016758527606725693 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4025000333786011, "loss_eval": 1.6777657270431519, "epoch": 71 }, { "hidden_norms": [ 11.269571304321289, 714.2026977539062, 1122.637451171875, 1427.94921875, 1325.1287841796875 ], "bp_grad_per_sample_l2_med": [ 0.0005491463234648108, 0.0003148230316583067, 0.00031261687399819493, 0.0003126751398667693, 0.00031198892975226045 ], "bp_grad_F": [ 0.025629354640841484, 0.016796274110674858, 0.016784505918622017, 0.016756094992160797, 0.01679658703505993 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.3985000252723694, "loss_eval": 1.6832109689712524, "epoch": 72 }, { "hidden_norms": [ 11.269571304321289, 715.1837158203125, 1124.0401611328125, 1429.676025390625, 1326.6959228515625 ], "bp_grad_per_sample_l2_med": [ 0.0005472805933095515, 0.00031123129883781075, 0.0003085967618972063, 0.00030910191708244383, 0.00030826785950921476 ], "bp_grad_F": [ 0.025491509586572647, 0.01673061214387417, 0.016719412058591843, 0.01669108308851719, 0.016732096672058105 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.41350001096725464, "loss_eval": 1.6768076419830322, "epoch": 73 }, { "hidden_norms": [ 11.269571304321289, 715.9666137695312, 1125.15869140625, 1431.054931640625, 1327.940185546875 ], "bp_grad_per_sample_l2_med": [ 0.0005469402531161904, 0.0003141815832350403, 0.0003117373853456229, 0.0003121092449873686, 0.00031146654509939253 ], "bp_grad_F": [ 0.02553613670170307, 0.016766469925642014, 0.016755321994423866, 0.01672743633389473, 0.01676766574382782 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.40050002932548523, "loss_eval": 1.6803343296051025, "epoch": 74 }, { "hidden_norms": [ 11.269571304321289, 716.54345703125, 1125.9932861328125, 1432.0760498046875, 1328.8612060546875 ], "bp_grad_per_sample_l2_med": [ 0.000544340000487864, 0.0003152569697704166, 0.00031408306676894426, 0.00031385221518576145, 0.0003130683908239007 ], "bp_grad_F": [ 0.025559071451425552, 0.016799958422780037, 0.01678895764052868, 0.016760708764195442, 0.01680118963122368 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.40050002932548523, "loss_eval": 1.6816425323486328, "epoch": 75 }, { "hidden_norms": [ 11.269571304321289, 716.944580078125, 1126.5697021484375, 1432.786376953125, 1329.5032958984375 ], "bp_grad_per_sample_l2_med": [ 0.0005474911304190755, 0.00031179687357507646, 0.0003097430744674057, 0.00030947139021009207, 0.00030854580109007657 ], "bp_grad_F": [ 0.025479920208454132, 0.01673789508640766, 0.016726836562156677, 0.016698846593499184, 0.01673932373523712 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4010000228881836, "loss_eval": 1.6769893169403076, "epoch": 76 }, { "hidden_norms": [ 11.269571304321289, 717.2020263671875, 1126.9422607421875, 1433.2410888671875, 1329.9195556640625 ], "bp_grad_per_sample_l2_med": [ 0.000546319643035531, 0.00031345203751698136, 0.000311522395350039, 0.000311847630655393, 0.0003111722180619836 ], "bp_grad_F": [ 0.025481175631284714, 0.01675844006240368, 0.016747308894991875, 0.016719479113817215, 0.0167598407715559 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4075000286102295, "loss_eval": 1.6769570112228394, "epoch": 77 }, { "hidden_norms": [ 11.269571304321289, 717.3436889648438, 1127.1475830078125, 1433.49072265625, 1330.1451416015625 ], "bp_grad_per_sample_l2_med": [ 0.0005438647349365056, 0.00031364860478788614, 0.0003113296115770936, 0.0003115428553428501, 0.00031094413134269416 ], "bp_grad_F": [ 0.025495020672678947, 0.016764776781201363, 0.016753805801272392, 0.016725784167647362, 0.016766248270869255 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.40800002217292786, "loss_eval": 1.6758222579956055, "epoch": 78 }, { "hidden_norms": [ 11.269571304321289, 717.4073486328125, 1127.239501953125, 1433.60302734375, 1330.2476806640625 ], "bp_grad_per_sample_l2_med": [ 0.0005444776033982635, 0.0003124381182715297, 0.0003098779125139117, 0.0003102763439528644, 0.0003094278508797288 ], "bp_grad_F": [ 0.025471549481153488, 0.016743116080760956, 0.016732197254896164, 0.016704153269529343, 0.016744764521718025 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.41450002789497375, "loss_eval": 1.675687551498413, "epoch": 79 }, { "hidden_norms": [ 11.269571304321289, 717.4231567382812, 1127.262451171875, 1433.6309814453125, 1330.273193359375 ], "bp_grad_per_sample_l2_med": [ 0.0005445098504424095, 0.0003131923731416464, 0.00031077052699401975, 0.0003107219818048179, 0.00031013842090032995 ], "bp_grad_F": [ 0.02547312155365944, 0.016745658591389656, 0.016734709963202477, 0.016706665977835655, 0.016747286543250084 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4140000343322754, "loss_eval": 1.6754448413848877, "epoch": 80 } ], "seed": 42, "alpha": 1.0, "depth": 4, "d_hidden": 128 }