summaryrefslogtreecommitdiff
path: root/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json')
-rw-r--r--results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json2276
1 files changed, 2276 insertions, 0 deletions
diff --git a/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json b/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json
new file mode 100644
index 0000000..438739c
--- /dev/null
+++ b/results/snapshot_synth_v1/snapshot_fa_synth_a1.0_L4_s42.json
@@ -0,0 +1,2276 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.290447235107422,
+ 11.313605308532715,
+ 11.351215362548828,
+ 11.398087501525879
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028353024390526116,
+ 0.0002828188880812377,
+ 0.00028162598027847707,
+ 0.0002799496578518301,
+ 0.0002791006409097463
+ ],
+ "bp_grad_F": [
+ 0.012684082612395287,
+ 0.01264861598610878,
+ 0.012589854188263416,
+ 0.012511610053479671,
+ 0.012471316382288933
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.08450000733137131,
+ "loss_eval": 2.4790313243865967,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.460872650146484,
+ 11.70040512084961,
+ 12.004783630371094,
+ 12.311223030090332
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004118149809073657,
+ 0.0003761148836929351,
+ 0.00034950554254464805,
+ 0.00032246875343844295,
+ 0.0002528287877794355
+ ],
+ "bp_grad_F": [
+ 0.018988799303770065,
+ 0.017196672037243843,
+ 0.015853216871619225,
+ 0.014456234872341156,
+ 0.011207858100533485
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5265000462532043,
+ "loss_eval": 1.4851115942001343,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.751569747924805,
+ 12.541290283203125,
+ 13.77841567993164,
+ 15.976567268371582
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007904200465418398,
+ 0.0006201046635396779,
+ 0.0004867047828156501,
+ 0.0003823215956799686,
+ 0.00022867691586725414
+ ],
+ "bp_grad_F": [
+ 0.041881538927555084,
+ 0.03210915997624397,
+ 0.025059428066015244,
+ 0.01950555481016636,
+ 0.011618814431130886
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6350000500679016,
+ "loss_eval": 0.959205687046051,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.018173217773438,
+ 13.625839233398438,
+ 16.65739631652832,
+ 22.032325744628906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008111135102808475,
+ 0.0005643682088702917,
+ 0.0004009789554402232,
+ 0.00029031067970208824,
+ 0.00016489777772221714
+ ],
+ "bp_grad_F": [
+ 0.059235598891973495,
+ 0.040808264166116714,
+ 0.02855612151324749,
+ 0.020608671009540558,
+ 0.011410079896450043
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6855000257492065,
+ "loss_eval": 0.818859875202179,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.308274269104004,
+ 15.27676010131836,
+ 21.78426170349121,
+ 30.742971420288086
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007430269033648074,
+ 0.000469190941657871,
+ 0.00030379975214600563,
+ 0.00021638885664287955,
+ 0.00012503107427619398
+ ],
+ "bp_grad_F": [
+ 0.06859903037548065,
+ 0.04267093911767006,
+ 0.027331173419952393,
+ 0.01921078749001026,
+ 0.01109629962593317
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6940000057220459,
+ "loss_eval": 0.7901937365531921,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.659590721130371,
+ 17.736019134521484,
+ 29.108901977539062,
+ 40.405487060546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007397185545414686,
+ 0.0004240924317855388,
+ 0.00025522997020743787,
+ 0.00018211310089100152,
+ 0.00011715881555574015
+ ],
+ "bp_grad_F": [
+ 0.07044756412506104,
+ 0.040140341967344284,
+ 0.024354523047804832,
+ 0.017343631014227867,
+ 0.01095715630799532
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6975000500679016,
+ "loss_eval": 0.8005170822143555,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.09460735321045,
+ 21.214082717895508,
+ 38.0382194519043,
+ 49.941673278808594
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007781236781738698,
+ 0.00040500680916011333,
+ 0.00022763953893445432,
+ 0.00017000116349663585,
+ 0.0001182492560474202
+ ],
+ "bp_grad_F": [
+ 0.0692453384399414,
+ 0.037047095596790314,
+ 0.021944386884570122,
+ 0.016124187037348747,
+ 0.011101995594799519
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6925000548362732,
+ "loss_eval": 0.8182728290557861,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.613083839416504,
+ 25.80984878540039,
+ 47.72332763671875,
+ 58.812931060791016
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007534404867328703,
+ 0.00035873899469152093,
+ 0.00019843837071675807,
+ 0.00015793486090842634,
+ 0.00011804765381384641
+ ],
+ "bp_grad_F": [
+ 0.06768736243247986,
+ 0.034021928906440735,
+ 0.019909236580133438,
+ 0.015198245644569397,
+ 0.011175908148288727
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6945000290870667,
+ "loss_eval": 0.8370131254196167,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.181544303894043,
+ 31.215173721313477,
+ 57.29954147338867,
+ 67.44005584716797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008308067917823792,
+ 0.0003639743954408914,
+ 0.00018776576325763017,
+ 0.00015568821982014924,
+ 0.00012153007264714688
+ ],
+ "bp_grad_F": [
+ 0.0664583221077919,
+ 0.03186826407909393,
+ 0.018696729093790054,
+ 0.014834162779152393,
+ 0.011486423201858997
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6775000095367432,
+ "loss_eval": 0.8666528463363647,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.879924774169922,
+ 37.906219482421875,
+ 67.32949829101562,
+ 75.90506744384766
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000856662227306515,
+ 0.0003640915092546493,
+ 0.0001897388428915292,
+ 0.00016743727610446513,
+ 0.00013579493679571897
+ ],
+ "bp_grad_F": [
+ 0.06490001082420349,
+ 0.0302249975502491,
+ 0.018041465431451797,
+ 0.014820784330368042,
+ 0.011990511789917946
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6565000414848328,
+ "loss_eval": 0.9446665048599243,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.732318878173828,
+ 45.59952163696289,
+ 76.33224487304688,
+ 84.44403076171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008764212252572179,
+ 0.00035432647564448416,
+ 0.00017862815002445132,
+ 0.00016163433610927314,
+ 0.0001364263880532235
+ ],
+ "bp_grad_F": [
+ 0.06546498835086823,
+ 0.02990337274968624,
+ 0.01799662783741951,
+ 0.015155031345784664,
+ 0.012622621841728687
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6390000581741333,
+ "loss_eval": 1.0291955471038818,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 16.836196899414062,
+ 55.33602523803711,
+ 84.32881164550781,
+ 92.9534912109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000854950922075659,
+ 0.00036200409522280097,
+ 0.00018266236293129623,
+ 0.0001705951290205121,
+ 0.00014654053666163236
+ ],
+ "bp_grad_F": [
+ 0.06433594971895218,
+ 0.0289771668612957,
+ 0.017391620203852654,
+ 0.015173865482211113,
+ 0.012928354553878307
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6330000162124634,
+ "loss_eval": 1.076339840888977,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 19.05539894104004,
+ 69.66182708740234,
+ 97.1963119506836,
+ 102.74567413330078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008397337514907122,
+ 0.00034183592651970685,
+ 0.00018204437219537795,
+ 0.00017718512390274554,
+ 0.0001551504828967154
+ ],
+ "bp_grad_F": [
+ 0.062221452593803406,
+ 0.027522921562194824,
+ 0.01681770198047161,
+ 0.01498384214937687,
+ 0.013089192099869251
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.643500030040741,
+ "loss_eval": 1.0531169176101685,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 23.65813636779785,
+ 86.25741577148438,
+ 120.24312591552734,
+ 124.2949447631836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008297308231703937,
+ 0.0003140757908113301,
+ 0.00017996964743360877,
+ 0.00017669204680714756,
+ 0.00015717324276920408
+ ],
+ "bp_grad_F": [
+ 0.06484393030405045,
+ 0.028613954782485962,
+ 0.01715104468166828,
+ 0.01567785255610943,
+ 0.014462707564234734
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6255000233650208,
+ "loss_eval": 1.3249526023864746,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 30.92644500732422,
+ 102.1397705078125,
+ 147.9296417236328,
+ 157.7542266845703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008446995634585619,
+ 0.000312876160023734,
+ 0.00019047399109695107,
+ 0.00018901094153989106,
+ 0.00017103466961998492
+ ],
+ "bp_grad_F": [
+ 0.063303142786026,
+ 0.02876628190279007,
+ 0.01635562814772129,
+ 0.015436392277479172,
+ 0.014697290025651455
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6045000553131104,
+ "loss_eval": 1.394450306892395,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 40.05237579345703,
+ 123.65401458740234,
+ 173.33119201660156,
+ 188.9973907470703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008657039143145084,
+ 0.0003323613782413304,
+ 0.0002161249576602131,
+ 0.0002138354757335037,
+ 0.00019650986359920353
+ ],
+ "bp_grad_F": [
+ 0.054496586322784424,
+ 0.025836922228336334,
+ 0.0159344132989645,
+ 0.015238149091601372,
+ 0.014629158191382885
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5950000286102295,
+ "loss_eval": 1.1977143287658691,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 50.589420318603516,
+ 147.02255249023438,
+ 197.975830078125,
+ 217.0601806640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008191568194888532,
+ 0.00030697352485731244,
+ 0.00021884859597776085,
+ 0.00021713844034820795,
+ 0.00020184220920782536
+ ],
+ "bp_grad_F": [
+ 0.04439451918005943,
+ 0.021627753973007202,
+ 0.015079431235790253,
+ 0.0144795598462224,
+ 0.014037052169442177
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6115000247955322,
+ "loss_eval": 1.1207692623138428,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 61.36143112182617,
+ 169.08056640625,
+ 221.02748107910156,
+ 240.8756561279297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007864299113862216,
+ 0.0002859561063814908,
+ 0.0002155074180336669,
+ 0.00021533406106755137,
+ 0.00020066267461515963
+ ],
+ "bp_grad_F": [
+ 0.04005742073059082,
+ 0.01873522810637951,
+ 0.014609597623348236,
+ 0.014084910042583942,
+ 0.013653460890054703
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6175000071525574,
+ "loss_eval": 1.059693694114685,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 72.36003875732422,
+ 188.58563232421875,
+ 241.86294555664062,
+ 258.58087158203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007837018347345293,
+ 0.0002863232512027025,
+ 0.00022506402456201613,
+ 0.00022481133055407554,
+ 0.00021070068760309368
+ ],
+ "bp_grad_F": [
+ 0.039807844907045364,
+ 0.01775156892836094,
+ 0.01470963191241026,
+ 0.014359688386321068,
+ 0.01395167876034975
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6025000214576721,
+ "loss_eval": 1.1027324199676514,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 81.18446350097656,
+ 200.67935180664062,
+ 257.0839538574219,
+ 267.81317138671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00082020164700225,
+ 0.0003102799819316715,
+ 0.0002470446634106338,
+ 0.0002463961427565664,
+ 0.00023495900677517056
+ ],
+ "bp_grad_F": [
+ 0.041444260627031326,
+ 0.01803578995168209,
+ 0.014944672584533691,
+ 0.014712288975715637,
+ 0.014517528004944324
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5820000171661377,
+ "loss_eval": 1.146970272064209,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 91.12315368652344,
+ 208.71234130859375,
+ 269.7666931152344,
+ 278.79949951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008638632134534419,
+ 0.0003278621006757021,
+ 0.00026185397291556,
+ 0.00026034258189611137,
+ 0.0002510476915631443
+ ],
+ "bp_grad_F": [
+ 0.04429177567362785,
+ 0.018727537244558334,
+ 0.015489915385842323,
+ 0.01529665943235159,
+ 0.015330186113715172
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5394999980926514,
+ "loss_eval": 1.2919961214065552,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 104.20027160644531,
+ 224.12327575683594,
+ 292.86212158203125,
+ 302.2417297363281
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008091026684269309,
+ 0.0002788364654406905,
+ 0.0002307023387402296,
+ 0.0002291825512656942,
+ 0.0002224020572612062
+ ],
+ "bp_grad_F": [
+ 0.043314289301633835,
+ 0.018204446882009506,
+ 0.01538326870650053,
+ 0.015148352831602097,
+ 0.015248478390276432
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615000128746033,
+ "loss_eval": 1.3774936199188232,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 119.46916198730469,
+ 246.84373474121094,
+ 322.8492736816406,
+ 331.5632019042969
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007946055266074836,
+ 0.0002993302186951041,
+ 0.0002581049920991063,
+ 0.00025690835900604725,
+ 0.00025083290529437363
+ ],
+ "bp_grad_F": [
+ 0.04004265367984772,
+ 0.017564039677381516,
+ 0.015413369052112103,
+ 0.01514766737818718,
+ 0.015221393667161465
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5430000424385071,
+ "loss_eval": 1.3054314851760864,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 136.81655883789062,
+ 275.0496826171875,
+ 359.30596923828125,
+ 365.4009704589844
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007907089893706143,
+ 0.00031880626920610666,
+ 0.00028100365307182074,
+ 0.0002786303812172264,
+ 0.00027127860812470317
+ ],
+ "bp_grad_F": [
+ 0.03825194016098976,
+ 0.017261793836951256,
+ 0.01555734220892191,
+ 0.01527914684265852,
+ 0.015313600189983845
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5270000100135803,
+ "loss_eval": 1.3047609329223633,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 154.3377227783203,
+ 303.1491394042969,
+ 395.8551330566406,
+ 398.4109191894531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007455120794475079,
+ 0.0002850848250091076,
+ 0.00025729817571118474,
+ 0.00025698516401462257,
+ 0.0002516870736144483
+ ],
+ "bp_grad_F": [
+ 0.03626802936196327,
+ 0.01676987297832966,
+ 0.015425236895680428,
+ 0.015152523294091225,
+ 0.015204805880784988
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5555000305175781,
+ "loss_eval": 1.2945412397384644,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 172.51333618164062,
+ 332.53106689453125,
+ 434.6177978515625,
+ 432.9015197753906
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007499566418118775,
+ 0.00028473397833295166,
+ 0.0002601774758659303,
+ 0.0002574811805970967,
+ 0.00025375629775226116
+ ],
+ "bp_grad_F": [
+ 0.035628896206617355,
+ 0.016559967771172523,
+ 0.015500359237194061,
+ 0.015283019281923771,
+ 0.01530501153320074
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5250000357627869,
+ "loss_eval": 1.348174810409546,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 191.6818084716797,
+ 362.3817138671875,
+ 473.73529052734375,
+ 468.3863830566406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00077909289393574,
+ 0.0003061260504182428,
+ 0.0002848915464710444,
+ 0.000283668254269287,
+ 0.00027828654856421053
+ ],
+ "bp_grad_F": [
+ 0.03710347041487694,
+ 0.01679745502769947,
+ 0.01587643474340439,
+ 0.01569107361137867,
+ 0.015713181346654892
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.48750001192092896,
+ "loss_eval": 1.513879418373108,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 212.49392700195312,
+ 393.7915954589844,
+ 515.7852172851562,
+ 507.1173095703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007443951326422393,
+ 0.000309632858261466,
+ 0.00028767462936230004,
+ 0.0002863617264665663,
+ 0.00028263547574169934
+ ],
+ "bp_grad_F": [
+ 0.034536320716142654,
+ 0.01654498465359211,
+ 0.015813451260328293,
+ 0.015621310099959373,
+ 0.0156637541949749
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5090000033378601,
+ "loss_eval": 1.345898151397705,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 231.91209411621094,
+ 422.3776550292969,
+ 553.1364135742188,
+ 540.5762329101562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007372196414507926,
+ 0.0002908413589466363,
+ 0.00027582875918596983,
+ 0.0002760514325927943,
+ 0.00027193804271519184
+ ],
+ "bp_grad_F": [
+ 0.034806184470653534,
+ 0.01654907502233982,
+ 0.01595865748822689,
+ 0.01580234244465828,
+ 0.01584061235189438
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4970000088214874,
+ "loss_eval": 1.4695581197738647,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 251.87222290039062,
+ 452.5732116699219,
+ 591.4275512695312,
+ 574.1845703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007362416945397854,
+ 0.0002964947489090264,
+ 0.0002815316547639668,
+ 0.0002831071906257421,
+ 0.0002781452494673431
+ ],
+ "bp_grad_F": [
+ 0.034162748605012894,
+ 0.016219308599829674,
+ 0.01574064791202545,
+ 0.015600688755512238,
+ 0.015627028420567513
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.48100003600120544,
+ "loss_eval": 1.4220975637435913,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 272.3019104003906,
+ 483.1678161621094,
+ 631.2042846679688,
+ 609.8804931640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007130270241759717,
+ 0.0003075756540056318,
+ 0.00029428518610075116,
+ 0.00029221284785307944,
+ 0.0002892380871344358
+ ],
+ "bp_grad_F": [
+ 0.033144623041152954,
+ 0.01614796556532383,
+ 0.015754450112581253,
+ 0.015617748722434044,
+ 0.015651794150471687
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.49550002813339233,
+ "loss_eval": 1.398095726966858,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 293.1174621582031,
+ 513.9456176757812,
+ 671.4954223632812,
+ 646.9434204101562
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007292498485185206,
+ 0.0003146968665532768,
+ 0.0003013227542396635,
+ 0.000301573658362031,
+ 0.00029794115107506514
+ ],
+ "bp_grad_F": [
+ 0.033789947628974915,
+ 0.016436096280813217,
+ 0.016089752316474915,
+ 0.015960095450282097,
+ 0.0159769207239151
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4570000171661377,
+ "loss_eval": 1.5174756050109863,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 312.291748046875,
+ 542.6367797851562,
+ 708.0426025390625,
+ 679.9037475585938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007159899105317891,
+ 0.0003197023761458695,
+ 0.00030903122387826443,
+ 0.0003080730966757983,
+ 0.00030512994271703064
+ ],
+ "bp_grad_F": [
+ 0.03305007144808769,
+ 0.016458848491311073,
+ 0.0161746796220541,
+ 0.01604822278022766,
+ 0.016068853437900543
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.45350003242492676,
+ "loss_eval": 1.4785963296890259,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 330.2493896484375,
+ 569.4765625,
+ 741.90380859375,
+ 710.49609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007181349792517722,
+ 0.0003215835604351014,
+ 0.00031238331575877964,
+ 0.00031264303834177554,
+ 0.0003104021889157593
+ ],
+ "bp_grad_F": [
+ 0.0329170823097229,
+ 0.016988366842269897,
+ 0.01674317568540573,
+ 0.01661907136440277,
+ 0.01665792241692543
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4320000112056732,
+ "loss_eval": 1.545434594154358,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 348.3463439941406,
+ 596.8388061523438,
+ 776.8276977539062,
+ 742.1928100585938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006930733215995133,
+ 0.0003099350433330983,
+ 0.0003020780859515071,
+ 0.0003008935309480876,
+ 0.00029881703085266054
+ ],
+ "bp_grad_F": [
+ 0.03210154175758362,
+ 0.0165875144302845,
+ 0.016380906105041504,
+ 0.016269827261567116,
+ 0.01630542054772377
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.46150001883506775,
+ "loss_eval": 1.4990708827972412,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 367.8572998046875,
+ 624.6773071289062,
+ 813.023193359375,
+ 774.825439453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006842412985861301,
+ 0.00032654378446750343,
+ 0.00031924000359140337,
+ 0.0003176531463395804,
+ 0.00031533741275779903
+ ],
+ "bp_grad_F": [
+ 0.03194142132997513,
+ 0.016769496724009514,
+ 0.01658361405134201,
+ 0.016465021297335625,
+ 0.016491062939167023
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4345000088214874,
+ "loss_eval": 1.5226876735687256,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 386.9555969238281,
+ 652.0831298828125,
+ 847.6653442382812,
+ 805.962158203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007009130204096437,
+ 0.00033408711897209287,
+ 0.00032650009961798787,
+ 0.00032573731732554734,
+ 0.00032366803498007357
+ ],
+ "bp_grad_F": [
+ 0.032547831535339355,
+ 0.01727951131761074,
+ 0.017110776156187057,
+ 0.017009133473038673,
+ 0.017040319740772247
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4025000333786011,
+ "loss_eval": 1.6661202907562256,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 405.57061767578125,
+ 678.9530639648438,
+ 881.5497436523438,
+ 835.913330078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006714131450280547,
+ 0.00031647825380787253,
+ 0.0003093808190897107,
+ 0.00030856815283186734,
+ 0.00030731584411114454
+ ],
+ "bp_grad_F": [
+ 0.030830882489681244,
+ 0.016467954963445663,
+ 0.016322584822773933,
+ 0.016228536143898964,
+ 0.01625511236488819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.44850000739097595,
+ "loss_eval": 1.5340722799301147,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 423.3720703125,
+ 705.0136108398438,
+ 914.5001831054688,
+ 865.4478759765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006793327047489583,
+ 0.0003244458057451993,
+ 0.0003182501532137394,
+ 0.00031923994538374245,
+ 0.00031612347811460495
+ ],
+ "bp_grad_F": [
+ 0.03101767599582672,
+ 0.01673293113708496,
+ 0.01659614033997059,
+ 0.016509832814335823,
+ 0.01653491146862507
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.42000001668930054,
+ "loss_eval": 1.6198900938034058,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 440.53741455078125,
+ 729.8703002929688,
+ 945.1349487304688,
+ 892.7785034179688
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006624915986321867,
+ 0.00031068388489075005,
+ 0.00030363586847670376,
+ 0.00030243129003793,
+ 0.00030108148348517716
+ ],
+ "bp_grad_F": [
+ 0.030339404940605164,
+ 0.01675509847700596,
+ 0.016639690846204758,
+ 0.01655009388923645,
+ 0.016594169661402702
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4280000329017639,
+ "loss_eval": 1.6058467626571655,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 457.5261535644531,
+ 754.3056640625,
+ 975.5144653320312,
+ 919.8758544921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006706257117912173,
+ 0.0003283233381807804,
+ 0.00032177154207602143,
+ 0.0003207549743819982,
+ 0.0003196784819010645
+ ],
+ "bp_grad_F": [
+ 0.03072393499314785,
+ 0.016925832256674767,
+ 0.01681169681251049,
+ 0.01673683524131775,
+ 0.016768047586083412
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.39000001549720764,
+ "loss_eval": 1.7052431106567383,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 474.70233154296875,
+ 778.4963989257812,
+ 1005.5798950195312,
+ 947.08251953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006340838735923171,
+ 0.00030884164152666926,
+ 0.000303937413264066,
+ 0.00030318956123664975,
+ 0.0003018545394297689
+ ],
+ "bp_grad_F": [
+ 0.02923908829689026,
+ 0.016514884307980537,
+ 0.016419367864727974,
+ 0.016349095851182938,
+ 0.0163878221064806
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4390000104904175,
+ "loss_eval": 1.564381718635559,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 489.3309631347656,
+ 799.4293823242188,
+ 1031.868408203125,
+ 970.6136474609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006363792927004397,
+ 0.00032453436870127916,
+ 0.000319232844049111,
+ 0.0003183995431754738,
+ 0.00031706615118309855
+ ],
+ "bp_grad_F": [
+ 0.02950570173561573,
+ 0.016813522204756737,
+ 0.016721611842513084,
+ 0.016652515158057213,
+ 0.016693497076630592
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.42100003361701965,
+ "loss_eval": 1.605594515800476,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 502.8161315917969,
+ 819.462890625,
+ 1056.7576904296875,
+ 992.5881958007812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006477028946392238,
+ 0.00033125586924143136,
+ 0.0003257581265643239,
+ 0.000326100125676021,
+ 0.00032460023066960275
+ ],
+ "bp_grad_F": [
+ 0.029688136652112007,
+ 0.01694806106388569,
+ 0.01685865968465805,
+ 0.016797136515378952,
+ 0.016836510971188545
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3830000162124634,
+ "loss_eval": 1.673546552658081,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 517.00634765625,
+ 839.9920654296875,
+ 1082.26025390625,
+ 1015.0608520507812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006337560480460525,
+ 0.0003340205585118383,
+ 0.00032972541521303356,
+ 0.00032889688736759126,
+ 0.0003277511859778315
+ ],
+ "bp_grad_F": [
+ 0.029322637245059013,
+ 0.01695762574672699,
+ 0.016879092901945114,
+ 0.01681896671652794,
+ 0.016858574002981186
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.38350000977516174,
+ "loss_eval": 1.6975816488265991,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 529.66064453125,
+ 858.3285522460938,
+ 1104.83544921875,
+ 1035.074951171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006231985753402114,
+ 0.00033350964076817036,
+ 0.00032944625127129257,
+ 0.00032876565819606185,
+ 0.00032806835952214897
+ ],
+ "bp_grad_F": [
+ 0.029069310054183006,
+ 0.016890447586774826,
+ 0.016818689182400703,
+ 0.016763897612690926,
+ 0.016804050654172897
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3930000066757202,
+ "loss_eval": 1.676193356513977,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 541.9931030273438,
+ 875.95556640625,
+ 1126.6197509765625,
+ 1054.3516845703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006226357654668391,
+ 0.00032438969356007874,
+ 0.0003203299711458385,
+ 0.0003203903906978667,
+ 0.00031863307231105864
+ ],
+ "bp_grad_F": [
+ 0.028472919017076492,
+ 0.016746005043387413,
+ 0.016683315858244896,
+ 0.016633223742246628,
+ 0.016673142090439796
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4165000319480896,
+ "loss_eval": 1.6569225788116455,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 555.5247802734375,
+ 895.108642578125,
+ 1150.2750244140625,
+ 1075.3402099609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006058313883841038,
+ 0.00031499756732955575,
+ 0.00031102998764254153,
+ 0.0003108317614533007,
+ 0.00030999473528936505
+ ],
+ "bp_grad_F": [
+ 0.028057299554347992,
+ 0.016642672941088676,
+ 0.016584018245339394,
+ 0.016536688432097435,
+ 0.016577772796154022
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41850000619888306,
+ "loss_eval": 1.622230887413025,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 566.745361328125,
+ 911.0077514648438,
+ 1169.5748291015625,
+ 1092.4599609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000616180885117501,
+ 0.0003297157527413219,
+ 0.00032601068960502744,
+ 0.0003262106911279261,
+ 0.00032522634137421846
+ ],
+ "bp_grad_F": [
+ 0.02835526503622532,
+ 0.016961509361863136,
+ 0.016903148964047432,
+ 0.01685917004942894,
+ 0.01690032333135605
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.39250001311302185,
+ "loss_eval": 1.714435338973999,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 578.6380004882812,
+ 927.9735107421875,
+ 1190.5294189453125,
+ 1111.001220703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006051660166122019,
+ 0.0003138712199870497,
+ 0.0003094248822890222,
+ 0.000309422001009807,
+ 0.0003081281029153615
+ ],
+ "bp_grad_F": [
+ 0.027995921671390533,
+ 0.016778133809566498,
+ 0.016729604452848434,
+ 0.01668645441532135,
+ 0.016727875918149948
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40450000762939453,
+ "loss_eval": 1.6801645755767822,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 591.34326171875,
+ 945.9314575195312,
+ 1212.5030517578125,
+ 1130.69580078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000600961095187813,
+ 0.00032534165075048804,
+ 0.0003221939841751009,
+ 0.00032207692856900394,
+ 0.00032122948323376477
+ ],
+ "bp_grad_F": [
+ 0.027977745980024338,
+ 0.017148323357105255,
+ 0.017105158418416977,
+ 0.017058631405234337,
+ 0.01710781268775463
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3930000066757202,
+ "loss_eval": 1.7086997032165527,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 602.791015625,
+ 962.1253051757812,
+ 1232.407958984375,
+ 1148.6063232421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005954196094535291,
+ 0.00032203743467107415,
+ 0.0003193309239577502,
+ 0.00031976529862731695,
+ 0.00031836770358495414
+ ],
+ "bp_grad_F": [
+ 0.027640262618660927,
+ 0.016875414177775383,
+ 0.01683391071856022,
+ 0.016794128343462944,
+ 0.016835639253258705
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.38750001788139343,
+ "loss_eval": 1.7161617279052734,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 613.0055541992188,
+ 976.7833251953125,
+ 1250.490966796875,
+ 1164.8575439453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005885999999009073,
+ 0.00031236460199579597,
+ 0.00030869650072418153,
+ 0.00030896696262061596,
+ 0.0003076815919484943
+ ],
+ "bp_grad_F": [
+ 0.027101732790470123,
+ 0.01670675352215767,
+ 0.016670193523168564,
+ 0.01663014106452465,
+ 0.016672657802700996
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41100001335144043,
+ "loss_eval": 1.6481956243515015,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 622.8380126953125,
+ 990.931640625,
+ 1267.7691650390625,
+ 1180.291015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000587237358558923,
+ 0.0003190709976479411,
+ 0.0003160224005114287,
+ 0.00031612091697752476,
+ 0.00031501890043728054
+ ],
+ "bp_grad_F": [
+ 0.027042290195822716,
+ 0.016803324222564697,
+ 0.016769535839557648,
+ 0.016731148585677147,
+ 0.016775181517004967
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40450000762939453,
+ "loss_eval": 1.6591061353683472,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 632.4323120117188,
+ 1004.666259765625,
+ 1284.4637451171875,
+ 1195.189697265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005885775317437947,
+ 0.0003397047985345125,
+ 0.0003383393050171435,
+ 0.00033765248372219503,
+ 0.00033701834036037326
+ ],
+ "bp_grad_F": [
+ 0.027301670983433723,
+ 0.017337650060653687,
+ 0.017313728109002113,
+ 0.017269184812903404,
+ 0.0173148512840271
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3565000295639038,
+ "loss_eval": 1.7250425815582275,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 639.983154296875,
+ 1015.8214721679688,
+ 1297.94091796875,
+ 1207.160400390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005771536380052567,
+ 0.00031455705175176263,
+ 0.0003114652936346829,
+ 0.0003115544968750328,
+ 0.00031060961191542447
+ ],
+ "bp_grad_F": [
+ 0.026900731027126312,
+ 0.01682351529598236,
+ 0.01679442636668682,
+ 0.016759345307946205,
+ 0.016801798716187477
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.398000031709671,
+ "loss_eval": 1.6931191682815552,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 648.44189453125,
+ 1027.905517578125,
+ 1312.5484619140625,
+ 1220.3349609375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005807234556414187,
+ 0.0003243165265303105,
+ 0.00032131426269188523,
+ 0.0003215263714082539,
+ 0.0003202861698810011
+ ],
+ "bp_grad_F": [
+ 0.02689860761165619,
+ 0.016972798854112625,
+ 0.016945669427514076,
+ 0.016909556463360786,
+ 0.01695423573255539
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3850000202655792,
+ "loss_eval": 1.713501214981079,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 656.1256103515625,
+ 1038.9337158203125,
+ 1326.0384521484375,
+ 1232.491455078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005809550639241934,
+ 0.0003213974996469915,
+ 0.0003191177383996546,
+ 0.0003187706752214581,
+ 0.0003176441532559693
+ ],
+ "bp_grad_F": [
+ 0.026944397017359734,
+ 0.016979368403553963,
+ 0.01695428043603897,
+ 0.01692255586385727,
+ 0.016963332891464233
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3800000250339508,
+ "loss_eval": 1.7483241558074951,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 663.1458740234375,
+ 1049.1085205078125,
+ 1338.4049072265625,
+ 1243.709228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005775660974904895,
+ 0.00032701215241104364,
+ 0.000323877960909158,
+ 0.00032368660322390497,
+ 0.00032316104625351727
+ ],
+ "bp_grad_F": [
+ 0.026842813938856125,
+ 0.017009008675813675,
+ 0.016984863206744194,
+ 0.016950154677033424,
+ 0.016992947086691856
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.36650002002716064,
+ "loss_eval": 1.7447302341461182,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 669.32080078125,
+ 1058.1265869140625,
+ 1349.383544921875,
+ 1253.68603515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005691531114280224,
+ 0.0003169954870827496,
+ 0.0003141614724881947,
+ 0.00031412398675456643,
+ 0.00031352281803265214
+ ],
+ "bp_grad_F": [
+ 0.026560034602880478,
+ 0.01695145107805729,
+ 0.016930771991610527,
+ 0.016894754022359848,
+ 0.016942735761404037
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3830000162124634,
+ "loss_eval": 1.7227482795715332,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 675.035888671875,
+ 1066.407958984375,
+ 1359.420654296875,
+ 1262.8460693359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000574529985897243,
+ 0.000330567971104756,
+ 0.0003291864413768053,
+ 0.0003286501159891486,
+ 0.00032822080538608134
+ ],
+ "bp_grad_F": [
+ 0.02670128643512726,
+ 0.017140112817287445,
+ 0.017120162025094032,
+ 0.01708981581032276,
+ 0.017130881547927856
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.37800002098083496,
+ "loss_eval": 1.7512460947036743,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 680.7155151367188,
+ 1074.5833740234375,
+ 1369.3917236328125,
+ 1271.9488525390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005727651296183467,
+ 0.00031855711131356657,
+ 0.0003159786283504218,
+ 0.00031576541368849576,
+ 0.0003150397096760571
+ ],
+ "bp_grad_F": [
+ 0.02646380476653576,
+ 0.016906103119254112,
+ 0.016886914148926735,
+ 0.016857335343956947,
+ 0.016896924003958702
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.39100003242492676,
+ "loss_eval": 1.7765766382217407,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 685.6483154296875,
+ 1081.7335205078125,
+ 1378.0848388671875,
+ 1279.824462890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005669392994605005,
+ 0.00032193740480579436,
+ 0.0003195095050614327,
+ 0.00031930883415043354,
+ 0.00031847937498241663
+ ],
+ "bp_grad_F": [
+ 0.02628612145781517,
+ 0.01694479025900364,
+ 0.016926957294344902,
+ 0.016897274181246758,
+ 0.016937877982854843
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.38200002908706665,
+ "loss_eval": 1.6996668577194214,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 690.3829345703125,
+ 1088.4320068359375,
+ 1386.209228515625,
+ 1287.180908203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005609798245131969,
+ 0.0003164574736729264,
+ 0.00031414616387337446,
+ 0.0003141844645142555,
+ 0.0003133733116555959
+ ],
+ "bp_grad_F": [
+ 0.025919275358319283,
+ 0.01681407354772091,
+ 0.016797930002212524,
+ 0.01676807552576065,
+ 0.016810856759548187
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4035000205039978,
+ "loss_eval": 1.6783148050308228,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 694.658935546875,
+ 1094.5535888671875,
+ 1393.6761474609375,
+ 1293.9659423828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005624280893243849,
+ 0.00031574408058077097,
+ 0.0003139691543765366,
+ 0.00031461575417779386,
+ 0.00031346286414191127
+ ],
+ "bp_grad_F": [
+ 0.02617610991001129,
+ 0.016873449087142944,
+ 0.016857409849762917,
+ 0.01682792603969574,
+ 0.016867902129888535
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3830000162124634,
+ "loss_eval": 1.7127265930175781,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 698.4141235351562,
+ 1099.921875,
+ 1400.2060546875,
+ 1299.92919921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005497613456100225,
+ 0.00031591873266734183,
+ 0.00031333384686149657,
+ 0.00031392619712278247,
+ 0.00031339324777945876
+ ],
+ "bp_grad_F": [
+ 0.025806115940213203,
+ 0.016780776903033257,
+ 0.016766363754868507,
+ 0.016736920922994614,
+ 0.01677793264389038
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4165000319480896,
+ "loss_eval": 1.6823266744613647,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 701.8402099609375,
+ 1104.8636474609375,
+ 1406.2545166015625,
+ 1305.4110107421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005536439130082726,
+ 0.0003222717496100813,
+ 0.0003193898010067642,
+ 0.0003197654150426388,
+ 0.00031906200456433
+ ],
+ "bp_grad_F": [
+ 0.02591872774064541,
+ 0.016899071633815765,
+ 0.01688431203365326,
+ 0.01685412786900997,
+ 0.016896730288863182
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3895000219345093,
+ "loss_eval": 1.6973413228988647,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 704.84814453125,
+ 1109.2054443359375,
+ 1411.5528564453125,
+ 1310.220458984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005509129259735346,
+ 0.0003127358213532716,
+ 0.00031018650042824447,
+ 0.00031017058063298464,
+ 0.0003093581763096154
+ ],
+ "bp_grad_F": [
+ 0.02567744068801403,
+ 0.01674523949623108,
+ 0.01673281565308571,
+ 0.016704324632883072,
+ 0.01674455776810646
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40400001406669617,
+ "loss_eval": 1.6765486001968384,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 707.4666137695312,
+ 1112.9517822265625,
+ 1416.120361328125,
+ 1314.365478515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005525590386241674,
+ 0.0003146192757412791,
+ 0.000312337331706658,
+ 0.0003126179799437523,
+ 0.00031193779432214797
+ ],
+ "bp_grad_F": [
+ 0.025625307112932205,
+ 0.016738714650273323,
+ 0.01672603376209736,
+ 0.016697421669960022,
+ 0.016738519072532654
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.406000018119812,
+ "loss_eval": 1.681616187095642,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 709.6942749023438,
+ 1116.1553955078125,
+ 1420.0328369140625,
+ 1317.9129638671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005520040867850184,
+ 0.0003149699477944523,
+ 0.0003132218262180686,
+ 0.00031297295936383307,
+ 0.0003122398047707975
+ ],
+ "bp_grad_F": [
+ 0.02563839592039585,
+ 0.01678294688463211,
+ 0.016770213842391968,
+ 0.01674121432006359,
+ 0.01678287237882614
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3985000252723694,
+ "loss_eval": 1.6824655532836914,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 711.4514770507812,
+ 1118.6820068359375,
+ 1423.118408203125,
+ 1320.7220458984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005478749517351389,
+ 0.0003126654773950577,
+ 0.00031092006247490644,
+ 0.0003107163356617093,
+ 0.00030992255778983235
+ ],
+ "bp_grad_F": [
+ 0.025653105229139328,
+ 0.016804352402687073,
+ 0.01679334044456482,
+ 0.016765642911195755,
+ 0.016805216670036316
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3970000147819519,
+ "loss_eval": 1.6816198825836182,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 712.941162109375,
+ 1120.8258056640625,
+ 1425.7293701171875,
+ 1323.110595703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005502297426573932,
+ 0.00031594440224580467,
+ 0.00031323955045081675,
+ 0.0003133862919639796,
+ 0.00031268122256733477
+ ],
+ "bp_grad_F": [
+ 0.025557825341820717,
+ 0.01675795204937458,
+ 0.01674625650048256,
+ 0.01671820878982544,
+ 0.016758527606725693
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4025000333786011,
+ "loss_eval": 1.6777657270431519,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 714.2026977539062,
+ 1122.637451171875,
+ 1427.94921875,
+ 1325.1287841796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005491463234648108,
+ 0.0003148230316583067,
+ 0.00031261687399819493,
+ 0.0003126751398667693,
+ 0.00031198892975226045
+ ],
+ "bp_grad_F": [
+ 0.025629354640841484,
+ 0.016796274110674858,
+ 0.016784505918622017,
+ 0.016756094992160797,
+ 0.01679658703505993
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3985000252723694,
+ "loss_eval": 1.6832109689712524,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 715.1837158203125,
+ 1124.0401611328125,
+ 1429.676025390625,
+ 1326.6959228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005472805933095515,
+ 0.00031123129883781075,
+ 0.0003085967618972063,
+ 0.00030910191708244383,
+ 0.00030826785950921476
+ ],
+ "bp_grad_F": [
+ 0.025491509586572647,
+ 0.01673061214387417,
+ 0.016719412058591843,
+ 0.01669108308851719,
+ 0.016732096672058105
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41350001096725464,
+ "loss_eval": 1.6768076419830322,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 715.9666137695312,
+ 1125.15869140625,
+ 1431.054931640625,
+ 1327.940185546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005469402531161904,
+ 0.0003141815832350403,
+ 0.0003117373853456229,
+ 0.0003121092449873686,
+ 0.00031146654509939253
+ ],
+ "bp_grad_F": [
+ 0.02553613670170307,
+ 0.016766469925642014,
+ 0.016755321994423866,
+ 0.01672743633389473,
+ 0.01676766574382782
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40050002932548523,
+ "loss_eval": 1.6803343296051025,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 716.54345703125,
+ 1125.9932861328125,
+ 1432.0760498046875,
+ 1328.8612060546875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000544340000487864,
+ 0.0003152569697704166,
+ 0.00031408306676894426,
+ 0.00031385221518576145,
+ 0.0003130683908239007
+ ],
+ "bp_grad_F": [
+ 0.025559071451425552,
+ 0.016799958422780037,
+ 0.01678895764052868,
+ 0.016760708764195442,
+ 0.01680118963122368
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40050002932548523,
+ "loss_eval": 1.6816425323486328,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 716.944580078125,
+ 1126.5697021484375,
+ 1432.786376953125,
+ 1329.5032958984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005474911304190755,
+ 0.00031179687357507646,
+ 0.0003097430744674057,
+ 0.00030947139021009207,
+ 0.00030854580109007657
+ ],
+ "bp_grad_F": [
+ 0.025479920208454132,
+ 0.01673789508640766,
+ 0.016726836562156677,
+ 0.016698846593499184,
+ 0.01673932373523712
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4010000228881836,
+ "loss_eval": 1.6769893169403076,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.2020263671875,
+ 1126.9422607421875,
+ 1433.2410888671875,
+ 1329.9195556640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000546319643035531,
+ 0.00031345203751698136,
+ 0.000311522395350039,
+ 0.000311847630655393,
+ 0.0003111722180619836
+ ],
+ "bp_grad_F": [
+ 0.025481175631284714,
+ 0.01675844006240368,
+ 0.016747308894991875,
+ 0.016719479113817215,
+ 0.0167598407715559
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4075000286102295,
+ "loss_eval": 1.6769570112228394,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.3436889648438,
+ 1127.1475830078125,
+ 1433.49072265625,
+ 1330.1451416015625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005438647349365056,
+ 0.00031364860478788614,
+ 0.0003113296115770936,
+ 0.0003115428553428501,
+ 0.00031094413134269416
+ ],
+ "bp_grad_F": [
+ 0.025495020672678947,
+ 0.016764776781201363,
+ 0.016753805801272392,
+ 0.016725784167647362,
+ 0.016766248270869255
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.40800002217292786,
+ "loss_eval": 1.6758222579956055,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.4073486328125,
+ 1127.239501953125,
+ 1433.60302734375,
+ 1330.2476806640625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005444776033982635,
+ 0.0003124381182715297,
+ 0.0003098779125139117,
+ 0.0003102763439528644,
+ 0.0003094278508797288
+ ],
+ "bp_grad_F": [
+ 0.025471549481153488,
+ 0.016743116080760956,
+ 0.016732197254896164,
+ 0.016704153269529343,
+ 0.016744764521718025
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41450002789497375,
+ "loss_eval": 1.675687551498413,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 717.4231567382812,
+ 1127.262451171875,
+ 1433.6309814453125,
+ 1330.273193359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005445098504424095,
+ 0.0003131923731416464,
+ 0.00031077052699401975,
+ 0.0003107219818048179,
+ 0.00031013842090032995
+ ],
+ "bp_grad_F": [
+ 0.02547312155365944,
+ 0.016745658591389656,
+ 0.016734709963202477,
+ 0.016706665977835655,
+ 0.016747286543250084
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4140000343322754,
+ "loss_eval": 1.6754448413848877,
+ "epoch": 80
+ }
+ ],
+ "seed": 42,
+ "alpha": 1.0,
+ "depth": 4,
+ "d_hidden": 128
+} \ No newline at end of file