summaryrefslogtreecommitdiff
path: root/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_synth_v1/snapshot_fa_canonical_s42.json')
-rw-r--r--results/snapshot_synth_v1/snapshot_fa_canonical_s42.json2276
1 files changed, 2276 insertions, 0 deletions
diff --git a/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json b/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json
new file mode 100644
index 0000000..6ff85e7
--- /dev/null
+++ b/results/snapshot_synth_v1/snapshot_fa_canonical_s42.json
@@ -0,0 +1,2276 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.290447235107422,
+ 11.313605308532715,
+ 11.351215362548828,
+ 11.398087501525879
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00028353024390526116,
+ 0.0002828188880812377,
+ 0.00028162598027847707,
+ 0.0002799496578518301,
+ 0.0002791006409097463
+ ],
+ "bp_grad_F": [
+ 0.012684082612395287,
+ 0.01264861598610878,
+ 0.012589854188263416,
+ 0.012511610053479671,
+ 0.012471316382288933
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.08450000733137131,
+ "loss_eval": 2.4790313243865967,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.457883834838867,
+ 11.697802543640137,
+ 12.001762390136719,
+ 12.303658485412598
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004113642207812518,
+ 0.00037613665335811675,
+ 0.0003495849668979645,
+ 0.0003221812949050218,
+ 0.00025295966770499945
+ ],
+ "bp_grad_F": [
+ 0.018967075273394585,
+ 0.017186719924211502,
+ 0.015851320698857307,
+ 0.01445167325437069,
+ 0.011211601085960865
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5270000100135803,
+ "loss_eval": 1.4865981340408325,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.734084129333496,
+ 12.481009483337402,
+ 13.659913063049316,
+ 15.730950355529785
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007782558677718043,
+ 0.0006171928835101426,
+ 0.0004891889402642846,
+ 0.00038687532651238143,
+ 0.000231728219659999
+ ],
+ "bp_grad_F": [
+ 0.04103676602244377,
+ 0.03172670304775238,
+ 0.024926593527197838,
+ 0.019472092390060425,
+ 0.011657902970910072
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6360000371932983,
+ "loss_eval": 0.965207040309906,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 11.973358154296875,
+ 13.411399841308594,
+ 16.07562255859375,
+ 20.911983489990234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008172825910151005,
+ 0.0005784342647530138,
+ 0.000417369301430881,
+ 0.0003010776126757264,
+ 0.000168764207046479
+ ],
+ "bp_grad_F": [
+ 0.05745441094040871,
+ 0.04039904102683067,
+ 0.028755735605955124,
+ 0.020857004448771477,
+ 0.011488317511975765
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.687000036239624,
+ "loss_eval": 0.8154960870742798,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.203580856323242,
+ 14.659997940063477,
+ 19.929065704345703,
+ 27.998876571655273
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007437548483721912,
+ 0.00048129685455933213,
+ 0.00031908220262266695,
+ 0.00022696926316712052,
+ 0.00012886490731034428
+ ],
+ "bp_grad_F": [
+ 0.06721046566963196,
+ 0.043338593095541,
+ 0.028462719172239304,
+ 0.019943350926041603,
+ 0.01114331278949976
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.703000009059906,
+ "loss_eval": 0.7722610831260681,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.476441383361816,
+ 16.378177642822266,
+ 25.748563766479492,
+ 36.580970764160156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007116686902008951,
+ 0.00042677627061493695,
+ 0.0002665013598743826,
+ 0.00019125515245832503,
+ 0.0001178958555101417
+ ],
+ "bp_grad_F": [
+ 0.06977967172861099,
+ 0.04175141453742981,
+ 0.02600390836596489,
+ 0.018256530165672302,
+ 0.010964884422719479
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7070000171661377,
+ "loss_eval": 0.7697932720184326,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 12.808075904846191,
+ 19.022871017456055,
+ 33.50295639038086,
+ 45.75634002685547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000760514521971345,
+ 0.000416931085055694,
+ 0.0002524603623896837,
+ 0.00018262627418152988,
+ 0.0001200677506858483
+ ],
+ "bp_grad_F": [
+ 0.0695224478840828,
+ 0.03927718475461006,
+ 0.023749928921461105,
+ 0.01698874868452549,
+ 0.011118472553789616
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7035000324249268,
+ "loss_eval": 0.7977719902992249,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.191008567810059,
+ 22.44864273071289,
+ 42.65863800048828,
+ 54.38147735595703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007628297316841781,
+ 0.0003877072886098176,
+ 0.00022262487618718296,
+ 0.00016918807523325086,
+ 0.0001183631393359974
+ ],
+ "bp_grad_F": [
+ 0.06797165423631668,
+ 0.03639831766486168,
+ 0.02157149650156498,
+ 0.015874147415161133,
+ 0.011150078848004341
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.70250004529953,
+ "loss_eval": 0.8099735975265503,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 13.587474822998047,
+ 26.61025619506836,
+ 51.025230407714844,
+ 61.79695129394531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007774661062285304,
+ 0.00037008023355156183,
+ 0.00019806883938144892,
+ 0.0001550534798298031,
+ 0.00011658846779027954
+ ],
+ "bp_grad_F": [
+ 0.06822231411933899,
+ 0.03484996780753136,
+ 0.02039053477346897,
+ 0.015457017347216606,
+ 0.011438230983912945
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6920000314712524,
+ "loss_eval": 0.8282882571220398,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.02984619140625,
+ 31.27604866027832,
+ 59.14579391479492,
+ 68.8819580078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000821497815195471,
+ 0.000388532382203266,
+ 0.0002036481600953266,
+ 0.0001647671015234664,
+ 0.00012798182433471084
+ ],
+ "bp_grad_F": [
+ 0.06896942853927612,
+ 0.03378934785723686,
+ 0.019570810720324516,
+ 0.015211639925837517,
+ 0.01168233621865511
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6785000562667847,
+ "loss_eval": 0.8751994967460632,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 14.566975593566895,
+ 37.15107345581055,
+ 66.83728790283203,
+ 76.04595184326172
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008561373106203973,
+ 0.00037220801459625363,
+ 0.00018477423873264343,
+ 0.0001600280374987051,
+ 0.00012663347297348082
+ ],
+ "bp_grad_F": [
+ 0.06949204951524734,
+ 0.033161722123622894,
+ 0.019245225936174393,
+ 0.015247669070959091,
+ 0.012057062238454819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6585000157356262,
+ "loss_eval": 0.9142682552337646,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.22678279876709,
+ 44.73517990112305,
+ 74.21520233154297,
+ 82.72914123535156
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008647029753774405,
+ 0.0003551499976310879,
+ 0.00016902851348277181,
+ 0.00014951576304156333,
+ 0.0001220703707076609
+ ],
+ "bp_grad_F": [
+ 0.06799578666687012,
+ 0.03190648928284645,
+ 0.018390726298093796,
+ 0.015047998167574406,
+ 0.01216125674545765
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6635000109672546,
+ "loss_eval": 0.9312959313392639,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 15.982205390930176,
+ 53.03363037109375,
+ 81.01543426513672,
+ 88.02293395996094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008814894827082753,
+ 0.0003609499253798276,
+ 0.00016691464406903833,
+ 0.00015374798385892063,
+ 0.00012832213542424142
+ ],
+ "bp_grad_F": [
+ 0.06737235933542252,
+ 0.030633311718702316,
+ 0.017514588311314583,
+ 0.014722960069775581,
+ 0.012166885659098625
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6665000319480896,
+ "loss_eval": 0.9171096086502075,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 17.348485946655273,
+ 65.39360046386719,
+ 94.1773452758789,
+ 97.79885864257812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008671359973959625,
+ 0.0003543675411492586,
+ 0.00017760474293027073,
+ 0.00016833240806590766,
+ 0.0001419015898136422
+ ],
+ "bp_grad_F": [
+ 0.06303472071886063,
+ 0.027784455567598343,
+ 0.016537917777895927,
+ 0.01453208364546299,
+ 0.012470746412873268
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6520000100135803,
+ "loss_eval": 0.9543019533157349,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 19.79836082458496,
+ 82.84272003173828,
+ 118.11077880859375,
+ 117.29456329345703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000835613114759326,
+ 0.00034002913162112236,
+ 0.00017855060286819935,
+ 0.00017689696687739342,
+ 0.0001562273973831907
+ ],
+ "bp_grad_F": [
+ 0.05830768123269081,
+ 0.025488071143627167,
+ 0.01599927246570587,
+ 0.014500983990728855,
+ 0.012853534892201424
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6320000290870667,
+ "loss_eval": 0.9986603260040283,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 24.028667449951172,
+ 104.24053192138672,
+ 151.45233154296875,
+ 148.85594177246094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008604780305176973,
+ 0.0003412840305827558,
+ 0.00020471647439990193,
+ 0.00020128543837927282,
+ 0.00018673941667657346
+ ],
+ "bp_grad_F": [
+ 0.05637207254767418,
+ 0.023704711347818375,
+ 0.016045723110437393,
+ 0.015071108937263489,
+ 0.013779145665466785
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6110000014305115,
+ "loss_eval": 1.08339262008667,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 31.199304580688477,
+ 135.36643981933594,
+ 190.8426971435547,
+ 189.1505126953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000760686700232327,
+ 0.0002976131218019873,
+ 0.00019266465096734464,
+ 0.0001927861594595015,
+ 0.0001783591287676245
+ ],
+ "bp_grad_F": [
+ 0.04442710801959038,
+ 0.020077738910913467,
+ 0.0149933947250247,
+ 0.014391067437827587,
+ 0.01344863511621952
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6480000019073486,
+ "loss_eval": 1.0371382236480713,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 41.846805572509766,
+ 170.3418731689453,
+ 225.09695434570312,
+ 224.6548614501953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007461759960278869,
+ 0.00026667246129363775,
+ 0.00018387376621831208,
+ 0.00018445710884407163,
+ 0.00017204758478328586
+ ],
+ "bp_grad_F": [
+ 0.039136338979005814,
+ 0.018771812319755554,
+ 0.015547079034149647,
+ 0.01513050775974989,
+ 0.01431551855057478
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6200000047683716,
+ "loss_eval": 1.1162669658660889,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 57.18465042114258,
+ 206.83914184570312,
+ 262.21197509765625,
+ 260.03485107421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007871078560128808,
+ 0.00029353986610658467,
+ 0.00022458977764472365,
+ 0.00022484370856545866,
+ 0.00021257037587929517
+ ],
+ "bp_grad_F": [
+ 0.03888345882296562,
+ 0.01824026368558407,
+ 0.015890181064605713,
+ 0.015627194195985794,
+ 0.014916189946234226
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5615000128746033,
+ "loss_eval": 1.2106062173843384,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 75.66644287109375,
+ 241.24891662597656,
+ 298.0739440917969,
+ 293.95281982421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000782749499194324,
+ 0.0002943766303360462,
+ 0.00024086510529741645,
+ 0.00024184907670132816,
+ 0.0002289286785526201
+ ],
+ "bp_grad_F": [
+ 0.03717740252614021,
+ 0.01794801466166973,
+ 0.016123440116643906,
+ 0.0158899687230587,
+ 0.015260584652423859
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5680000185966492,
+ "loss_eval": 1.1780248880386353,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 97.68470764160156,
+ 276.2217712402344,
+ 334.56146240234375,
+ 329.1627502441406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007400053436867893,
+ 0.00028874175040982664,
+ 0.00024344309349544346,
+ 0.0002433314366498962,
+ 0.00023140427947510034
+ ],
+ "bp_grad_F": [
+ 0.03569746017456055,
+ 0.0169936865568161,
+ 0.015504195354878902,
+ 0.015339999459683895,
+ 0.014785589650273323
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5745000243186951,
+ "loss_eval": 1.1848244667053223,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 123.06426239013672,
+ 312.8515625,
+ 373.4215087890625,
+ 366.50213623046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007171913748607039,
+ 0.00026914477348327637,
+ 0.00023370776034425944,
+ 0.00023370303097181022,
+ 0.0002235924475826323
+ ],
+ "bp_grad_F": [
+ 0.03427436947822571,
+ 0.016933348029851913,
+ 0.015780098736286163,
+ 0.015659287571907043,
+ 0.015169495716691017
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5715000033378601,
+ "loss_eval": 1.2063732147216797,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 153.3316650390625,
+ 353.62042236328125,
+ 417.3258361816406,
+ 408.16680908203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007328973151743412,
+ 0.000268118514213711,
+ 0.00024018273688852787,
+ 0.00024114495317917317,
+ 0.0002314754092367366
+ ],
+ "bp_grad_F": [
+ 0.033994678407907486,
+ 0.016857070848345757,
+ 0.01595945656299591,
+ 0.01587284542620182,
+ 0.015459166839718819
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5450000166893005,
+ "loss_eval": 1.2801684141159058,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 187.16934204101562,
+ 397.18280029296875,
+ 464.5965881347656,
+ 453.26629638671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007429302204400301,
+ 0.0002756037574727088,
+ 0.0002533047809265554,
+ 0.0002549285418353975,
+ 0.00024467214825563133
+ ],
+ "bp_grad_F": [
+ 0.03400976210832596,
+ 0.017134130001068115,
+ 0.016380103304982185,
+ 0.016292234882712364,
+ 0.015935255214571953
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5055000185966492,
+ "loss_eval": 1.4238585233688354,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 221.9723663330078,
+ 441.26580810546875,
+ 512.8148193359375,
+ 498.7379455566406
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006891476223245263,
+ 0.00027131737442687154,
+ 0.0002505357551854104,
+ 0.000251909252256155,
+ 0.0002428782609058544
+ ],
+ "bp_grad_F": [
+ 0.032484397292137146,
+ 0.01684476062655449,
+ 0.01627412810921669,
+ 0.016195174306631088,
+ 0.015904447063803673
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5290000438690186,
+ "loss_eval": 1.3381338119506836,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 256.86456298828125,
+ 485.2987060546875,
+ 561.24755859375,
+ 544.2046508789062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007065363461151719,
+ 0.0002826322161126882,
+ 0.00026495553902350366,
+ 0.0002664696949068457,
+ 0.0002584822941571474
+ ],
+ "bp_grad_F": [
+ 0.032581742852926254,
+ 0.017135880887508392,
+ 0.01663898676633835,
+ 0.01656418852508068,
+ 0.016318844631314278
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.468500018119812,
+ "loss_eval": 1.4673320055007935,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 290.3281555175781,
+ 528.4644165039062,
+ 609.61181640625,
+ 589.482421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007876601885072887,
+ 0.000328866473864764,
+ 0.0003142827481497079,
+ 0.0003149702097289264,
+ 0.00030780391534790397
+ ],
+ "bp_grad_F": [
+ 0.0356873981654644,
+ 0.01825507916510105,
+ 0.01779749058187008,
+ 0.017760321497917175,
+ 0.0175130907446146
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.82278311252594,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 324.2997131347656,
+ 572.9197387695312,
+ 659.7073364257812,
+ 635.6883544921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006818437832407653,
+ 0.000307896378217265,
+ 0.0002974055823870003,
+ 0.000297438440611586,
+ 0.0002942352439276874
+ ],
+ "bp_grad_F": [
+ 0.03148573637008667,
+ 0.017155593261122704,
+ 0.016821201890707016,
+ 0.01674988865852356,
+ 0.016609078273177147
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4540000259876251,
+ "loss_eval": 1.4913204908370972,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 357.986572265625,
+ 616.8123168945312,
+ 709.2523193359375,
+ 681.3218994140625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006822228315286338,
+ 0.00030397844966501,
+ 0.0002927799359895289,
+ 0.0002928805770352483,
+ 0.0002893624478019774
+ ],
+ "bp_grad_F": [
+ 0.03142063319683075,
+ 0.017380017787218094,
+ 0.017113016918301582,
+ 0.017052780836820602,
+ 0.01693262904882431
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.42250001430511475,
+ "loss_eval": 1.574558138847351,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 391.00396728515625,
+ 660.1432495117188,
+ 758.46875,
+ 726.479248046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006576834712177515,
+ 0.00029913688194938004,
+ 0.0002909695322159678,
+ 0.00029160548001527786,
+ 0.0002882194530684501
+ ],
+ "bp_grad_F": [
+ 0.03063797578215599,
+ 0.01751694455742836,
+ 0.017304742708802223,
+ 0.017256034538149834,
+ 0.017157413065433502
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.41700002551078796,
+ "loss_eval": 1.5943682193756104,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 423.0135803222656,
+ 702.8653564453125,
+ 807.1064453125,
+ 771.0443115234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007106211851350963,
+ 0.00032867168192751706,
+ 0.0003195058961864561,
+ 0.0003205789253115654,
+ 0.00031724729342386127
+ ],
+ "bp_grad_F": [
+ 0.032083574682474136,
+ 0.018385307863354683,
+ 0.01818086951971054,
+ 0.018159352242946625,
+ 0.01808425784111023
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3240000009536743,
+ "loss_eval": 1.9495495557785034,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 453.1861267089844,
+ 743.7100219726562,
+ 853.8812255859375,
+ 813.7102661132812
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006489204824902117,
+ 0.0002889770839828998,
+ 0.00028184326947666705,
+ 0.00028282302082516253,
+ 0.00027834190404973924
+ ],
+ "bp_grad_F": [
+ 0.029847772791981697,
+ 0.017620669677853584,
+ 0.017466910183429718,
+ 0.01743420958518982,
+ 0.017375603318214417
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3970000147819519,
+ "loss_eval": 1.6998002529144287,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 480.8240661621094,
+ 781.491943359375,
+ 897.1333618164062,
+ 853.1820678710938
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006337798549793661,
+ 0.0003062748000957072,
+ 0.0003002039447892457,
+ 0.00030039221746847034,
+ 0.0002973877126350999
+ ],
+ "bp_grad_F": [
+ 0.029168229550123215,
+ 0.017783651128411293,
+ 0.017649564892053604,
+ 0.017613932490348816,
+ 0.01756826601922512
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3865000307559967,
+ "loss_eval": 1.7693381309509277,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 505.9931945800781,
+ 816.3653564453125,
+ 937.6511840820312,
+ 890.0263061523438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006363698630593717,
+ 0.000327500601997599,
+ 0.0003217202320229262,
+ 0.0003208804700989276,
+ 0.0003201036306563765
+ ],
+ "bp_grad_F": [
+ 0.029376372694969177,
+ 0.018225492909550667,
+ 0.01810493879020214,
+ 0.01805899664759636,
+ 0.018048716709017754
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3400000035762787,
+ "loss_eval": 1.777511477470398,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 530.9385375976562,
+ 850.9844970703125,
+ 977.412841796875,
+ 926.3417358398438
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006240232032723725,
+ 0.00032233193633146584,
+ 0.00031883586780168116,
+ 0.0003202730731572956,
+ 0.0003188494883943349
+ ],
+ "bp_grad_F": [
+ 0.028516914695501328,
+ 0.018217962235212326,
+ 0.018127964809536934,
+ 0.018103662878274918,
+ 0.018076416105031967
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.36250001192092896,
+ "loss_eval": 1.7461223602294922,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 555.9691162109375,
+ 885.6592407226562,
+ 1017.6103515625,
+ 962.8530883789062
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005949487676844001,
+ 0.0003172095457557589,
+ 0.00031312211649492383,
+ 0.0003130651020910591,
+ 0.0003118007443845272
+ ],
+ "bp_grad_F": [
+ 0.027917204424738884,
+ 0.018052855506539345,
+ 0.017963001504540443,
+ 0.01793370023369789,
+ 0.017934400588274002
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3775000274181366,
+ "loss_eval": 1.7961357831954956,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 580.1717529296875,
+ 919.149169921875,
+ 1056.32470703125,
+ 998.1345825195312
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006010148790664971,
+ 0.0003237369528505951,
+ 0.00031987245893105865,
+ 0.00031991174910217524,
+ 0.0003188104019500315
+ ],
+ "bp_grad_F": [
+ 0.027771273627877235,
+ 0.017915818840265274,
+ 0.017828019335865974,
+ 0.017802555114030838,
+ 0.017808666452765465
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.37400001287460327,
+ "loss_eval": 1.8124159574508667,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 602.5966186523438,
+ 950.484619140625,
+ 1092.6507568359375,
+ 1031.02294921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005852986359968781,
+ 0.0003249783185310662,
+ 0.00032142180134542286,
+ 0.0003207105037290603,
+ 0.00032108003506436944
+ ],
+ "bp_grad_F": [
+ 0.02701820805668831,
+ 0.01796947605907917,
+ 0.017892232164740562,
+ 0.017859354615211487,
+ 0.01788966730237007
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34950003027915955,
+ "loss_eval": 1.7797815799713135,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 624.4447021484375,
+ 981.1150512695312,
+ 1127.90234375,
+ 1063.09228515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005775236058980227,
+ 0.0003046133788302541,
+ 0.00030120721203275025,
+ 0.00030136521672829986,
+ 0.00029937425279058516
+ ],
+ "bp_grad_F": [
+ 0.026447290554642677,
+ 0.017799606546759605,
+ 0.017730647698044777,
+ 0.017701666802167892,
+ 0.017717311158776283
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3630000054836273,
+ "loss_eval": 1.7884948253631592,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 644.9402465820312,
+ 1010.1371459960938,
+ 1161.7808837890625,
+ 1093.9410400390625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000567529525142163,
+ 0.00032071411260403693,
+ 0.0003186226240359247,
+ 0.0003186469548381865,
+ 0.000316357531119138
+ ],
+ "bp_grad_F": [
+ 0.02652687579393387,
+ 0.018418341875076294,
+ 0.018360882997512817,
+ 0.018340308219194412,
+ 0.018352536484599113
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3375000059604645,
+ "loss_eval": 1.894034743309021,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 664.6719970703125,
+ 1038.15478515625,
+ 1194.3914794921875,
+ 1123.5455322265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005615526461042464,
+ 0.0003110080724582076,
+ 0.00030868081375956535,
+ 0.00030884178704582155,
+ 0.0003081669274251908
+ ],
+ "bp_grad_F": [
+ 0.025895435363054276,
+ 0.01783018186688423,
+ 0.017772147431969643,
+ 0.017754852771759033,
+ 0.01777641288936138
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3395000100135803,
+ "loss_eval": 1.9033000469207764,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 683.78173828125,
+ 1065.281005859375,
+ 1225.9638671875,
+ 1152.131591796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005448339506983757,
+ 0.0003069988451898098,
+ 0.0003048715298064053,
+ 0.0003052430984098464,
+ 0.00030476890970021486
+ ],
+ "bp_grad_F": [
+ 0.025077223777770996,
+ 0.017541181296110153,
+ 0.017490437254309654,
+ 0.01747160218656063,
+ 0.017498185858130455
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3840000033378601,
+ "loss_eval": 1.7054094076156616,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 701.634033203125,
+ 1090.699462890625,
+ 1255.5677490234375,
+ 1178.950927734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005554261151701212,
+ 0.0003436058177612722,
+ 0.0003414751263335347,
+ 0.0003412873193155974,
+ 0.0003412757650949061
+ ],
+ "bp_grad_F": [
+ 0.025991667062044144,
+ 0.018797792494297028,
+ 0.01875895820558071,
+ 0.018737811595201492,
+ 0.01877579651772976
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.2985000014305115,
+ "loss_eval": 1.9454095363616943,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 718.1909790039062,
+ 1114.3717041015625,
+ 1283.2196044921875,
+ 1204.0418701171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005466453148983419,
+ 0.00032576482044532895,
+ 0.00032447546254843473,
+ 0.0003244927211198956,
+ 0.0003245829720981419
+ ],
+ "bp_grad_F": [
+ 0.025174839422106743,
+ 0.01795799843966961,
+ 0.01791331358253956,
+ 0.017896415665745735,
+ 0.017930971458554268
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3190000057220459,
+ "loss_eval": 1.9117376804351807,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 734.4074096679688,
+ 1137.696044921875,
+ 1310.3448486328125,
+ 1228.5693359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005316757597029209,
+ 0.00032565969740971923,
+ 0.00032383095822297037,
+ 0.00032448669662699103,
+ 0.0003247321583330631
+ ],
+ "bp_grad_F": [
+ 0.024759862571954727,
+ 0.01794862188398838,
+ 0.01790694147348404,
+ 0.017891528084874153,
+ 0.017931628972291946
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3320000171661377,
+ "loss_eval": 1.8898653984069824,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 749.4878540039062,
+ 1159.565185546875,
+ 1335.8013916015625,
+ 1251.6041259765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005168311763554811,
+ 0.00031509375548921525,
+ 0.0003133788122795522,
+ 0.0003133984573651105,
+ 0.0003139932523481548
+ ],
+ "bp_grad_F": [
+ 0.0242743082344532,
+ 0.01778865046799183,
+ 0.0177480336278677,
+ 0.017732009291648865,
+ 0.01776931621134281
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3360000252723694,
+ "loss_eval": 1.809171199798584,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 763.5787353515625,
+ 1180.0230712890625,
+ 1359.6865234375,
+ 1273.1715087890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005242779734544456,
+ 0.0003271555178798735,
+ 0.00032485066913068295,
+ 0.0003253788163419813,
+ 0.00032494115293957293
+ ],
+ "bp_grad_F": [
+ 0.024425320327281952,
+ 0.01821528747677803,
+ 0.018175508826971054,
+ 0.018160372972488403,
+ 0.01819770224392414
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3290000259876251,
+ "loss_eval": 1.8727153539657593,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 777.29833984375,
+ 1199.8975830078125,
+ 1382.7962646484375,
+ 1294.0777587890625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005091701750643551,
+ 0.0003165322996210307,
+ 0.00031451781978830695,
+ 0.00031486450461670756,
+ 0.00031427579233422875
+ ],
+ "bp_grad_F": [
+ 0.023803148418664932,
+ 0.017688797786831856,
+ 0.017653871327638626,
+ 0.01764090545475483,
+ 0.017672821879386902
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3570000231266022,
+ "loss_eval": 1.7817366123199463,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 789.7103881835938,
+ 1218.070556640625,
+ 1403.869384765625,
+ 1313.1611328125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000508163939230144,
+ 0.00031658579246141016,
+ 0.0003145384253002703,
+ 0.0003149410185869783,
+ 0.000314467353746295
+ ],
+ "bp_grad_F": [
+ 0.023785017430782318,
+ 0.017845386639237404,
+ 0.01781085878610611,
+ 0.017796490341424942,
+ 0.017827292904257774
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3255000114440918,
+ "loss_eval": 1.9139658212661743,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 801.9373779296875,
+ 1235.8994140625,
+ 1424.5323486328125,
+ 1331.8375244140625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004862714558839798,
+ 0.0002926513261627406,
+ 0.0002908864407800138,
+ 0.0002910781477112323,
+ 0.0002900509862229228
+ ],
+ "bp_grad_F": [
+ 0.023361189290881157,
+ 0.01766069605946541,
+ 0.01763027161359787,
+ 0.017619280144572258,
+ 0.017652587965130806
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.36100003123283386,
+ "loss_eval": 1.8068753480911255,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 813.853515625,
+ 1253.337890625,
+ 1444.873779296875,
+ 1350.2630615234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00048765321844257414,
+ 0.000307347479974851,
+ 0.00030599997262470424,
+ 0.000306078844005242,
+ 0.000305346620734781
+ ],
+ "bp_grad_F": [
+ 0.023688213899731636,
+ 0.01818004995584488,
+ 0.018153388053178787,
+ 0.018142297863960266,
+ 0.018173247575759888
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3360000252723694,
+ "loss_eval": 1.8813791275024414,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 824.7192993164062,
+ 1269.39208984375,
+ 1463.5384521484375,
+ 1367.15625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004835445433855057,
+ 0.0003096247965004295,
+ 0.0003079361922573298,
+ 0.00030804326524958014,
+ 0.0003073872940149158
+ ],
+ "bp_grad_F": [
+ 0.02330639213323593,
+ 0.01797325722873211,
+ 0.0179448202252388,
+ 0.017932146787643433,
+ 0.0179706122726202
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34150001406669617,
+ "loss_eval": 1.8429521322250366,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 834.9524536132812,
+ 1284.4827880859375,
+ 1481.0673828125,
+ 1383.0155029296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047791830729693174,
+ 0.0003027814091183245,
+ 0.0003019821015186608,
+ 0.0003020255535375327,
+ 0.0003012260131072253
+ ],
+ "bp_grad_F": [
+ 0.02303098328411579,
+ 0.01771283708512783,
+ 0.01768432930111885,
+ 0.017673376947641373,
+ 0.01770668476819992
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34850001335144043,
+ "loss_eval": 1.8080617189407349,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 844.5447998046875,
+ 1298.628662109375,
+ 1497.57373046875,
+ 1397.9241943359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000483115843962878,
+ 0.0003182529762852937,
+ 0.00031743990257382393,
+ 0.0003175203746650368,
+ 0.0003175794845446944
+ ],
+ "bp_grad_F": [
+ 0.02306683361530304,
+ 0.01790531352162361,
+ 0.017880147323012352,
+ 0.017869742587208748,
+ 0.017903709784150124
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.33100003004074097,
+ "loss_eval": 1.8166543245315552,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 853.7017822265625,
+ 1312.1446533203125,
+ 1513.2933349609375,
+ 1412.1080322265625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047640595585107803,
+ 0.00031948628020472825,
+ 0.00031817753915674984,
+ 0.00031873476109467447,
+ 0.0003185000387020409
+ ],
+ "bp_grad_F": [
+ 0.022898783907294273,
+ 0.017956143245100975,
+ 0.017929796129465103,
+ 0.017917128279805183,
+ 0.017962384968996048
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.33800002932548523,
+ "loss_eval": 1.8004838228225708,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 862.0558471679688,
+ 1324.4920654296875,
+ 1527.697509765625,
+ 1425.1290283203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004698090488091111,
+ 0.00029860963695682585,
+ 0.0002971645735669881,
+ 0.0002974079397972673,
+ 0.00029624722083099186
+ ],
+ "bp_grad_F": [
+ 0.022676818072795868,
+ 0.01772218942642212,
+ 0.017698047682642937,
+ 0.017688868567347527,
+ 0.01772254891693592
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3530000150203705,
+ "loss_eval": 1.8075289726257324,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 869.9756469726562,
+ 1336.185791015625,
+ 1541.3792724609375,
+ 1437.4677734375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004706987820100039,
+ 0.0003098493325524032,
+ 0.0003085599164478481,
+ 0.0003086493816226721,
+ 0.0003082384937442839
+ ],
+ "bp_grad_F": [
+ 0.022675253450870514,
+ 0.01779225468635559,
+ 0.017767589539289474,
+ 0.017757505178451538,
+ 0.017791779711842537
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34150001406669617,
+ "loss_eval": 1.827038288116455,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 877.3834838867188,
+ 1347.156982421875,
+ 1554.1087646484375,
+ 1448.9537353515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000473314750706777,
+ 0.00030716857872903347,
+ 0.0003054763947147876,
+ 0.0003060955787077546,
+ 0.0003047685313504189
+ ],
+ "bp_grad_F": [
+ 0.02272479608654976,
+ 0.01781822182238102,
+ 0.017794664949178696,
+ 0.01778644695878029,
+ 0.01781868003308773
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.32450002431869507,
+ "loss_eval": 1.8790045976638794,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 884.1793212890625,
+ 1357.25146484375,
+ 1565.88232421875,
+ 1459.538818359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046717250370420516,
+ 0.00030950061045587063,
+ 0.000308411312289536,
+ 0.00030838610837236047,
+ 0.00030820758547633886
+ ],
+ "bp_grad_F": [
+ 0.02260792814195156,
+ 0.017898347228765488,
+ 0.017876161262392998,
+ 0.017865851521492004,
+ 0.01790330745279789
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3225000202655792,
+ "loss_eval": 1.8583427667617798,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 890.4108276367188,
+ 1366.517333984375,
+ 1576.69921875,
+ 1469.300537109375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004612848279066384,
+ 0.00030920191784389317,
+ 0.0003086488868575543,
+ 0.0003085103817284107,
+ 0.0003084034251514822
+ ],
+ "bp_grad_F": [
+ 0.022702287882566452,
+ 0.018074622377753258,
+ 0.01805359311401844,
+ 0.018043993040919304,
+ 0.018074078485369682
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.33250001072883606,
+ "loss_eval": 1.8819878101348877,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 896.1082763671875,
+ 1374.973388671875,
+ 1586.524169921875,
+ 1478.1490478515625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046731752809137106,
+ 0.0003127296222373843,
+ 0.00031115938327275217,
+ 0.0003112337435595691,
+ 0.00031117399339564145
+ ],
+ "bp_grad_F": [
+ 0.022609086707234383,
+ 0.018025977537035942,
+ 0.01800408773124218,
+ 0.017995676025748253,
+ 0.018028175458312035
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3150000274181366,
+ "loss_eval": 1.8731034994125366,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 901.4246826171875,
+ 1382.871337890625,
+ 1595.7164306640625,
+ 1486.465576171875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004559764638543129,
+ 0.00029873938183300197,
+ 0.00029821961652487516,
+ 0.0002982193836942315,
+ 0.0002976148098241538
+ ],
+ "bp_grad_F": [
+ 0.022443631663918495,
+ 0.017807144671678543,
+ 0.01778426393866539,
+ 0.017775312066078186,
+ 0.017809107899665833
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3190000057220459,
+ "loss_eval": 1.9132741689682007,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 906.219970703125,
+ 1389.97998046875,
+ 1603.95458984375,
+ 1493.869384765625
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00045692393905483186,
+ 0.000307796144625172,
+ 0.0003068537334911525,
+ 0.0003067644138354808,
+ 0.0003064550110138953
+ ],
+ "bp_grad_F": [
+ 0.022245025262236595,
+ 0.017795003950595856,
+ 0.0177734587341547,
+ 0.017764581367373466,
+ 0.017800522968173027
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3270000219345093,
+ "loss_eval": 1.8190391063690186,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 910.5570678710938,
+ 1396.3927001953125,
+ 1611.4957275390625,
+ 1500.6524658203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00045115925604477525,
+ 0.00029847086989320815,
+ 0.0002977230178657919,
+ 0.0002977572148665786,
+ 0.0002975583774968982
+ ],
+ "bp_grad_F": [
+ 0.02203645370900631,
+ 0.017681924626231194,
+ 0.01766141690313816,
+ 0.017652763053774834,
+ 0.0176865067332983
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35500001907348633,
+ "loss_eval": 1.7965762615203857,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 914.5003662109375,
+ 1402.2757568359375,
+ 1618.2999267578125,
+ 1506.7991943359375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004569143056869507,
+ 0.00029972344054840505,
+ 0.0002987241605296731,
+ 0.0002987434563692659,
+ 0.00029907189309597015
+ ],
+ "bp_grad_F": [
+ 0.022272884845733643,
+ 0.01781252957880497,
+ 0.017791228368878365,
+ 0.017782466486096382,
+ 0.017818717285990715
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.328000009059906,
+ "loss_eval": 1.8610442876815796,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 918.0006103515625,
+ 1407.5118408203125,
+ 1624.3853759765625,
+ 1512.30029296875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00045414711348712444,
+ 0.00030931030050851405,
+ 0.0003081976028624922,
+ 0.0003081892791669816,
+ 0.0003081847680732608
+ ],
+ "bp_grad_F": [
+ 0.022085461765527725,
+ 0.01779778115451336,
+ 0.017776912078261375,
+ 0.017768092453479767,
+ 0.01780613884329796
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34300002455711365,
+ "loss_eval": 1.804802417755127,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 921.121826171875,
+ 1412.175537109375,
+ 1629.830810546875,
+ 1517.2005615234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004531690792646259,
+ 0.00031135816243477166,
+ 0.00031044447678141296,
+ 0.00031072759884409606,
+ 0.0003106470685452223
+ ],
+ "bp_grad_F": [
+ 0.022044293582439423,
+ 0.017750630155205727,
+ 0.017730476334691048,
+ 0.017722314223647118,
+ 0.017757223919034004
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34150001406669617,
+ "loss_eval": 1.8111987113952637,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 923.8903198242188,
+ 1416.300048828125,
+ 1634.646484375,
+ 1521.5411376953125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004468595434445888,
+ 0.0003022409218829125,
+ 0.00030127677018754184,
+ 0.00030117464484646916,
+ 0.00030144210904836655
+ ],
+ "bp_grad_F": [
+ 0.02193099819123745,
+ 0.017699316143989563,
+ 0.017679594457149506,
+ 0.017671333625912666,
+ 0.017706507816910744
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3525000214576721,
+ "loss_eval": 1.797281265258789,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 926.2950439453125,
+ 1419.8856201171875,
+ 1638.8184814453125,
+ 1525.284423828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044905568938702345,
+ 0.00030229080584831536,
+ 0.00030173707637004554,
+ 0.0003015522670466453,
+ 0.0003012538072653115
+ ],
+ "bp_grad_F": [
+ 0.021881939843297005,
+ 0.017657367512583733,
+ 0.017637958750128746,
+ 0.017629873007535934,
+ 0.01766354590654373
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34800001978874207,
+ "loss_eval": 1.8036439418792725,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 928.36181640625,
+ 1422.943359375,
+ 1642.3917236328125,
+ 1528.47705078125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004465414967853576,
+ 0.00030299098580144346,
+ 0.00030190899269655347,
+ 0.00030191292171366513,
+ 0.000301982625387609
+ ],
+ "bp_grad_F": [
+ 0.02188783325254917,
+ 0.01768629439175129,
+ 0.01766696758568287,
+ 0.017658723518252373,
+ 0.017692700028419495
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.359000027179718,
+ "loss_eval": 1.7996938228607178,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 930.1182861328125,
+ 1425.561279296875,
+ 1645.422607421875,
+ 1531.2088623046875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004439539334271103,
+ 0.00030093194800429046,
+ 0.00030001465347595513,
+ 0.0003001568838953972,
+ 0.0002998457639478147
+ ],
+ "bp_grad_F": [
+ 0.021926432847976685,
+ 0.01775786094367504,
+ 0.017738472670316696,
+ 0.01773017831146717,
+ 0.01776653714478016
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.8030681610107422,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 931.579345703125,
+ 1427.7337646484375,
+ 1647.9693603515625,
+ 1533.509033203125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044511700980365276,
+ 0.00030080872238613665,
+ 0.00030003004940226674,
+ 0.0003000932920258492,
+ 0.00029993904172442853
+ ],
+ "bp_grad_F": [
+ 0.021828416734933853,
+ 0.017681054770946503,
+ 0.017661932855844498,
+ 0.017653752118349075,
+ 0.017688728868961334
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.7960853576660156,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 932.7696533203125,
+ 1429.520751953125,
+ 1650.0577392578125,
+ 1535.389892578125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004446738166734576,
+ 0.0003006414044648409,
+ 0.00030009649344719946,
+ 0.0003001675067935139,
+ 0.00029965140856802464
+ ],
+ "bp_grad_F": [
+ 0.021837500855326653,
+ 0.01768680103123188,
+ 0.017667656764388084,
+ 0.017659684643149376,
+ 0.017694275826215744
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35450002551078796,
+ "loss_eval": 1.8004000186920166,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 933.7157592773438,
+ 1430.9381103515625,
+ 1651.7154541015625,
+ 1536.879638671875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044473307207226753,
+ 0.00030047594918869436,
+ 0.0002997968113049865,
+ 0.00029963525594212115,
+ 0.00029955641366541386
+ ],
+ "bp_grad_F": [
+ 0.0217889491468668,
+ 0.01765742339193821,
+ 0.01763851009309292,
+ 0.01763063855469227,
+ 0.017664924263954163
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3555000126361847,
+ "loss_eval": 1.7942780256271362,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 934.4593505859375,
+ 1432.0382080078125,
+ 1652.9989013671875,
+ 1538.0234375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004453740257304162,
+ 0.0003002033627126366,
+ 0.00029949398594908416,
+ 0.00029964259010739625,
+ 0.0002993734087795019
+ ],
+ "bp_grad_F": [
+ 0.021799130365252495,
+ 0.017666727304458618,
+ 0.0176478810608387,
+ 0.017639974132180214,
+ 0.017674267292022705
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.34550002217292786,
+ "loss_eval": 1.800949215888977,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 934.9984741210938,
+ 1432.84814453125,
+ 1653.939697265625,
+ 1538.8624267578125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044546957360580564,
+ 0.0003038236463908106,
+ 0.000302964064758271,
+ 0.00030298702768050134,
+ 0.00030283271917141974
+ ],
+ "bp_grad_F": [
+ 0.021853182464838028,
+ 0.017717286944389343,
+ 0.017698239535093307,
+ 0.017690137028694153,
+ 0.01772582344710827
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35600000619888306,
+ "loss_eval": 1.800832986831665,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.3856201171875,
+ 1433.427490234375,
+ 1654.6126708984375,
+ 1539.4669189453125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044487748527899384,
+ 0.00030164900817908347,
+ 0.00030081532895565033,
+ 0.00030082385637797415,
+ 0.000300481216982007
+ ],
+ "bp_grad_F": [
+ 0.02177177555859089,
+ 0.017657004296779633,
+ 0.017638202756643295,
+ 0.017630264163017273,
+ 0.01766461506485939
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3490000069141388,
+ "loss_eval": 1.794891119003296,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.636474609375,
+ 1433.79345703125,
+ 1655.038330078125,
+ 1539.8505859375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004437313473317772,
+ 0.00030232034623622894,
+ 0.0003012971137650311,
+ 0.00030129036167636514,
+ 0.00030084658646956086
+ ],
+ "bp_grad_F": [
+ 0.021787401288747787,
+ 0.0176764614880085,
+ 0.017657602205872536,
+ 0.017649594694375992,
+ 0.017684470862150192
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35350000858306885,
+ "loss_eval": 1.7952260971069336,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.7716064453125,
+ 1433.996826171875,
+ 1655.2738037109375,
+ 1540.06298828125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044510490261018276,
+ 0.0003025131591130048,
+ 0.00030167156364768744,
+ 0.0003019055584445596,
+ 0.00030186952790245414
+ ],
+ "bp_grad_F": [
+ 0.02179691381752491,
+ 0.017687244340777397,
+ 0.017668338492512703,
+ 0.017660312354564667,
+ 0.01769554615020752
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35200002789497375,
+ "loss_eval": 1.7945536375045776,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.8350830078125,
+ 1434.09326171875,
+ 1655.3861083984375,
+ 1540.164794921875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044426857493817806,
+ 0.0003006447514053434,
+ 0.0002995560353156179,
+ 0.0002996143593918532,
+ 0.0002996891853399575
+ ],
+ "bp_grad_F": [
+ 0.02177303098142147,
+ 0.017660290002822876,
+ 0.017641469836235046,
+ 0.017633574083447456,
+ 0.01766815222799778
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.35850000381469727,
+ "loss_eval": 1.7939436435699463,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 11.269571304321289,
+ 935.8506469726562,
+ 1434.11669921875,
+ 1655.4130859375,
+ 1540.189208984375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00044382456690073013,
+ 0.0003010118380188942,
+ 0.0003002960584126413,
+ 0.00030042475555092096,
+ 0.00029991925111971796
+ ],
+ "bp_grad_F": [
+ 0.021775126457214355,
+ 0.01766343042254448,
+ 0.017644599080085754,
+ 0.017636677250266075,
+ 0.017671329900622368
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.3595000207424164,
+ "loss_eval": 1.7936068773269653,
+ "epoch": 80
+ }
+ ],
+ "seed": 42,
+ "alpha": 1.0,
+ "depth": 4,
+ "d_hidden": 128
+} \ No newline at end of file