summaryrefslogtreecommitdiff
path: root/results/snapshot_vit_v1/snapshot_vit_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_vit_v1/snapshot_vit_s42.json')
-rw-r--r--results/snapshot_vit_v1/snapshot_vit_s42.json4594
1 files changed, 4594 insertions, 0 deletions
diff --git a/results/snapshot_vit_v1/snapshot_vit_s42.json b/results/snapshot_vit_v1/snapshot_vit_s42.json
new file mode 100644
index 0000000..569af46
--- /dev/null
+++ b/results/snapshot_vit_v1/snapshot_vit_s42.json
@@ -0,0 +1,4594 @@
+{
+ "config": {
+ "output_dir": "results/snapshot_vit_v1",
+ "epochs": 60,
+ "lr": 0.001,
+ "wd": 0.05,
+ "seed": 42,
+ "depth": 4,
+ "d_model": 128,
+ "n_heads": 4
+ },
+ "depth": 4,
+ "d_model": 128,
+ "architecture": "ViTMini",
+ "bp_log": [
+ {
+ "hidden_norms_cls": [
+ 0.31052109599113464,
+ 3.2536301612854004,
+ 4.7681732177734375,
+ 6.129599571228027,
+ 7.124356746673584
+ ],
+ "hidden_norms_avg": [
+ 6.008513927459717,
+ 7.034290313720703,
+ 7.942849636077881,
+ 8.915729522705078,
+ 9.635361671447754
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.004442029166966677,
+ 0.0012008437188342214,
+ 0.0009976272704079747,
+ 0.0009104337659664452,
+ 0.0008558662957511842
+ ],
+ "bp_grad_F": [
+ 0.18535660207271576,
+ 0.03968670591711998,
+ 0.032604776322841644,
+ 0.029427478089928627,
+ 0.02746850810945034
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.1376953125,
+ "loss_eval": 2.35188627243042,
+ "epoch": 0
+ },
+ {
+ "hidden_norms_cls": [
+ 0.511958122253418,
+ 12.453446388244629,
+ 18.366989135742188,
+ 25.54116439819336,
+ 31.80699348449707
+ ],
+ "hidden_norms_avg": [
+ 4.10694694519043,
+ 10.166566848754883,
+ 14.66998291015625,
+ 19.93342399597168,
+ 25.32619857788086
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0019771556835621595,
+ 0.00022324378369376063,
+ 0.00016308785416185856,
+ 0.00014621105219703168,
+ 0.0001451292191632092
+ ],
+ "bp_grad_F": [
+ 0.11066891252994537,
+ 0.01034498494118452,
+ 0.006372526753693819,
+ 0.0052248528227210045,
+ 0.005017552524805069
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.4501953125,
+ "loss_eval": 1.5154438018798828,
+ "epoch": 1
+ },
+ {
+ "hidden_norms_cls": [
+ 0.6518111824989319,
+ 13.549692153930664,
+ 20.607715606689453,
+ 27.90418243408203,
+ 32.70498275756836
+ ],
+ "hidden_norms_avg": [
+ 4.0909905433654785,
+ 11.942686080932617,
+ 17.39116096496582,
+ 22.200014114379883,
+ 26.230010986328125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0017800139030441642,
+ 0.00026728332159109414,
+ 0.0001720335567370057,
+ 0.0001423172070644796,
+ 0.00013423117343336344
+ ],
+ "bp_grad_F": [
+ 0.08781559765338898,
+ 0.010987765155732632,
+ 0.0064147054217755795,
+ 0.0050079175271093845,
+ 0.004637593869119883
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.494140625,
+ "loss_eval": 1.3824832439422607,
+ "epoch": 2
+ },
+ {
+ "hidden_norms_cls": [
+ 0.755299985408783,
+ 11.224863052368164,
+ 19.053363800048828,
+ 27.303081512451172,
+ 33.078182220458984
+ ],
+ "hidden_norms_avg": [
+ 4.027151584625244,
+ 12.449769973754883,
+ 17.769508361816406,
+ 22.97556495666504,
+ 27.065759658813477
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0018998769810423255,
+ 0.00030996452551335096,
+ 0.00018013815861195326,
+ 0.0001340982416877523,
+ 0.00012205552775412798
+ ],
+ "bp_grad_F": [
+ 0.09037011116743088,
+ 0.013488140888512135,
+ 0.007346263621002436,
+ 0.0051797907799482346,
+ 0.004589984193444252
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.5439453125,
+ "loss_eval": 1.2540550231933594,
+ "epoch": 3
+ },
+ {
+ "hidden_norms_cls": [
+ 0.844818651676178,
+ 13.648336410522461,
+ 20.277976989746094,
+ 28.240915298461914,
+ 33.095726013183594
+ ],
+ "hidden_norms_avg": [
+ 4.036877632141113,
+ 12.003630638122559,
+ 17.05451011657715,
+ 22.15869903564453,
+ 25.917491912841797
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016167981084436178,
+ 0.00028610811568796635,
+ 0.0001777650322765112,
+ 0.00012878721463494003,
+ 0.0001112063619075343
+ ],
+ "bp_grad_F": [
+ 0.07410340011119843,
+ 0.012637714855372906,
+ 0.007633093744516373,
+ 0.005242784973233938,
+ 0.004431390203535557
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.1045944690704346,
+ "epoch": 4
+ },
+ {
+ "hidden_norms_cls": [
+ 0.9051892161369324,
+ 12.476008415222168,
+ 19.24710464477539,
+ 27.6123046875,
+ 32.35737609863281
+ ],
+ "hidden_norms_avg": [
+ 4.138596057891846,
+ 12.409324645996094,
+ 17.427003860473633,
+ 22.245147705078125,
+ 25.471385955810547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0016044765943661332,
+ 0.00030248358962126076,
+ 0.00018807635933626443,
+ 0.00013626758300233632,
+ 0.00011398641800042242
+ ],
+ "bp_grad_F": [
+ 0.08322811126708984,
+ 0.01390017382800579,
+ 0.008505746722221375,
+ 0.005747759714722633,
+ 0.004776888992637396
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.1296963691711426,
+ "epoch": 5
+ },
+ {
+ "hidden_norms_cls": [
+ 0.9687634110450745,
+ 11.625859260559082,
+ 18.38014793395996,
+ 26.869504928588867,
+ 31.455507278442383
+ ],
+ "hidden_norms_avg": [
+ 4.263001441955566,
+ 13.1234769821167,
+ 17.853057861328125,
+ 22.476547241210938,
+ 25.29656410217285
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0015340449754148722,
+ 0.00033552697277627885,
+ 0.00021536082203965634,
+ 0.00015067037020344287,
+ 0.00012220896314829588
+ ],
+ "bp_grad_F": [
+ 0.07571946829557419,
+ 0.015132292173802853,
+ 0.009512492455542088,
+ 0.006373303942382336,
+ 0.005029390100389719
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.603515625,
+ "loss_eval": 1.0963702201843262,
+ "epoch": 6
+ },
+ {
+ "hidden_norms_cls": [
+ 1.0029383897781372,
+ 12.687585830688477,
+ 19.734830856323242,
+ 28.174379348754883,
+ 32.5982780456543
+ ],
+ "hidden_norms_avg": [
+ 4.357974052429199,
+ 13.182960510253906,
+ 17.720989227294922,
+ 21.832895278930664,
+ 24.934776306152344
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013370191445574164,
+ 0.00026788320974446833,
+ 0.00018144956266041845,
+ 0.00013219293032307178,
+ 0.00010196284711128101
+ ],
+ "bp_grad_F": [
+ 0.06996501982212067,
+ 0.013071151450276375,
+ 0.008477694354951382,
+ 0.0061036222614347935,
+ 0.004761465825140476
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6416015625,
+ "loss_eval": 0.9737913012504578,
+ "epoch": 7
+ },
+ {
+ "hidden_norms_cls": [
+ 1.043707013130188,
+ 12.487404823303223,
+ 18.845643997192383,
+ 26.870864868164062,
+ 31.145292282104492
+ ],
+ "hidden_norms_avg": [
+ 4.454991340637207,
+ 13.503378868103027,
+ 18.694488525390625,
+ 23.029804229736328,
+ 25.810880661010742
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0013130803126841784,
+ 0.00029930632445029914,
+ 0.0002022052649408579,
+ 0.0001383959170198068,
+ 0.00010439592006150633
+ ],
+ "bp_grad_F": [
+ 0.0743240937590599,
+ 0.015402271412312984,
+ 0.009977605193853378,
+ 0.006877230014652014,
+ 0.005202346481382847
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.666015625,
+ "loss_eval": 0.9317076206207275,
+ "epoch": 8
+ },
+ {
+ "hidden_norms_cls": [
+ 1.0887501239776611,
+ 12.662396430969238,
+ 18.622724533081055,
+ 26.599454879760742,
+ 31.788663864135742
+ ],
+ "hidden_norms_avg": [
+ 4.529710292816162,
+ 13.683384895324707,
+ 18.47463607788086,
+ 22.395898818969727,
+ 25.244558334350586
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0012017677072435617,
+ 0.0002972102665808052,
+ 0.00019775003602262586,
+ 0.00013734954700339586,
+ 9.880279685603455e-05
+ ],
+ "bp_grad_F": [
+ 0.0661192312836647,
+ 0.01516024675220251,
+ 0.010001113638281822,
+ 0.006893018260598183,
+ 0.0051134442910552025
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6669921875,
+ "loss_eval": 0.9026263952255249,
+ "epoch": 9
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1163448095321655,
+ 12.711283683776855,
+ 18.790128707885742,
+ 26.846359252929688,
+ 31.663158416748047
+ ],
+ "hidden_norms_avg": [
+ 4.502295970916748,
+ 13.801639556884766,
+ 18.488975524902344,
+ 22.378704071044922,
+ 25.22056007385254
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0011062510311603546,
+ 0.00029147896566428244,
+ 0.0001970102748600766,
+ 0.00013174059859011322,
+ 0.0001037597976392135
+ ],
+ "bp_grad_F": [
+ 0.06217500939965248,
+ 0.014721231535077095,
+ 0.00993143580853939,
+ 0.006723989732563496,
+ 0.005166618153452873
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.6845703125,
+ "loss_eval": 0.8660677671432495,
+ "epoch": 10
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1505078077316284,
+ 12.160571098327637,
+ 18.15353012084961,
+ 25.762012481689453,
+ 31.478300094604492
+ ],
+ "hidden_norms_avg": [
+ 4.5605149269104,
+ 13.918573379516602,
+ 18.88881492614746,
+ 22.79344940185547,
+ 25.800094604492188
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009689349099062383,
+ 0.0002486997109372169,
+ 0.0001736732665449381,
+ 0.00011473154881969094,
+ 8.573567902203649e-05
+ ],
+ "bp_grad_F": [
+ 0.06455213576555252,
+ 0.01547171175479889,
+ 0.010573537088930607,
+ 0.0071961241774261,
+ 0.005212985444813967
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.71484375,
+ "loss_eval": 0.812907874584198,
+ "epoch": 11
+ },
+ {
+ "hidden_norms_cls": [
+ 1.1844152212142944,
+ 11.332664489746094,
+ 16.57625961303711,
+ 23.82307243347168,
+ 28.492321014404297
+ ],
+ "hidden_norms_avg": [
+ 4.602160453796387,
+ 13.876313209533691,
+ 17.891036987304688,
+ 21.410982131958008,
+ 23.97108268737793
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009290817542932928,
+ 0.0002613075776025653,
+ 0.0001877332106232643,
+ 0.0001262558507733047,
+ 9.168039832729846e-05
+ ],
+ "bp_grad_F": [
+ 0.06392678618431091,
+ 0.01674485206604004,
+ 0.011727217584848404,
+ 0.007738997228443623,
+ 0.005730107892304659
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7197265625,
+ "loss_eval": 0.7641609907150269,
+ "epoch": 12
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2184560298919678,
+ 12.450925827026367,
+ 18.076860427856445,
+ 25.162586212158203,
+ 30.365047454833984
+ ],
+ "hidden_norms_avg": [
+ 4.7080278396606445,
+ 13.851634979248047,
+ 18.517131805419922,
+ 22.074214935302734,
+ 24.72054100036621
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009277731878682971,
+ 0.00024563330225646496,
+ 0.00017736255540512502,
+ 0.00012202116340631619,
+ 8.748921391088516e-05
+ ],
+ "bp_grad_F": [
+ 0.06389915198087692,
+ 0.016115156933665276,
+ 0.0110858753323555,
+ 0.0076499818824231625,
+ 0.005541808437556028
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.697265625,
+ "loss_eval": 0.8037601113319397,
+ "epoch": 13
+ },
+ {
+ "hidden_norms_cls": [
+ 1.243064045906067,
+ 11.932015419006348,
+ 17.215856552124023,
+ 24.764291763305664,
+ 29.49314308166504
+ ],
+ "hidden_norms_avg": [
+ 4.651937961578369,
+ 13.890728950500488,
+ 18.2476749420166,
+ 21.80103302001953,
+ 24.145692825317383
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009111211402341723,
+ 0.000253814272582531,
+ 0.00018247529806103557,
+ 0.00011639296280918643,
+ 8.364167297258973e-05
+ ],
+ "bp_grad_F": [
+ 0.06324896216392517,
+ 0.016394753009080887,
+ 0.01153184287250042,
+ 0.007614497095346451,
+ 0.0056136660277843475
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.728515625,
+ "loss_eval": 0.7384279370307922,
+ "epoch": 14
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2652677297592163,
+ 11.532588005065918,
+ 16.7224178314209,
+ 23.326444625854492,
+ 28.03766441345215
+ ],
+ "hidden_norms_avg": [
+ 4.652615547180176,
+ 13.981542587280273,
+ 17.984512329101562,
+ 21.317432403564453,
+ 23.233760833740234
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0008032417972572148,
+ 0.00022395161795429885,
+ 0.00016904002404771745,
+ 0.0001078559216693975,
+ 7.841538899810985e-05
+ ],
+ "bp_grad_F": [
+ 0.06386830657720566,
+ 0.016731705516576767,
+ 0.012135310098528862,
+ 0.008108492009341717,
+ 0.006046997383236885
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7333984375,
+ "loss_eval": 0.7387630939483643,
+ "epoch": 15
+ },
+ {
+ "hidden_norms_cls": [
+ 1.2944419384002686,
+ 11.34481430053711,
+ 16.45362091064453,
+ 22.63861846923828,
+ 28.011232376098633
+ ],
+ "hidden_norms_avg": [
+ 4.738389015197754,
+ 13.769956588745117,
+ 17.63072395324707,
+ 21.14189338684082,
+ 23.455045700073242
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007927753031253815,
+ 0.0002345799293834716,
+ 0.00016934113227762282,
+ 0.00011508075840538368,
+ 7.966109114931896e-05
+ ],
+ "bp_grad_F": [
+ 0.0655454769730568,
+ 0.01815187744796276,
+ 0.013005951419472694,
+ 0.008820701390504837,
+ 0.006184164900332689
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7255859375,
+ "loss_eval": 0.7302451133728027,
+ "epoch": 16
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3085625171661377,
+ 11.323317527770996,
+ 15.866230964660645,
+ 21.746976852416992,
+ 27.081127166748047
+ ],
+ "hidden_norms_avg": [
+ 4.687533855438232,
+ 13.471115112304688,
+ 17.396968841552734,
+ 20.327377319335938,
+ 22.58539581298828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006625292589887977,
+ 0.00019486426026560366,
+ 0.00014659677981399,
+ 9.787825547391549e-05,
+ 6.321907130768523e-05
+ ],
+ "bp_grad_F": [
+ 0.07393868267536163,
+ 0.020178642123937607,
+ 0.014442694373428822,
+ 0.009784683585166931,
+ 0.00656729843467474
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7412109375,
+ "loss_eval": 0.7063955068588257,
+ "epoch": 17
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3433176279067993,
+ 10.762125968933105,
+ 15.129413604736328,
+ 21.06867790222168,
+ 26.1944522857666
+ ],
+ "hidden_norms_avg": [
+ 4.709607124328613,
+ 13.69739055633545,
+ 17.006061553955078,
+ 19.97213363647461,
+ 22.212177276611328
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006978239398449659,
+ 0.00021396303782239556,
+ 0.00016030693950597197,
+ 0.00010856003791559488,
+ 6.917239079484716e-05
+ ],
+ "bp_grad_F": [
+ 0.06653428077697754,
+ 0.019508732482790947,
+ 0.014456766657531261,
+ 0.010107609443366528,
+ 0.006681134924292564
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.75,
+ "loss_eval": 0.6990396976470947,
+ "epoch": 18
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3607734441757202,
+ 10.718966484069824,
+ 15.383923530578613,
+ 21.34387969970703,
+ 26.49329376220703
+ ],
+ "hidden_norms_avg": [
+ 4.7122907638549805,
+ 13.804581642150879,
+ 17.532636642456055,
+ 20.843929290771484,
+ 23.01592254638672
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007053805165924132,
+ 0.0002122409496223554,
+ 0.00016182110994122922,
+ 0.00011085433652624488,
+ 7.204789289971814e-05
+ ],
+ "bp_grad_F": [
+ 0.06105736270546913,
+ 0.017779415473341942,
+ 0.013269647024571896,
+ 0.009227588772773743,
+ 0.006410240661352873
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7763671875,
+ "loss_eval": 0.6498311758041382,
+ "epoch": 19
+ },
+ {
+ "hidden_norms_cls": [
+ 1.3752704858779907,
+ 10.530582427978516,
+ 14.803340911865234,
+ 20.217910766601562,
+ 25.20522689819336
+ ],
+ "hidden_norms_avg": [
+ 4.7595720291137695,
+ 13.601245880126953,
+ 17.491943359375,
+ 20.960437774658203,
+ 22.910301208496094
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006476694834418595,
+ 0.00020479912927839905,
+ 0.0001524801627965644,
+ 0.00010630583710735664,
+ 6.906194903422147e-05
+ ],
+ "bp_grad_F": [
+ 0.06572327762842178,
+ 0.019566379487514496,
+ 0.01484121847897768,
+ 0.010426007211208344,
+ 0.006943442393094301
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.763671875,
+ "loss_eval": 0.6451045274734497,
+ "epoch": 20
+ },
+ {
+ "hidden_norms_cls": [
+ 1.394100546836853,
+ 9.805717468261719,
+ 14.102628707885742,
+ 19.18745231628418,
+ 24.205224990844727
+ ],
+ "hidden_norms_avg": [
+ 4.746951580047607,
+ 13.343804359436035,
+ 16.609134674072266,
+ 19.829851150512695,
+ 21.580671310424805
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006192427244968712,
+ 0.0002108582411892712,
+ 0.0001636892993701622,
+ 0.0001098570428439416,
+ 6.864540046080947e-05
+ ],
+ "bp_grad_F": [
+ 0.06809430569410324,
+ 0.02151457779109478,
+ 0.01606965810060501,
+ 0.011247958056628704,
+ 0.007375919260084629
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7705078125,
+ "loss_eval": 0.6522111892700195,
+ "epoch": 21
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4160058498382568,
+ 9.728543281555176,
+ 13.389554977416992,
+ 18.542705535888672,
+ 23.791994094848633
+ ],
+ "hidden_norms_avg": [
+ 4.738738536834717,
+ 13.15449333190918,
+ 16.28533172607422,
+ 19.581254959106445,
+ 21.488550186157227
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006278376094996929,
+ 0.00020051853789482266,
+ 0.00015803576388861984,
+ 0.0001043542506522499,
+ 6.271857273532078e-05
+ ],
+ "bp_grad_F": [
+ 0.07535671442747116,
+ 0.02472539246082306,
+ 0.01880054548382759,
+ 0.012977317906916142,
+ 0.007879889570176601
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.767578125,
+ "loss_eval": 0.6732022762298584,
+ "epoch": 22
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4301073551177979,
+ 9.656251907348633,
+ 13.501574516296387,
+ 18.518707275390625,
+ 23.49370574951172
+ ],
+ "hidden_norms_avg": [
+ 4.7338972091674805,
+ 12.90231704711914,
+ 15.899849891662598,
+ 18.982860565185547,
+ 20.785310745239258
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005697127780877054,
+ 0.00018775691569317132,
+ 0.00014216902491170913,
+ 9.182754729408771e-05,
+ 5.984708695905283e-05
+ ],
+ "bp_grad_F": [
+ 0.07130222022533417,
+ 0.023520665243268013,
+ 0.017786188051104546,
+ 0.012143870815634727,
+ 0.007813607342541218
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7763671875,
+ "loss_eval": 0.6380050182342529,
+ "epoch": 23
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4623057842254639,
+ 10.028787612915039,
+ 13.687016487121582,
+ 18.426584243774414,
+ 23.602413177490234
+ ],
+ "hidden_norms_avg": [
+ 4.807516574859619,
+ 12.739899635314941,
+ 16.150466918945312,
+ 19.439754486083984,
+ 21.316791534423828
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005416463245637715,
+ 0.00019103426893707365,
+ 0.00014568559709005058,
+ 9.899997530737892e-05,
+ 6.29485584795475e-05
+ ],
+ "bp_grad_F": [
+ 0.07191846519708633,
+ 0.023787740617990494,
+ 0.01782786287367344,
+ 0.012350695207715034,
+ 0.007955120876431465
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7841796875,
+ "loss_eval": 0.6439570784568787,
+ "epoch": 24
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4565976858139038,
+ 9.294268608093262,
+ 12.656200408935547,
+ 17.385971069335938,
+ 21.959299087524414
+ ],
+ "hidden_norms_avg": [
+ 4.774696350097656,
+ 12.394432067871094,
+ 15.230389595031738,
+ 18.10796356201172,
+ 19.88006591796875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005462650442495942,
+ 0.00019751323270611465,
+ 0.00015244862879626453,
+ 0.00010562407260295004,
+ 6.40779035165906e-05
+ ],
+ "bp_grad_F": [
+ 0.07698184996843338,
+ 0.026412304490804672,
+ 0.02022000029683113,
+ 0.013991317711770535,
+ 0.008763212710618973
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7568359375,
+ "loss_eval": 0.6531677842140198,
+ "epoch": 25
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4813296794891357,
+ 9.043482780456543,
+ 12.308734893798828,
+ 16.513948440551758,
+ 21.061283111572266
+ ],
+ "hidden_norms_avg": [
+ 4.7356462478637695,
+ 12.33294677734375,
+ 15.104657173156738,
+ 17.771398544311523,
+ 19.526002883911133
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000557436200324446,
+ 0.0002021614054683596,
+ 0.0001567570143379271,
+ 0.00010984922846546397,
+ 6.634221062995493e-05
+ ],
+ "bp_grad_F": [
+ 0.07777652144432068,
+ 0.027695877477526665,
+ 0.021396547555923462,
+ 0.015052770264446735,
+ 0.009372876025736332
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7744140625,
+ "loss_eval": 0.6539995074272156,
+ "epoch": 26
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4828969240188599,
+ 8.677760124206543,
+ 12.009501457214355,
+ 16.262908935546875,
+ 20.79404067993164
+ ],
+ "hidden_norms_avg": [
+ 4.744379043579102,
+ 12.125540733337402,
+ 14.89413833618164,
+ 17.47431182861328,
+ 18.953710556030273
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005026232684031129,
+ 0.00019721532589755952,
+ 0.00014348917466122657,
+ 0.00010225686855847016,
+ 5.8645866374718025e-05
+ ],
+ "bp_grad_F": [
+ 0.0830698236823082,
+ 0.03011341392993927,
+ 0.023107260465621948,
+ 0.016188694164156914,
+ 0.00968033168464899
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7744140625,
+ "loss_eval": 0.6444424390792847,
+ "epoch": 27
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5019822120666504,
+ 9.1107816696167,
+ 12.172623634338379,
+ 16.5975341796875,
+ 20.453947067260742
+ ],
+ "hidden_norms_avg": [
+ 4.741573333740234,
+ 12.045503616333008,
+ 14.836026191711426,
+ 17.666833877563477,
+ 19.175966262817383
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005040269461460412,
+ 0.00019225970027036965,
+ 0.0001496450131526217,
+ 0.00010478955664439127,
+ 6.137428135843948e-05
+ ],
+ "bp_grad_F": [
+ 0.07822537422180176,
+ 0.02863621897995472,
+ 0.022284477949142456,
+ 0.01552330981940031,
+ 0.009474868886172771
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.6074927449226379,
+ "epoch": 28
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5009087324142456,
+ 8.223862648010254,
+ 11.225082397460938,
+ 15.531359672546387,
+ 19.848068237304688
+ ],
+ "hidden_norms_avg": [
+ 4.69788122177124,
+ 11.848491668701172,
+ 14.342337608337402,
+ 16.882020950317383,
+ 18.197385787963867
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004685261519625783,
+ 0.00017912790644913912,
+ 0.00013862684136256576,
+ 9.223359666066244e-05,
+ 5.140554640092887e-05
+ ],
+ "bp_grad_F": [
+ 0.09127916395664215,
+ 0.03443564847111702,
+ 0.026544470340013504,
+ 0.01809101179242134,
+ 0.010493002831935883
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7783203125,
+ "loss_eval": 0.6329880952835083,
+ "epoch": 29
+ },
+ {
+ "hidden_norms_cls": [
+ 1.509100079536438,
+ 8.238924980163574,
+ 10.995248794555664,
+ 14.927000045776367,
+ 19.032428741455078
+ ],
+ "hidden_norms_avg": [
+ 4.678654193878174,
+ 11.513160705566406,
+ 14.12202262878418,
+ 16.704364776611328,
+ 18.131078720092773
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004594121128320694,
+ 0.00018182865460403264,
+ 0.000145129015436396,
+ 0.00010142508108401671,
+ 5.208289803704247e-05
+ ],
+ "bp_grad_F": [
+ 0.09080124646425247,
+ 0.03489048779010773,
+ 0.027099598199129105,
+ 0.018760183826088905,
+ 0.010796112939715385
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7822265625,
+ "loss_eval": 0.625268816947937,
+ "epoch": 30
+ },
+ {
+ "hidden_norms_cls": [
+ 1.503785252571106,
+ 7.896090030670166,
+ 10.495330810546875,
+ 14.530640602111816,
+ 18.728647232055664
+ ],
+ "hidden_norms_avg": [
+ 4.70166540145874,
+ 11.420204162597656,
+ 13.774767875671387,
+ 16.2652530670166,
+ 17.631481170654297
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00043488750816322863,
+ 0.00017315168224740773,
+ 0.0001335645210929215,
+ 8.99006481631659e-05,
+ 5.126056930748746e-05
+ ],
+ "bp_grad_F": [
+ 0.10076858103275299,
+ 0.039271026849746704,
+ 0.0300181582570076,
+ 0.020545953884720802,
+ 0.011564387008547783
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.771484375,
+ "loss_eval": 0.6479744911193848,
+ "epoch": 31
+ },
+ {
+ "hidden_norms_cls": [
+ 1.505173921585083,
+ 7.728392124176025,
+ 10.420252799987793,
+ 14.133453369140625,
+ 18.110719680786133
+ ],
+ "hidden_norms_avg": [
+ 4.7109880447387695,
+ 11.242951393127441,
+ 13.997397422790527,
+ 16.60598373413086,
+ 17.915313720703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00040974540752358735,
+ 0.0001792571711121127,
+ 0.00014464404375758022,
+ 9.883226448437199e-05,
+ 5.038536983192898e-05
+ ],
+ "bp_grad_F": [
+ 0.09923475980758667,
+ 0.039516862481832504,
+ 0.03056514263153076,
+ 0.021311543881893158,
+ 0.011838918551802635
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7880859375,
+ "loss_eval": 0.6011433601379395,
+ "epoch": 32
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5013800859451294,
+ 7.8755106925964355,
+ 10.452071189880371,
+ 14.013816833496094,
+ 17.622900009155273
+ ],
+ "hidden_norms_avg": [
+ 4.662457466125488,
+ 11.018245697021484,
+ 13.179399490356445,
+ 15.56103515625,
+ 16.739452362060547
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00033098450512625277,
+ 0.0001421417691744864,
+ 0.00011021740647265688,
+ 7.645406731171533e-05,
+ 4.017115134047344e-05
+ ],
+ "bp_grad_F": [
+ 0.09463275969028473,
+ 0.03948793560266495,
+ 0.03067062795162201,
+ 0.021538278087973595,
+ 0.012101472355425358
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8076171875,
+ "loss_eval": 0.5846524238586426,
+ "epoch": 33
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5032685995101929,
+ 7.549060344696045,
+ 10.04562759399414,
+ 13.609556198120117,
+ 17.36180877685547
+ ],
+ "hidden_norms_avg": [
+ 4.688360214233398,
+ 11.03510856628418,
+ 13.660865783691406,
+ 16.024188995361328,
+ 17.242145538330078
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003352685598656535,
+ 0.0001500560319982469,
+ 0.000116633229481522,
+ 8.394405449507758e-05,
+ 4.0652244933880866e-05
+ ],
+ "bp_grad_F": [
+ 0.10540100187063217,
+ 0.044482193887233734,
+ 0.03421863541007042,
+ 0.023781608790159225,
+ 0.012753129936754704
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7861328125,
+ "loss_eval": 0.5960580110549927,
+ "epoch": 34
+ },
+ {
+ "hidden_norms_cls": [
+ 1.5032752752304077,
+ 7.387601375579834,
+ 9.652260780334473,
+ 13.042936325073242,
+ 16.688335418701172
+ ],
+ "hidden_norms_avg": [
+ 4.644099235534668,
+ 10.739524841308594,
+ 13.165095329284668,
+ 15.435381889343262,
+ 16.59172248840332
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003447248600423336,
+ 0.0001518868375569582,
+ 0.00012246235564816743,
+ 8.41514120111242e-05,
+ 4.193704080535099e-05
+ ],
+ "bp_grad_F": [
+ 0.11063266545534134,
+ 0.04730832949280739,
+ 0.03743334487080574,
+ 0.02577192150056362,
+ 0.01377912238240242
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.78515625,
+ "loss_eval": 0.652167797088623,
+ "epoch": 35
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4935848712921143,
+ 7.262828826904297,
+ 9.431328773498535,
+ 12.742668151855469,
+ 16.348758697509766
+ ],
+ "hidden_norms_avg": [
+ 4.6145453453063965,
+ 10.670759201049805,
+ 12.641580581665039,
+ 14.64714241027832,
+ 15.685794830322266
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003325030847918242,
+ 0.00014367286348715425,
+ 0.00011324919614708051,
+ 7.871988782426342e-05,
+ 4.058879494550638e-05
+ ],
+ "bp_grad_F": [
+ 0.11436768621206284,
+ 0.04893247410655022,
+ 0.03840672969818115,
+ 0.02707456797361374,
+ 0.014087510295212269
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7978515625,
+ "loss_eval": 0.6156834363937378,
+ "epoch": 36
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4897189140319824,
+ 7.156031608581543,
+ 9.365946769714355,
+ 12.499292373657227,
+ 15.942588806152344
+ ],
+ "hidden_norms_avg": [
+ 4.635710716247559,
+ 10.602685928344727,
+ 12.637743949890137,
+ 14.74621868133545,
+ 15.834792137145996
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000299928622553125,
+ 0.00013245265290606767,
+ 0.00010241761629004031,
+ 7.247657049447298e-05,
+ 3.780105180339888e-05
+ ],
+ "bp_grad_F": [
+ 0.11267601698637009,
+ 0.0501401461660862,
+ 0.03941003605723381,
+ 0.0279407799243927,
+ 0.014723201282322407
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.80078125,
+ "loss_eval": 0.5903886556625366,
+ "epoch": 37
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4791479110717773,
+ 7.027911186218262,
+ 9.0321044921875,
+ 12.123476028442383,
+ 15.987238883972168
+ ],
+ "hidden_norms_avg": [
+ 4.5436177253723145,
+ 10.157598495483398,
+ 12.115620613098145,
+ 14.023022651672363,
+ 15.130277633666992
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002464659046381712,
+ 0.00011603213351918384,
+ 9.401622082805261e-05,
+ 6.44488463876769e-05,
+ 2.8129303245805204e-05
+ ],
+ "bp_grad_F": [
+ 0.1319781094789505,
+ 0.05854209512472153,
+ 0.04639327526092529,
+ 0.03260229155421257,
+ 0.01578359492123127
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7841796875,
+ "loss_eval": 0.6532921195030212,
+ "epoch": 38
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4722236394882202,
+ 6.847982406616211,
+ 9.039284706115723,
+ 11.94421672821045,
+ 15.479789733886719
+ ],
+ "hidden_norms_avg": [
+ 4.536457538604736,
+ 10.0848388671875,
+ 11.944480895996094,
+ 13.931117057800293,
+ 15.018562316894531
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00023636725381948054,
+ 0.00011084756260970607,
+ 8.837366476655006e-05,
+ 6.370043411152437e-05,
+ 3.0101380616542883e-05
+ ],
+ "bp_grad_F": [
+ 0.1352969855070114,
+ 0.06069062277674675,
+ 0.04737559333443642,
+ 0.03317096084356308,
+ 0.016367904841899872
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7783203125,
+ "loss_eval": 0.6675163507461548,
+ "epoch": 39
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4741134643554688,
+ 6.7887864112854,
+ 8.833945274353027,
+ 11.777705192565918,
+ 15.091635704040527
+ ],
+ "hidden_norms_avg": [
+ 4.546427249908447,
+ 10.082904815673828,
+ 11.992964744567871,
+ 14.035684585571289,
+ 15.085047721862793
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002497230307199061,
+ 0.00011889061715919524,
+ 9.627552208257839e-05,
+ 6.80557859595865e-05,
+ 3.187589391018264e-05
+ ],
+ "bp_grad_F": [
+ 0.13283543288707733,
+ 0.06097453087568283,
+ 0.047521013766527176,
+ 0.033583469688892365,
+ 0.016502397134900093
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7998046875,
+ "loss_eval": 0.6332878470420837,
+ "epoch": 40
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4732073545455933,
+ 6.690948009490967,
+ 8.623305320739746,
+ 11.383458137512207,
+ 14.868409156799316
+ ],
+ "hidden_norms_avg": [
+ 4.510478973388672,
+ 9.772372245788574,
+ 11.55829906463623,
+ 13.379657745361328,
+ 14.343344688415527
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00019870084361173213,
+ 0.00010116927296621725,
+ 8.329773845616728e-05,
+ 6.15280878264457e-05,
+ 2.8435944841476157e-05
+ ],
+ "bp_grad_F": [
+ 0.13917136192321777,
+ 0.06636927276849747,
+ 0.05231080949306488,
+ 0.0366261750459671,
+ 0.017451239749789238
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8017578125,
+ "loss_eval": 0.6271109580993652,
+ "epoch": 41
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4620546102523804,
+ 6.489831924438477,
+ 8.487679481506348,
+ 11.202116966247559,
+ 14.761962890625
+ ],
+ "hidden_norms_avg": [
+ 4.5009870529174805,
+ 9.717012405395508,
+ 11.480990409851074,
+ 13.235471725463867,
+ 14.178875923156738
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015383858408313245,
+ 8.131976937875152e-05,
+ 6.472255336120725e-05,
+ 4.378501034807414e-05,
+ 1.9541592337191105e-05
+ ],
+ "bp_grad_F": [
+ 0.1546960175037384,
+ 0.07402726262807846,
+ 0.058267489075660706,
+ 0.041084613651037216,
+ 0.018521569669246674
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.794921875,
+ "loss_eval": 0.6767467260360718,
+ "epoch": 42
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4651520252227783,
+ 6.564362525939941,
+ 8.296653747558594,
+ 11.014183044433594,
+ 14.418519973754883
+ ],
+ "hidden_norms_avg": [
+ 4.483984470367432,
+ 9.593335151672363,
+ 11.23758316040039,
+ 13.036303520202637,
+ 14.015531539916992
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002037636877503246,
+ 0.00010235400259261951,
+ 8.395169425057247e-05,
+ 5.674947897205129e-05,
+ 2.5295201339758933e-05
+ ],
+ "bp_grad_F": [
+ 0.15471766889095306,
+ 0.07422170042991638,
+ 0.05941145122051239,
+ 0.04111991077661514,
+ 0.018912144005298615
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8037109375,
+ "loss_eval": 0.6682149171829224,
+ "epoch": 43
+ },
+ {
+ "hidden_norms_cls": [
+ 1.457137107849121,
+ 6.368557929992676,
+ 8.152215957641602,
+ 10.783031463623047,
+ 14.167640686035156
+ ],
+ "hidden_norms_avg": [
+ 4.462830066680908,
+ 9.585762977600098,
+ 11.208064079284668,
+ 13.065739631652832,
+ 13.993027687072754
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00016671593766659498,
+ 8.65811962285079e-05,
+ 7.217681559268385e-05,
+ 5.042032353230752e-05,
+ 2.1260022549540736e-05
+ ],
+ "bp_grad_F": [
+ 0.15730538964271545,
+ 0.07605564594268799,
+ 0.06052647903561592,
+ 0.04247846081852913,
+ 0.01923321560025215
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8134765625,
+ "loss_eval": 0.6757298111915588,
+ "epoch": 44
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4529122114181519,
+ 6.260828018188477,
+ 8.032843589782715,
+ 10.586301803588867,
+ 13.950445175170898
+ ],
+ "hidden_norms_avg": [
+ 4.4613800048828125,
+ 9.4591646194458,
+ 11.012088775634766,
+ 12.760184288024902,
+ 13.692852973937988
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001344321499345824,
+ 6.65406696498394e-05,
+ 5.5920852901181206e-05,
+ 3.9107719203457236e-05,
+ 1.5611329217790626e-05
+ ],
+ "bp_grad_F": [
+ 0.1660272479057312,
+ 0.08182978630065918,
+ 0.06507853418588638,
+ 0.046549297869205475,
+ 0.020592277869582176
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.806640625,
+ "loss_eval": 0.685518205165863,
+ "epoch": 45
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4509673118591309,
+ 6.163156032562256,
+ 7.82518196105957,
+ 10.378498077392578,
+ 13.96407699584961
+ ],
+ "hidden_norms_avg": [
+ 4.434635162353516,
+ 9.335474967956543,
+ 10.857998847961426,
+ 12.551763534545898,
+ 13.511585235595703
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00011230952804908156,
+ 5.540825441130437e-05,
+ 4.5063996367389336e-05,
+ 2.9814285881002434e-05,
+ 1.1903831364179496e-05
+ ],
+ "bp_grad_F": [
+ 0.1772848516702652,
+ 0.08942516893148422,
+ 0.07126298546791077,
+ 0.04956020042300224,
+ 0.021146513521671295
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7958984375,
+ "loss_eval": 0.69295334815979,
+ "epoch": 46
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4527415037155151,
+ 6.165233612060547,
+ 7.756027698516846,
+ 10.242467880249023,
+ 13.45471477508545
+ ],
+ "hidden_norms_avg": [
+ 4.438976287841797,
+ 9.343517303466797,
+ 10.836493492126465,
+ 12.435514450073242,
+ 13.287426948547363
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0001074640967999585,
+ 5.268112363410182e-05,
+ 4.352951145847328e-05,
+ 3.164535519317724e-05,
+ 1.2792614143108949e-05
+ ],
+ "bp_grad_F": [
+ 0.17606250941753387,
+ 0.08888891339302063,
+ 0.07090400159358978,
+ 0.05056491121649742,
+ 0.021766021847724915
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.806640625,
+ "loss_eval": 0.6969807147979736,
+ "epoch": 47
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4455187320709229,
+ 6.104230880737305,
+ 7.606966972351074,
+ 10.056215286254883,
+ 13.531522750854492
+ ],
+ "hidden_norms_avg": [
+ 4.394144535064697,
+ 9.197455406188965,
+ 10.598797798156738,
+ 12.198134422302246,
+ 13.1181001663208
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.084033081308007e-05,
+ 4.605063077178784e-05,
+ 3.957438457291573e-05,
+ 2.727917853917461e-05,
+ 1.0920393833657727e-05
+ ],
+ "bp_grad_F": [
+ 0.1919114887714386,
+ 0.09742862731218338,
+ 0.07786751538515091,
+ 0.05414625629782677,
+ 0.022070109844207764
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.810546875,
+ "loss_eval": 0.713995635509491,
+ "epoch": 48
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4383388757705688,
+ 6.067695617675781,
+ 7.595578670501709,
+ 9.960418701171875,
+ 13.367838859558105
+ ],
+ "hidden_norms_avg": [
+ 4.4121479988098145,
+ 9.207226753234863,
+ 10.62590217590332,
+ 12.186077117919922,
+ 13.054762840270996
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010577002831269056,
+ 5.2172203140798956e-05,
+ 4.119141885894351e-05,
+ 2.997498268086929e-05,
+ 1.1721556802513078e-05
+ ],
+ "bp_grad_F": [
+ 0.19711492955684662,
+ 0.09961695969104767,
+ 0.07941404730081558,
+ 0.05621125549077988,
+ 0.02285071834921837
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7998046875,
+ "loss_eval": 0.7457866668701172,
+ "epoch": 49
+ },
+ {
+ "hidden_norms_cls": [
+ 1.438454270362854,
+ 6.097946643829346,
+ 7.5858659744262695,
+ 9.956851959228516,
+ 13.270756721496582
+ ],
+ "hidden_norms_avg": [
+ 4.392654895782471,
+ 9.144302368164062,
+ 10.536030769348145,
+ 12.092294692993164,
+ 12.985077857971191
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00010758326970972121,
+ 5.274294744594954e-05,
+ 4.421125413500704e-05,
+ 3.0753104510949925e-05,
+ 1.1889996130776126e-05
+ ],
+ "bp_grad_F": [
+ 0.19883227348327637,
+ 0.1017213836312294,
+ 0.0807848572731018,
+ 0.056292060762643814,
+ 0.022987989708781242
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7998046875,
+ "loss_eval": 0.7402137517929077,
+ "epoch": 50
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4367005825042725,
+ 6.004332542419434,
+ 7.504194259643555,
+ 9.782310485839844,
+ 13.125389099121094
+ ],
+ "hidden_norms_avg": [
+ 4.3845720291137695,
+ 9.06988525390625,
+ 10.41169548034668,
+ 11.905806541442871,
+ 12.784433364868164
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 9.236831829184666e-05,
+ 4.803440242540091e-05,
+ 3.901722448063083e-05,
+ 2.752364525804296e-05,
+ 1.1449340490798932e-05
+ ],
+ "bp_grad_F": [
+ 0.19664740562438965,
+ 0.10213448107242584,
+ 0.08124449104070663,
+ 0.05709528177976608,
+ 0.023260990157723427
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8017578125,
+ "loss_eval": 0.732274055480957,
+ "epoch": 51
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4371269941329956,
+ 5.965888500213623,
+ 7.401495933532715,
+ 9.748833656311035,
+ 13.274619102478027
+ ],
+ "hidden_norms_avg": [
+ 4.380629539489746,
+ 9.019668579101562,
+ 10.396828651428223,
+ 11.923394203186035,
+ 12.77461051940918
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.760760490782559e-05,
+ 4.048245318699628e-05,
+ 3.216555342078209e-05,
+ 2.2310470740194432e-05,
+ 8.838631401886232e-06
+ ],
+ "bp_grad_F": [
+ 0.20731569826602936,
+ 0.10790340602397919,
+ 0.08557390421628952,
+ 0.059937626123428345,
+ 0.023827020078897476
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8046875,
+ "loss_eval": 0.7751725316047668,
+ "epoch": 52
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4341260194778442,
+ 5.9393768310546875,
+ 7.411903381347656,
+ 9.739734649658203,
+ 13.19786548614502
+ ],
+ "hidden_norms_avg": [
+ 4.378067493438721,
+ 8.986294746398926,
+ 10.316237449645996,
+ 11.792922019958496,
+ 12.673585891723633
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.968516390770674e-05,
+ 3.471451054792851e-05,
+ 2.8814916731789708e-05,
+ 1.9318980776006356e-05,
+ 7.639268915227149e-06
+ ],
+ "bp_grad_F": [
+ 0.2137812376022339,
+ 0.11110929399728775,
+ 0.08847261965274811,
+ 0.06186935305595398,
+ 0.024307044222950935
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8056640625,
+ "loss_eval": 0.764312744140625,
+ "epoch": 53
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4324616193771362,
+ 5.883492469787598,
+ 7.319663047790527,
+ 9.547243118286133,
+ 13.008822441101074
+ ],
+ "hidden_norms_avg": [
+ 4.376597881317139,
+ 8.99113941192627,
+ 10.321625709533691,
+ 11.771256446838379,
+ 12.628817558288574
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.972177991177887e-05,
+ 3.871036460623145e-05,
+ 3.142197601846419e-05,
+ 2.2371379600372165e-05,
+ 8.571933904022444e-06
+ ],
+ "bp_grad_F": [
+ 0.21534259617328644,
+ 0.11241323500871658,
+ 0.08915204554796219,
+ 0.06287811696529388,
+ 0.024627922102808952
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7958984375,
+ "loss_eval": 0.7731261253356934,
+ "epoch": 54
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4321078062057495,
+ 5.858248710632324,
+ 7.306819915771484,
+ 9.56387996673584,
+ 13.071084022521973
+ ],
+ "hidden_norms_avg": [
+ 4.371452808380127,
+ 8.94082260131836,
+ 10.26811695098877,
+ 11.765360832214355,
+ 12.617104530334473
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.236401870613918e-05,
+ 3.8528516597580165e-05,
+ 3.0984694603830576e-05,
+ 2.1565809220192023e-05,
+ 7.989257937879302e-06
+ ],
+ "bp_grad_F": [
+ 0.2197490781545639,
+ 0.1155213937163353,
+ 0.09188564866781235,
+ 0.06453806161880493,
+ 0.024861471727490425
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.7958984375,
+ "loss_eval": 0.7778797149658203,
+ "epoch": 55
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4319349527359009,
+ 5.846956253051758,
+ 7.283481121063232,
+ 9.520010948181152,
+ 13.023626327514648
+ ],
+ "hidden_norms_avg": [
+ 4.372097969055176,
+ 8.950923919677734,
+ 10.25277328491211,
+ 11.715353012084961,
+ 12.572748184204102
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.399707490345463e-05,
+ 3.384953743079677e-05,
+ 2.7512824090081267e-05,
+ 1.8538266886025667e-05,
+ 7.2009356699709315e-06
+ ],
+ "bp_grad_F": [
+ 0.21942120790481567,
+ 0.11553706228733063,
+ 0.09221186488866806,
+ 0.06456339359283447,
+ 0.024819573387503624
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.798828125,
+ "loss_eval": 0.7808230519294739,
+ "epoch": 56
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4311723709106445,
+ 5.84969425201416,
+ 7.275974273681641,
+ 9.513206481933594,
+ 12.99256420135498
+ ],
+ "hidden_norms_avg": [
+ 4.37282133102417,
+ 8.946002006530762,
+ 10.248116493225098,
+ 11.702008247375488,
+ 12.54873275756836
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.404191663023084e-05,
+ 3.509471571305767e-05,
+ 2.9476050258381292e-05,
+ 1.9310447896714322e-05,
+ 7.2306984293391e-06
+ ],
+ "bp_grad_F": [
+ 0.22379544377326965,
+ 0.11763197183609009,
+ 0.09364764392375946,
+ 0.06539658457040787,
+ 0.02503892220556736
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.80078125,
+ "loss_eval": 0.7862963080406189,
+ "epoch": 57
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4306355714797974,
+ 5.837501049041748,
+ 7.250905990600586,
+ 9.502866744995117,
+ 13.022948265075684
+ ],
+ "hidden_norms_avg": [
+ 4.368107795715332,
+ 8.927281379699707,
+ 10.20923900604248,
+ 11.650206565856934,
+ 12.504077911376953
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 7.216054655145854e-05,
+ 3.7455520214280114e-05,
+ 3.0207094823708758e-05,
+ 2.1436455426737666e-05,
+ 7.401154562103329e-06
+ ],
+ "bp_grad_F": [
+ 0.22603340446949005,
+ 0.11918352544307709,
+ 0.0947541669011116,
+ 0.06624340265989304,
+ 0.02514214999973774
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.8017578125,
+ "loss_eval": 0.7883187532424927,
+ "epoch": 58
+ },
+ {
+ "hidden_norms_cls": [
+ 1.4303507804870605,
+ 5.833686351776123,
+ 7.24592399597168,
+ 9.48628044128418,
+ 12.962425231933594
+ ],
+ "hidden_norms_avg": [
+ 4.368690013885498,
+ 8.926249504089355,
+ 10.21507453918457,
+ 11.65561294555664,
+ 12.507142066955566
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.914411642355844e-05,
+ 3.7666370189981535e-05,
+ 3.0613842682214454e-05,
+ 2.0578616386046633e-05,
+ 7.153785645641619e-06
+ ],
+ "bp_grad_F": [
+ 0.22665317356586456,
+ 0.1197197362780571,
+ 0.09526386857032776,
+ 0.06651060283184052,
+ 0.02521701157093048
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.798828125,
+ "loss_eval": 0.7879265546798706,
+ "epoch": 59
+ },
+ {
+ "hidden_norms_cls": [
+ 1.430293083190918,
+ 5.832674026489258,
+ 7.243373394012451,
+ 9.484408378601074,
+ 12.968917846679688
+ ],
+ "hidden_norms_avg": [
+ 4.368374347686768,
+ 8.92542552947998,
+ 10.214056015014648,
+ 11.65438175201416,
+ 12.507084846496582
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.862521695438772e-05,
+ 3.740868851309642e-05,
+ 3.050716986763291e-05,
+ 2.0533103452180512e-05,
+ 7.137502961995779e-06
+ ],
+ "bp_grad_F": [
+ 0.22697713971138,
+ 0.11988355964422226,
+ 0.09540446847677231,
+ 0.06659507006406784,
+ 0.025233659893274307
+ ],
+ "gamma_dfa": NaN,
+ "gamma_dfa_per_layer": [],
+ "acc_eval": 0.798828125,
+ "loss_eval": 0.7890625,
+ "epoch": 60
+ }
+ ],
+ "dfa_log": [
+ {
+ "hidden_norms_cls": [
+ 0.31052109599113464,
+ 3.2536301612854004,
+ 4.7681732177734375,
+ 6.129599571228027,
+ 7.124356746673584
+ ],
+ "hidden_norms_avg": [
+ 6.008513927459717,
+ 7.034290313720703,
+ 7.942849636077881,
+ 8.915729522705078,
+ 9.635361671447754
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.004442029166966677,
+ 0.0012008437188342214,
+ 0.0009976272704079747,
+ 0.0009104337659664452,
+ 0.0008558662957511842
+ ],
+ "bp_grad_F": [
+ 0.18535660207271576,
+ 0.03968670591711998,
+ 0.032604776322841644,
+ 0.029427478089928627,
+ 0.02746850810945034
+ ],
+ "gamma_dfa": 0.003905070887412876,
+ "gamma_dfa_per_layer": [
+ 0.004920602310448885,
+ 0.005249542184174061,
+ 0.0038580193649977446,
+ 0.0015921196900308132
+ ],
+ "acc_eval": 0.1376953125,
+ "loss_eval": 2.35188627243042,
+ "epoch": 0
+ },
+ {
+ "hidden_norms_cls": [
+ 1.969543218612671,
+ 2409.528564453125,
+ 2965.8515625,
+ 5388.57568359375,
+ 10078.4892578125
+ ],
+ "hidden_norms_avg": [
+ 45.02196502685547,
+ 4042.294189453125,
+ 10780.892578125,
+ 14336.607421875,
+ 18185.720703125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00021220046619419008,
+ 6.587009124814358e-07,
+ 6.152115474833408e-07,
+ 6.009134381201875e-07,
+ 6.002246095704322e-07
+ ],
+ "bp_grad_F": [
+ 0.327708899974823,
+ 5.584151222137734e-05,
+ 3.1912604754325e-05,
+ 2.0850193322985433e-05,
+ 2.061383202089928e-05
+ ],
+ "gamma_dfa": 0.0062168055737856776,
+ "gamma_dfa_per_layer": [
+ 0.0034891567192971706,
+ 0.014096655882894993,
+ 0.008750341832637787,
+ -0.0014689321396872401
+ ],
+ "acc_eval": 0.240234375,
+ "loss_eval": 2.0569005012512207,
+ "epoch": 1
+ },
+ {
+ "hidden_norms_cls": [
+ 4.063174247741699,
+ 6453.43212890625,
+ 10849.3359375,
+ 13374.7021484375,
+ 36052.8046875
+ ],
+ "hidden_norms_avg": [
+ 93.43009185791016,
+ 12578.36328125,
+ 48372.984375,
+ 57469.9609375,
+ 73801.421875
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015539559535682201,
+ 2.588524239399703e-07,
+ 1.9553621655177267e-07,
+ 1.8433813409046707e-07,
+ 1.781664309419284e-07
+ ],
+ "bp_grad_F": [
+ 0.09239349514245987,
+ 5.2396142564248294e-05,
+ 9.398144356964622e-06,
+ 6.586112704098923e-06,
+ 6.009819117025472e-06
+ ],
+ "gamma_dfa": 0.009027999331010506,
+ "gamma_dfa_per_layer": [
+ 0.010615326464176178,
+ 0.014681536704301834,
+ 0.012467417865991592,
+ -0.0016522837104275823
+ ],
+ "acc_eval": 0.2236328125,
+ "loss_eval": 2.0732030868530273,
+ "epoch": 2
+ },
+ {
+ "hidden_norms_cls": [
+ 6.139724254608154,
+ 13514.7626953125,
+ 22634.615234375,
+ 30011.625,
+ 105646.9140625
+ ],
+ "hidden_norms_avg": [
+ 140.93157958984375,
+ 27337.47265625,
+ 105659.2734375,
+ 131533.03125,
+ 178079.78125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00013191952893976122,
+ 1.5711624712366756e-07,
+ 6.783211148331247e-08,
+ 6.273136676782087e-08,
+ 6.216072989673194e-08
+ ],
+ "bp_grad_F": [
+ 0.15658611059188843,
+ 2.8997201297897846e-05,
+ 2.6110699309356278e-06,
+ 2.0865154510829598e-06,
+ 2.029548568316386e-06
+ ],
+ "gamma_dfa": 0.0068359210272319615,
+ "gamma_dfa_per_layer": [
+ 0.01239929161965847,
+ 0.008297638036310673,
+ 0.009697571396827698,
+ -0.0030508169438689947
+ ],
+ "acc_eval": 0.2255859375,
+ "loss_eval": 2.0859451293945312,
+ "epoch": 3
+ },
+ {
+ "hidden_norms_cls": [
+ 8.060498237609863,
+ 26771.85546875,
+ 47700.99609375,
+ 65194.9375,
+ 243467.953125
+ ],
+ "hidden_norms_avg": [
+ 189.60569763183594,
+ 53537.2734375,
+ 224677.375,
+ 271932.0625,
+ 380665.78125
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.88996515236795e-05,
+ 7.635610188572173e-08,
+ 3.178359264666142e-08,
+ 2.8310823907418126e-08,
+ 2.8113991135114702e-08
+ ],
+ "bp_grad_F": [
+ 0.18565885722637177,
+ 2.3117625460145064e-05,
+ 1.2200183618915617e-06,
+ 1.0046638863059343e-06,
+ 9.67514324656804e-07
+ ],
+ "gamma_dfa": 0.00588334770873189,
+ "gamma_dfa_per_layer": [
+ 0.012929551303386688,
+ 0.005936518311500549,
+ 0.009927853010594845,
+ -0.0052605317905545235
+ ],
+ "acc_eval": 0.216796875,
+ "loss_eval": 2.1008124351501465,
+ "epoch": 4
+ },
+ {
+ "hidden_norms_cls": [
+ 9.924980163574219,
+ 45836.29296875,
+ 86015.5546875,
+ 115240.734375,
+ 396649.5625
+ ],
+ "hidden_norms_avg": [
+ 236.08885192871094,
+ 94806.203125,
+ 447709.03125,
+ 539570.125,
+ 680795.4375
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014524323341902345,
+ 3.066869780354864e-08,
+ 1.9569522891060842e-08,
+ 1.7725259482404e-08,
+ 1.7704602228718613e-08
+ ],
+ "bp_grad_F": [
+ 0.21425659954547882,
+ 1.3653657333634328e-05,
+ 6.662682494606997e-07,
+ 5.818570798510336e-07,
+ 5.813048460368009e-07
+ ],
+ "gamma_dfa": 0.006635856116190553,
+ "gamma_dfa_per_layer": [
+ 0.010879420675337315,
+ 0.013957185670733452,
+ 0.00779206957668066,
+ -0.006085251457989216
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.1039814949035645,
+ "epoch": 5
+ },
+ {
+ "hidden_norms_cls": [
+ 11.746355056762695,
+ 70552.8046875,
+ 256103.15625,
+ 694951.625,
+ 808366.5625
+ ],
+ "hidden_norms_avg": [
+ 279.4807434082031,
+ 128343.046875,
+ 645095.375,
+ 810123.8125,
+ 959871.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 6.159865733934566e-05,
+ 2.1975946395969004e-08,
+ 1.1060357074654803e-08,
+ 9.967390468546e-09,
+ 1.011228256686536e-08
+ ],
+ "bp_grad_F": [
+ 0.09021499752998352,
+ 5.0024723350361455e-06,
+ 4.539916176327097e-07,
+ 3.891582309734076e-07,
+ 3.9641980720261927e-07
+ ],
+ "gamma_dfa": 0.003665695490781218,
+ "gamma_dfa_per_layer": [
+ 0.009222292341291904,
+ 0.0031545532401651144,
+ 0.00775552075356245,
+ -0.005469584371894598
+ ],
+ "acc_eval": 0.220703125,
+ "loss_eval": 2.1214356422424316,
+ "epoch": 6
+ },
+ {
+ "hidden_norms_cls": [
+ 13.500020980834961,
+ 102720.734375,
+ 194937.703125,
+ 291956.1875,
+ 801362.9375
+ ],
+ "hidden_norms_avg": [
+ 321.6004943847656,
+ 208601.421875,
+ 1002364.1875,
+ 1189027.25,
+ 1448220.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00014696457947138697,
+ 1.642234792598174e-08,
+ 8.907985460382406e-09,
+ 8.127726935924784e-09,
+ 8.014287011803845e-09
+ ],
+ "bp_grad_F": [
+ 0.06841801106929779,
+ 4.044012712256517e-06,
+ 3.4213746857858496e-07,
+ 2.990170742123155e-07,
+ 2.988945198012516e-07
+ ],
+ "gamma_dfa": 0.004651258233934641,
+ "gamma_dfa_per_layer": [
+ 0.007132797501981258,
+ 0.010231958702206612,
+ 0.006907162256538868,
+ -0.0056668855249881744
+ ],
+ "acc_eval": 0.2099609375,
+ "loss_eval": 2.0963404178619385,
+ "epoch": 7
+ },
+ {
+ "hidden_norms_cls": [
+ 15.302024841308594,
+ 160872.96875,
+ 604043.4375,
+ 1296474.125,
+ 1546227.0
+ ],
+ "hidden_norms_avg": [
+ 359.47259521484375,
+ 298263.5,
+ 1317573.75,
+ 1553171.25,
+ 1878602.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000136460512294434,
+ 1.0422226637274434e-08,
+ 5.898865396147812e-09,
+ 5.4856741371622775e-09,
+ 5.4926698744850455e-09
+ ],
+ "bp_grad_F": [
+ 0.07932842522859573,
+ 2.1081664272060152e-06,
+ 2.560300345066935e-07,
+ 2.2075181504987995e-07,
+ 2.2043255398784822e-07
+ ],
+ "gamma_dfa": 0.004627774120308459,
+ "gamma_dfa_per_layer": [
+ 0.006024104077368975,
+ 0.01116865873336792,
+ 0.005747191607952118,
+ -0.004428857937455177
+ ],
+ "acc_eval": 0.220703125,
+ "loss_eval": 2.0744481086730957,
+ "epoch": 8
+ },
+ {
+ "hidden_norms_cls": [
+ 17.009462356567383,
+ 204948.671875,
+ 405065.21875,
+ 549855.3125,
+ 1400973.875
+ ],
+ "hidden_norms_avg": [
+ 396.66558837890625,
+ 480022.3125,
+ 2019487.75,
+ 2350966.75,
+ 2708745.25
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00026586122112348676,
+ 1.0135083883255902e-08,
+ 6.120911777429683e-09,
+ 5.8359819199438334e-09,
+ 5.662275093243352e-09
+ ],
+ "bp_grad_F": [
+ 0.37594228982925415,
+ 1.2430107744876295e-05,
+ 2.3164905371686473e-07,
+ 2.0265188993562333e-07,
+ 2.001279000296563e-07
+ ],
+ "gamma_dfa": 0.004862090456299484,
+ "gamma_dfa_per_layer": [
+ 0.006278482731431723,
+ 0.012495312839746475,
+ 0.005351733416318893,
+ -0.004677167162299156
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.0641043186187744,
+ "epoch": 9
+ },
+ {
+ "hidden_norms_cls": [
+ 18.669273376464844,
+ 316404.0625,
+ 619048.375,
+ 804163.5,
+ 1798441.0
+ ],
+ "hidden_norms_avg": [
+ 434.9389343261719,
+ 650998.25,
+ 2437815.25,
+ 2802479.0,
+ 3269810.75
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003605277743190527,
+ 6.009571951182124e-09,
+ 4.676837139783174e-09,
+ 4.657723096102018e-09,
+ 4.49635484400801e-09
+ ],
+ "bp_grad_F": [
+ 0.14846132695674896,
+ 4.3979816837236285e-06,
+ 1.7215310776919068e-07,
+ 1.581869213396203e-07,
+ 1.561998885790672e-07
+ ],
+ "gamma_dfa": 0.004480502451770008,
+ "gamma_dfa_per_layer": [
+ 0.006086423061788082,
+ 0.010957473888993263,
+ 0.004586817231029272,
+ -0.003708704374730587
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.0591208934783936,
+ "epoch": 10
+ },
+ {
+ "hidden_norms_cls": [
+ 20.326766967773438,
+ 443508.46875,
+ 899668.0625,
+ 1131299.375,
+ 2182177.5
+ ],
+ "hidden_norms_avg": [
+ 473.4957275390625,
+ 854388.9375,
+ 2926402.0,
+ 3295286.75,
+ 3825241.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005711699486710131,
+ 4.8561932253221585e-09,
+ 3.871160725310574e-09,
+ 3.833432238309342e-09,
+ 3.74674646863582e-09
+ ],
+ "bp_grad_F": [
+ 1.0882306098937988,
+ 3.257442813264788e-06,
+ 1.6311048511852277e-07,
+ 1.3397652764979284e-07,
+ 1.326638283671855e-07
+ ],
+ "gamma_dfa": 0.00462920154677704,
+ "gamma_dfa_per_layer": [
+ 0.008616073988378048,
+ 0.009468363597989082,
+ 0.003528183326125145,
+ -0.003095814725384116
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 2.0471031665802,
+ "epoch": 11
+ },
+ {
+ "hidden_norms_cls": [
+ 21.944751739501953,
+ 581616.1875,
+ 1205317.625,
+ 1456984.375,
+ 2587496.75
+ ],
+ "hidden_norms_avg": [
+ 511.203125,
+ 1119566.25,
+ 3562080.25,
+ 3992681.5,
+ 4538977.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009346234728582203,
+ 4.117307383921798e-09,
+ 3.257990321969828e-09,
+ 3.2349201095627222e-09,
+ 3.1638915931608835e-09
+ ],
+ "bp_grad_F": [
+ 0.42184242606163025,
+ 2.2249487301451154e-06,
+ 1.2586481545895367e-07,
+ 1.1919513553948491e-07,
+ 1.181974553787768e-07
+ ],
+ "gamma_dfa": 0.0034259117674082518,
+ "gamma_dfa_per_layer": [
+ 0.00526365265250206,
+ 0.008116653189063072,
+ 0.0030386103317141533,
+ -0.0027152691036462784
+ ],
+ "acc_eval": 0.2255859375,
+ "loss_eval": 2.0867815017700195,
+ "epoch": 12
+ },
+ {
+ "hidden_norms_cls": [
+ 23.46192741394043,
+ 733909.875,
+ 1508464.125,
+ 1841074.875,
+ 3055228.75
+ ],
+ "hidden_norms_avg": [
+ 546.8953247070312,
+ 1235037.0,
+ 3742642.75,
+ 4200378.0,
+ 4892382.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009773626225069165,
+ 3.5754739169391314e-09,
+ 2.9525657474493983e-09,
+ 2.9297144710227485e-09,
+ 2.8955173814182444e-09
+ ],
+ "bp_grad_F": [
+ 0.15538839995861053,
+ 2.0067516288690967e-06,
+ 1.1871279781416888e-07,
+ 1.046255491132797e-07,
+ 1.0416235340926505e-07
+ ],
+ "gamma_dfa": 0.002340688748518005,
+ "gamma_dfa_per_layer": [
+ 0.0019294173689559102,
+ 0.007100729271769524,
+ 0.0026949853636324406,
+ -0.0023623770102858543
+ ],
+ "acc_eval": 0.232421875,
+ "loss_eval": 2.088564872741699,
+ "epoch": 13
+ },
+ {
+ "hidden_norms_cls": [
+ 24.94734764099121,
+ 1151802.75,
+ 3671404.25,
+ 4625593.5,
+ 5052590.0
+ ],
+ "hidden_norms_avg": [
+ 582.0977172851562,
+ 1475600.75,
+ 4403784.0,
+ 5008330.0,
+ 5801902.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007562927203252912,
+ 2.676908916754428e-09,
+ 2.2055020032496486e-09,
+ 2.179777247590664e-09,
+ 2.173634161550808e-09
+ ],
+ "bp_grad_F": [
+ 0.36642539501190186,
+ 3.967601060139714e-06,
+ 8.444904864290947e-08,
+ 7.993684647544796e-08,
+ 7.900475651467787e-08
+ ],
+ "gamma_dfa": 0.0017957038653548807,
+ "gamma_dfa_per_layer": [
+ 0.0019046596717089415,
+ 0.005139546003192663,
+ 0.001759346341714263,
+ -0.0016207365551963449
+ ],
+ "acc_eval": 0.2109375,
+ "loss_eval": 2.08038330078125,
+ "epoch": 14
+ },
+ {
+ "hidden_norms_cls": [
+ 26.36701011657715,
+ 2210167.25,
+ 6804633.5,
+ 7592304.0,
+ 7772230.0
+ ],
+ "hidden_norms_avg": [
+ 615.4749145507812,
+ 1852637.875,
+ 5297662.0,
+ 6054509.0,
+ 6940769.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0009053644607774913,
+ 2.014937106054049e-09,
+ 1.6813730407960747e-09,
+ 1.63718916201816e-09,
+ 1.6135126568173064e-09
+ ],
+ "bp_grad_F": [
+ 0.15154746174812317,
+ 3.760401341423858e-06,
+ 6.479213254806382e-08,
+ 6.350511227992683e-08,
+ 6.00040195308793e-08
+ ],
+ "gamma_dfa": 0.00026495405472815037,
+ "gamma_dfa_per_layer": [
+ -0.0023696955759078264,
+ 0.0033954931423068047,
+ 0.0012687842827290297,
+ -0.0012347656302154064
+ ],
+ "acc_eval": 0.2333984375,
+ "loss_eval": 2.0685791969299316,
+ "epoch": 15
+ },
+ {
+ "hidden_norms_cls": [
+ 27.747814178466797,
+ 2020373.25,
+ 6352088.0,
+ 7372759.0,
+ 7751557.0
+ ],
+ "hidden_norms_avg": [
+ 647.8715209960938,
+ 2166255.0,
+ 5964871.0,
+ 6820316.0,
+ 7888183.5
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000535959261469543,
+ 1.8833379300531305e-09,
+ 1.6251041623505103e-09,
+ 1.5936774122593533e-09,
+ 1.5920619267362213e-09
+ ],
+ "bp_grad_F": [
+ 0.06977186352014542,
+ 4.2289293560315855e-06,
+ 5.94431135425566e-08,
+ 5.634814925770115e-08,
+ 5.626874255426628e-08
+ ],
+ "gamma_dfa": 0.0009004889943753369,
+ "gamma_dfa_per_layer": [
+ 1.3074517482891679e-05,
+ 0.003544538514688611,
+ 0.0012792267370969057,
+ -0.0012348837917670608
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 2.0676896572113037,
+ "epoch": 16
+ },
+ {
+ "hidden_norms_cls": [
+ 29.053590774536133,
+ 3083884.0,
+ 8692576.0,
+ 10024582.0,
+ 10278143.0
+ ],
+ "hidden_norms_avg": [
+ 679.1322021484375,
+ 2750560.0,
+ 7205648.0,
+ 8204248.5,
+ 9336888.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006835769745521247,
+ 1.5781399520520267e-09,
+ 1.3378861352109084e-09,
+ 1.2995797771253592e-09,
+ 1.2820219330578198e-09
+ ],
+ "bp_grad_F": [
+ 0.25767308473587036,
+ 1.6246455061263987e-06,
+ 6.349461756371966e-08,
+ 6.242527206268278e-08,
+ 4.5665522918625356e-08
+ ],
+ "gamma_dfa": 0.0003357882087584585,
+ "gamma_dfa_per_layer": [
+ -0.001319598057307303,
+ 0.002733789850026369,
+ 0.0008947808528319001,
+ -0.0009658198105171323
+ ],
+ "acc_eval": 0.23046875,
+ "loss_eval": 2.0777204036712646,
+ "epoch": 17
+ },
+ {
+ "hidden_norms_cls": [
+ 30.246440887451172,
+ 3200014.0,
+ 8626485.0,
+ 9743865.0,
+ 10146681.0
+ ],
+ "hidden_norms_avg": [
+ 708.5135498046875,
+ 2989787.0,
+ 7458187.5,
+ 8607358.0,
+ 10070516.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005841738311573863,
+ 1.4247033552905464e-09,
+ 1.2406603522308046e-09,
+ 1.21434362565509e-09,
+ 1.217411615961339e-09
+ ],
+ "bp_grad_F": [
+ 0.08999939262866974,
+ 1.7538721976961824e-06,
+ 4.803559150445835e-08,
+ 4.36282370230856e-08,
+ 4.3068951072200434e-08
+ ],
+ "gamma_dfa": -2.2506676032207906e-05,
+ "gamma_dfa_per_layer": [
+ -0.002581980312243104,
+ 0.002518225461244583,
+ 0.0009317069780081511,
+ -0.0009579788311384618
+ ],
+ "acc_eval": 0.2392578125,
+ "loss_eval": 2.0627658367156982,
+ "epoch": 18
+ },
+ {
+ "hidden_norms_cls": [
+ 31.42615509033203,
+ 4556513.5,
+ 10711725.0,
+ 11956874.0,
+ 12318100.0
+ ],
+ "hidden_norms_avg": [
+ 737.157958984375,
+ 3520006.5,
+ 8303534.5,
+ 9571905.0,
+ 11293369.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007374613196589053,
+ 1.2111865954622658e-09,
+ 1.0633514069269268e-09,
+ 1.0194807220642588e-09,
+ 1.0034837405470398e-09
+ ],
+ "bp_grad_F": [
+ 0.12247106432914734,
+ 2.740941681622644e-06,
+ 4.6019909660799385e-08,
+ 4.372383344275477e-08,
+ 3.6865596797497346e-08
+ ],
+ "gamma_dfa": 0.0005736843086197041,
+ "gamma_dfa_per_layer": [
+ 0.0002251334663014859,
+ 0.0021776340436190367,
+ 0.0006795942317694426,
+ -0.0007876245072111487
+ ],
+ "acc_eval": 0.22265625,
+ "loss_eval": 2.062939167022705,
+ "epoch": 19
+ },
+ {
+ "hidden_norms_cls": [
+ 32.559165954589844,
+ 4224958.5,
+ 10227904.0,
+ 11507743.0,
+ 12041642.0
+ ],
+ "hidden_norms_avg": [
+ 765.5013427734375,
+ 3988012.5,
+ 8953060.0,
+ 10431809.0,
+ 12380471.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006474430556409061,
+ 1.179957687114097e-09,
+ 1.0031043773395254e-09,
+ 9.744786089171953e-10,
+ 9.782840093564005e-10
+ ],
+ "bp_grad_F": [
+ 0.12209221720695496,
+ 1.616509621271689e-06,
+ 3.8821241332698264e-08,
+ 3.6648025059093925e-08,
+ 3.527756931021031e-08
+ ],
+ "gamma_dfa": -0.00019280995184089988,
+ "gamma_dfa_per_layer": [
+ -0.002911232877522707,
+ 0.0022857212461531162,
+ 0.0006594176520593464,
+ -0.0008051458280533552
+ ],
+ "acc_eval": 0.240234375,
+ "loss_eval": 2.0555338859558105,
+ "epoch": 20
+ },
+ {
+ "hidden_norms_cls": [
+ 33.59370040893555,
+ 5323277.5,
+ 11855673.0,
+ 13697022.0,
+ 14246667.0
+ ],
+ "hidden_norms_avg": [
+ 789.9629516601562,
+ 4634178.0,
+ 10205192.0,
+ 11930021.0,
+ 13993152.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006352875498123467,
+ 1.0036302899862903e-09,
+ 8.794808215029093e-10,
+ 8.579849608558732e-10,
+ 8.574586596310496e-10
+ ],
+ "bp_grad_F": [
+ 0.09745635837316513,
+ 5.127232043378172e-07,
+ 3.342180221466151e-08,
+ 3.173540363832217e-08,
+ 3.091372491326183e-08
+ ],
+ "gamma_dfa": -0.0006959605379961431,
+ "gamma_dfa_per_layer": [
+ -0.004454955458641052,
+ 0.0018251645378768444,
+ 0.0005447655566968024,
+ -0.000698816787917167
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.056840181350708,
+ "epoch": 21
+ },
+ {
+ "hidden_norms_cls": [
+ 34.583858489990234,
+ 6778143.0,
+ 13401385.0,
+ 15847366.0,
+ 16344266.0
+ ],
+ "hidden_norms_avg": [
+ 814.3038330078125,
+ 5395352.5,
+ 11137891.0,
+ 13094203.0,
+ 15406614.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0006492820102721453,
+ 8.925201688825268e-10,
+ 7.777718469270667e-10,
+ 7.627384279729199e-10,
+ 7.601627105557895e-10
+ ],
+ "bp_grad_F": [
+ 0.08801906555891037,
+ 1.8660392697711359e-06,
+ 3.472371190582635e-08,
+ 2.7845679539950652e-08,
+ 2.7135749647300145e-08
+ ],
+ "gamma_dfa": -0.0012016263353871182,
+ "gamma_dfa_per_layer": [
+ -0.006280785892158747,
+ 0.001651690574362874,
+ 0.0004266214673407376,
+ -0.0006040314910933375
+ ],
+ "acc_eval": 0.2255859375,
+ "loss_eval": 2.0746021270751953,
+ "epoch": 22
+ },
+ {
+ "hidden_norms_cls": [
+ 35.516666412353516,
+ 6985935.5,
+ 14020116.0,
+ 16575473.0,
+ 17109272.0
+ ],
+ "hidden_norms_avg": [
+ 838.5614013671875,
+ 6365095.0,
+ 12448551.0,
+ 14566203.0,
+ 16943832.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0007437304593622684,
+ 8.387662786546457e-10,
+ 7.299132409599451e-10,
+ 7.170505300635455e-10,
+ 7.115786293532267e-10
+ ],
+ "bp_grad_F": [
+ 0.1540054827928543,
+ 1.4262270724429982e-06,
+ 2.9031822279534936e-08,
+ 2.776059560005706e-08,
+ 2.5270722403547552e-08
+ ],
+ "gamma_dfa": -0.00010950746218441054,
+ "gamma_dfa_per_layer": [
+ -0.0017721566837280989,
+ 0.0015054477844387293,
+ 0.0003872170636896044,
+ -0.000558538013137877
+ ],
+ "acc_eval": 0.2392578125,
+ "loss_eval": 2.065904140472412,
+ "epoch": 23
+ },
+ {
+ "hidden_norms_cls": [
+ 36.39850997924805,
+ 7861434.0,
+ 14415042.0,
+ 16660478.0,
+ 17496562.0
+ ],
+ "hidden_norms_avg": [
+ 862.4805297851562,
+ 6600421.5,
+ 12694272.0,
+ 15043836.0,
+ 17968980.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005834798794239759,
+ 7.558619286029966e-10,
+ 6.530426754913776e-10,
+ 6.420492471015393e-10,
+ 6.389526685524061e-10
+ ],
+ "bp_grad_F": [
+ 0.09943251311779022,
+ 1.4788431599299656e-06,
+ 2.582997993272329e-08,
+ 2.3754548550414256e-08,
+ 2.322415859623561e-08
+ ],
+ "gamma_dfa": -0.0009345750440843403,
+ "gamma_dfa_per_layer": [
+ -0.005123761482536793,
+ 0.0015550897223874927,
+ 0.0003447675844654441,
+ -0.0005143960006535053
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.041043758392334,
+ "epoch": 24
+ },
+ {
+ "hidden_norms_cls": [
+ 37.283199310302734,
+ 8933519.0,
+ 15359962.0,
+ 17441364.0,
+ 18346258.0
+ ],
+ "hidden_norms_avg": [
+ 883.0538330078125,
+ 7354756.0,
+ 13721222.0,
+ 16105006.0,
+ 19368310.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00026283934130333364,
+ 6.873029922971341e-10,
+ 6.058342161274766e-10,
+ 6.000055452481945e-10,
+ 5.98545990548871e-10
+ ],
+ "bp_grad_F": [
+ 0.11474847048521042,
+ 2.4628958271932788e-05,
+ 1.3788282160476228e-07,
+ 2.199209525599599e-08,
+ 2.15279509774291e-08
+ ],
+ "gamma_dfa": -0.0014451614988502115,
+ "gamma_dfa_per_layer": [
+ -0.006978219375014305,
+ 0.0013526652473956347,
+ 0.0002992081572301686,
+ -0.0004543000250123441
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 2.0492172241210938,
+ "epoch": 25
+ },
+ {
+ "hidden_norms_cls": [
+ 38.11500930786133,
+ 10836846.0,
+ 17507178.0,
+ 19929002.0,
+ 20726542.0
+ ],
+ "hidden_norms_avg": [
+ 901.960205078125,
+ 8138403.5,
+ 14552406.0,
+ 17157852.0,
+ 20773122.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005291851703077555,
+ 6.35470620569123e-10,
+ 5.6208532273061e-10,
+ 5.496996191567405e-10,
+ 5.433966054901873e-10
+ ],
+ "bp_grad_F": [
+ 0.07972504198551178,
+ 1.2489309710872476e-06,
+ 2.2593511062041216e-08,
+ 2.1460177634935462e-08,
+ 1.941634231172884e-08
+ ],
+ "gamma_dfa": -0.000788729106716346,
+ "gamma_dfa_per_layer": [
+ -0.00451657734811306,
+ 0.0015372345224022865,
+ 0.00024382121046073735,
+ -0.00041939481161534786
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.0669429302215576,
+ "epoch": 26
+ },
+ {
+ "hidden_norms_cls": [
+ 38.87166213989258,
+ 11480826.0,
+ 18077316.0,
+ 20884150.0,
+ 22098916.0
+ ],
+ "hidden_norms_avg": [
+ 920.577880859375,
+ 8893063.0,
+ 15579717.0,
+ 18401958.0,
+ 22225722.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005104477168060839,
+ 5.858571405781277e-10,
+ 5.198571018105724e-10,
+ 5.114682011253535e-10,
+ 5.120092128052534e-10
+ ],
+ "bp_grad_F": [
+ 0.13577552139759064,
+ 2.0482397303567268e-05,
+ 2.1394010119024642e-08,
+ 2.0649670418038113e-08,
+ 1.8286096192809964e-08
+ ],
+ "gamma_dfa": -0.0004262418224243447,
+ "gamma_dfa_per_layer": [
+ -0.0029134145006537437,
+ 0.0013950758147984743,
+ 0.00018188939429819584,
+ -0.0003685179981403053
+ ],
+ "acc_eval": 0.2490234375,
+ "loss_eval": 2.053382396697998,
+ "epoch": 27
+ },
+ {
+ "hidden_norms_cls": [
+ 39.6179313659668,
+ 10591964.0,
+ 16346992.0,
+ 18847678.0,
+ 21847726.0
+ ],
+ "hidden_norms_avg": [
+ 937.9719848632812,
+ 9576851.0,
+ 16784906.0,
+ 19828342.0,
+ 23673520.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00023470228188671172,
+ 5.629120503058971e-10,
+ 5.04818964408571e-10,
+ 4.974847200855947e-10,
+ 4.968530586957343e-10
+ ],
+ "bp_grad_F": [
+ 0.03459252789616585,
+ 8.028884622035548e-06,
+ 1.9716548393944322e-08,
+ 1.807922522800709e-08,
+ 1.7913645677936074e-08
+ ],
+ "gamma_dfa": -0.0018089709192281589,
+ "gamma_dfa_per_layer": [
+ -0.008484212681651115,
+ 0.0014374498277902603,
+ 0.00020184949971735477,
+ -0.00039097032276913524
+ ],
+ "acc_eval": 0.224609375,
+ "loss_eval": 2.0604443550109863,
+ "epoch": 28
+ },
+ {
+ "hidden_norms_cls": [
+ 40.344242095947266,
+ 10467030.0,
+ 15235544.0,
+ 17027748.0,
+ 23281082.0
+ ],
+ "hidden_norms_avg": [
+ 954.3844604492188,
+ 10038487.0,
+ 16584430.0,
+ 19613710.0,
+ 24505476.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00015729073493275791,
+ 5.36418076624301e-10,
+ 4.5378717450361705e-10,
+ 4.4796202858243817e-10,
+ 4.477457571372412e-10
+ ],
+ "bp_grad_F": [
+ 0.04820869117975235,
+ 2.3596087430632906e-06,
+ 1.7855482425943592e-08,
+ 1.7340139990551506e-08,
+ 1.672622929049794e-08
+ ],
+ "gamma_dfa": -0.0013171448226785287,
+ "gamma_dfa_per_layer": [
+ -0.006438364274799824,
+ 0.0013229507021605968,
+ 0.00020032597240060568,
+ -0.00035349169047549367
+ ],
+ "acc_eval": 0.236328125,
+ "loss_eval": 2.061581611633301,
+ "epoch": 29
+ },
+ {
+ "hidden_norms_cls": [
+ 41.04903793334961,
+ 12235056.0,
+ 17721728.0,
+ 19784938.0,
+ 25024272.0
+ ],
+ "hidden_norms_avg": [
+ 969.5825805664062,
+ 11940616.0,
+ 19401350.0,
+ 22468846.0,
+ 26879212.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00035265026963315904,
+ 5.423251847602728e-10,
+ 4.4247547292819434e-10,
+ 4.358849947649901e-10,
+ 4.3593659238005955e-10
+ ],
+ "bp_grad_F": [
+ 0.0735621377825737,
+ 1.917086819958058e-06,
+ 1.9346130031294706e-08,
+ 1.5936171493535767e-08,
+ 1.5501758099389917e-08
+ ],
+ "gamma_dfa": -0.001081134716514498,
+ "gamma_dfa_per_layer": [
+ -0.005434883758425713,
+ 0.0012318368535488844,
+ 0.00019993717432953417,
+ -0.00032142913551069796
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.0760293006896973,
+ "epoch": 30
+ },
+ {
+ "hidden_norms_cls": [
+ 41.723567962646484,
+ 10562926.0,
+ 13746881.0,
+ 15736975.0,
+ 26354068.0
+ ],
+ "hidden_norms_avg": [
+ 984.3485717773438,
+ 12533570.0,
+ 19717132.0,
+ 22961588.0,
+ 28083302.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0002546848263591528,
+ 4.777176432213537e-10,
+ 4.0483683072523036e-10,
+ 4.0072575813177025e-10,
+ 4.013349652609577e-10
+ ],
+ "bp_grad_F": [
+ 0.06879052519798279,
+ 1.7057992636182462e-06,
+ 1.6271217262442406e-08,
+ 1.4877675091895526e-08,
+ 1.484982270483215e-08
+ ],
+ "gamma_dfa": -0.0015064112594700418,
+ "gamma_dfa_per_layer": [
+ -0.007336798589676619,
+ 0.0013772943057119846,
+ 0.00022022609482519329,
+ -0.0002863668487407267
+ ],
+ "acc_eval": 0.20703125,
+ "loss_eval": 2.078207492828369,
+ "epoch": 31
+ },
+ {
+ "hidden_norms_cls": [
+ 42.342227935791016,
+ 13283171.0,
+ 17422292.0,
+ 19770980.0,
+ 28086972.0
+ ],
+ "hidden_norms_avg": [
+ 999.26123046875,
+ 13875387.0,
+ 21404830.0,
+ 24833206.0,
+ 29923332.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0003442879824433476,
+ 4.4142753341525065e-10,
+ 3.8908712363117104e-10,
+ 3.845144203040718e-10,
+ 3.8369810106964053e-10
+ ],
+ "bp_grad_F": [
+ 0.10482411086559296,
+ 2.8695783385046525e-06,
+ 1.7273855235089286e-08,
+ 1.4195452813225984e-08,
+ 1.3857171410336377e-08
+ ],
+ "gamma_dfa": -0.0009248298447346315,
+ "gamma_dfa_per_layer": [
+ -0.004888010676950216,
+ 0.0012753453338518739,
+ 0.00017224671319127083,
+ -0.0002589007490314543
+ ],
+ "acc_eval": 0.2373046875,
+ "loss_eval": 2.078000068664551,
+ "epoch": 32
+ },
+ {
+ "hidden_norms_cls": [
+ 42.90097427368164,
+ 16870614.0,
+ 22116480.0,
+ 24442270.0,
+ 29665536.0
+ ],
+ "hidden_norms_avg": [
+ 1013.56396484375,
+ 14764026.0,
+ 21856036.0,
+ 25334308.0,
+ 30474444.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047380090109072626,
+ 4.22005735911668e-10,
+ 3.5831293487831317e-10,
+ 3.5505443030103834e-10,
+ 3.5614466931122024e-10
+ ],
+ "bp_grad_F": [
+ 0.1035437062382698,
+ 1.2711110457530594e-06,
+ 1.418432571398398e-08,
+ 1.2978671470875724e-08,
+ 1.2937439564097986e-08
+ ],
+ "gamma_dfa": -0.00034118785697501153,
+ "gamma_dfa_per_layer": [
+ -0.002568737603724003,
+ 0.001293556997552514,
+ 0.000137164635816589,
+ -0.00022673545754514635
+ ],
+ "acc_eval": 0.2265625,
+ "loss_eval": 2.0730109214782715,
+ "epoch": 33
+ },
+ {
+ "hidden_norms_cls": [
+ 43.419898986816406,
+ 18221210.0,
+ 22675590.0,
+ 24728546.0,
+ 30520888.0
+ ],
+ "hidden_norms_avg": [
+ 1027.6595458984375,
+ 16337822.0,
+ 23378412.0,
+ 26921720.0,
+ 31927994.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004629126051440835,
+ 4.106864293085266e-10,
+ 3.557905081663648e-10,
+ 3.536362591649578e-10,
+ 3.5421768296295397e-10
+ ],
+ "bp_grad_F": [
+ 0.08281872421503067,
+ 1.4263683851822861e-06,
+ 1.3245164076636229e-08,
+ 1.2740572152836194e-08,
+ 1.2752362721357713e-08
+ ],
+ "gamma_dfa": -0.0006677984529233072,
+ "gamma_dfa_per_layer": [
+ -0.0036979843862354755,
+ 0.0011370242573320866,
+ 0.00012192466238047928,
+ -0.00023215834517031908
+ ],
+ "acc_eval": 0.23828125,
+ "loss_eval": 2.0669164657592773,
+ "epoch": 34
+ },
+ {
+ "hidden_norms_cls": [
+ 43.868682861328125,
+ 18758150.0,
+ 23109030.0,
+ 25432404.0,
+ 31503354.0
+ ],
+ "hidden_norms_avg": [
+ 1040.644287109375,
+ 15512033.0,
+ 21965288.0,
+ 25882228.0,
+ 31813648.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00048007385339587927,
+ 4.271450415593847e-10,
+ 3.4119135294830016e-10,
+ 3.391489034054729e-10,
+ 3.387232438978316e-10
+ ],
+ "bp_grad_F": [
+ 0.36019906401634216,
+ 1.9220671674702317e-05,
+ 1.358929768713324e-08,
+ 1.2455363851415768e-08,
+ 1.2401786264604198e-08
+ ],
+ "gamma_dfa": -0.00031488661625189707,
+ "gamma_dfa_per_layer": [
+ -0.002551896497607231,
+ 0.001431336859241128,
+ 9.301750105805695e-05,
+ -0.00023200432769954205
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 2.0609660148620605,
+ "epoch": 35
+ },
+ {
+ "hidden_norms_cls": [
+ 44.293697357177734,
+ 21659484.0,
+ 26491946.0,
+ 29332332.0,
+ 32793040.0
+ ],
+ "hidden_norms_avg": [
+ 1051.83740234375,
+ 17567000.0,
+ 24049368.0,
+ 28083622.0,
+ 33467380.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00043948061647824943,
+ 4.0486294872188466e-10,
+ 3.3493480211532756e-10,
+ 3.3453453895937457e-10,
+ 3.3604671823006527e-10
+ ],
+ "bp_grad_F": [
+ 0.10878865420818329,
+ 3.037727083210484e-06,
+ 1.2592222375928941e-08,
+ 1.2103843261002112e-08,
+ 1.2022392859023512e-08
+ ],
+ "gamma_dfa": -0.00015630935013177805,
+ "gamma_dfa_per_layer": [
+ -0.0019119374919682741,
+ 0.0014281735057011247,
+ 7.57485831854865e-05,
+ -0.00021722199744544923
+ ],
+ "acc_eval": 0.2431640625,
+ "loss_eval": 2.0587897300720215,
+ "epoch": 36
+ },
+ {
+ "hidden_norms_cls": [
+ 44.68658447265625,
+ 21628572.0,
+ 26077032.0,
+ 28336790.0,
+ 33305650.0
+ ],
+ "hidden_norms_avg": [
+ 1062.067138671875,
+ 18163602.0,
+ 24404446.0,
+ 28478594.0,
+ 34156064.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005865619168616831,
+ 4.0249623078914e-10,
+ 3.3121710929506776e-10,
+ 3.310392793220984e-10,
+ 3.318675056984688e-10
+ ],
+ "bp_grad_F": [
+ 0.20061102509498596,
+ 1.4544431223839638e-06,
+ 1.3441372459510603e-08,
+ 1.2418687411752671e-08,
+ 1.2016870165609816e-08
+ ],
+ "gamma_dfa": -0.00039686575473751873,
+ "gamma_dfa_per_layer": [
+ -0.0029668076895177364,
+ 0.0015295962803065777,
+ 6.985102663747966e-05,
+ -0.00022010263637639582
+ ],
+ "acc_eval": 0.2275390625,
+ "loss_eval": 2.0569839477539062,
+ "epoch": 37
+ },
+ {
+ "hidden_norms_cls": [
+ 45.062259674072266,
+ 25376026.0,
+ 30203382.0,
+ 32772746.0,
+ 35119040.0
+ ],
+ "hidden_norms_avg": [
+ 1071.6630859375,
+ 18637428.0,
+ 24671676.0,
+ 28819074.0,
+ 34739232.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005594053072854877,
+ 3.9023292930373543e-10,
+ 3.2509483993692356e-10,
+ 3.23913590394298e-10,
+ 3.250162639023557e-10
+ ],
+ "bp_grad_F": [
+ 0.13359014689922333,
+ 4.247889592079446e-06,
+ 1.4051211749688264e-08,
+ 1.2317144637563615e-08,
+ 1.1531787968976914e-08
+ ],
+ "gamma_dfa": -0.0005283378432068275,
+ "gamma_dfa_per_layer": [
+ -0.0037097278982400894,
+ 0.0017695487476885319,
+ 4.308431380195543e-05,
+ -0.000216256536077708
+ ],
+ "acc_eval": 0.2666015625,
+ "loss_eval": 2.0476396083831787,
+ "epoch": 38
+ },
+ {
+ "hidden_norms_cls": [
+ 45.38731384277344,
+ 24903830.0,
+ 30026926.0,
+ 33563200.0,
+ 35539932.0
+ ],
+ "hidden_norms_avg": [
+ 1080.0860595703125,
+ 20496828.0,
+ 26709690.0,
+ 30932660.0,
+ 36357072.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005004233680665493,
+ 3.8017103354270887e-10,
+ 3.1730867933177365e-10,
+ 3.167333340048373e-10,
+ 3.1768215835725755e-10
+ ],
+ "bp_grad_F": [
+ 0.24717594683170319,
+ 2.9436714612529613e-06,
+ 1.1934382371237007e-08,
+ 1.1459838411553847e-08,
+ 1.1365100860416533e-08
+ ],
+ "gamma_dfa": -0.00022031009211787023,
+ "gamma_dfa_per_layer": [
+ -0.0022991469595581293,
+ 0.0015725505072623491,
+ 4.821528273168951e-05,
+ -0.00020285919890739024
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.0488319396972656,
+ "epoch": 39
+ },
+ {
+ "hidden_norms_cls": [
+ 45.68830490112305,
+ 27470426.0,
+ 32688434.0,
+ 35418348.0,
+ 37778420.0
+ ],
+ "hidden_norms_avg": [
+ 1088.195068359375,
+ 19636778.0,
+ 25748976.0,
+ 30137794.0,
+ 36341748.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000507087679579854,
+ 3.7039282752004965e-10,
+ 3.106248036566228e-10,
+ 3.096240208666501e-10,
+ 3.10577202844442e-10
+ ],
+ "bp_grad_F": [
+ 0.247142493724823,
+ 5.3006801863375586e-06,
+ 1.5794508811950436e-08,
+ 1.5706817180216603e-08,
+ 1.0953104201405495e-08
+ ],
+ "gamma_dfa": -0.00026929086834570626,
+ "gamma_dfa_per_layer": [
+ -0.0025479549076408148,
+ 0.0016400209860876203,
+ 2.4549921363359317e-05,
+ -0.00019377947319298983
+ ],
+ "acc_eval": 0.2548828125,
+ "loss_eval": 2.0380632877349854,
+ "epoch": 40
+ },
+ {
+ "hidden_norms_cls": [
+ 45.95172119140625,
+ 29219790.0,
+ 34751968.0,
+ 37645720.0,
+ 39363420.0
+ ],
+ "hidden_norms_avg": [
+ 1095.55908203125,
+ 20059094.0,
+ 26161532.0,
+ 30539128.0,
+ 36948852.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004415555449668318,
+ 3.578430884942918e-10,
+ 3.05192260352527e-10,
+ 3.046965735276075e-10,
+ 3.0560776131949297e-10
+ ],
+ "bp_grad_F": [
+ 0.1088763028383255,
+ 4.900910880678566e-06,
+ 1.1387745857405207e-08,
+ 1.0883239198733463e-08,
+ 1.0722531307294503e-08
+ ],
+ "gamma_dfa": -0.0006201292017067317,
+ "gamma_dfa_per_layer": [
+ -0.004000760614871979,
+ 0.0016785510815680027,
+ 3.265401755925268e-05,
+ -0.0001909612910822034
+ ],
+ "acc_eval": 0.25,
+ "loss_eval": 2.041342258453369,
+ "epoch": 41
+ },
+ {
+ "hidden_norms_cls": [
+ 46.1973876953125,
+ 29375584.0,
+ 34745100.0,
+ 38109944.0,
+ 40454424.0
+ ],
+ "hidden_norms_avg": [
+ 1102.340087890625,
+ 21066706.0,
+ 27296236.0,
+ 31874516.0,
+ 38108092.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00040148120024241507,
+ 3.579030682931972e-10,
+ 3.0047467292071417e-10,
+ 2.979275159908923e-10,
+ 2.9703536852387913e-10
+ ],
+ "bp_grad_F": [
+ 0.2525903582572937,
+ 8.925781003199518e-06,
+ 1.1219404072448924e-08,
+ 1.084880185686643e-08,
+ 1.0492501978376367e-08
+ ],
+ "gamma_dfa": -0.00034770679030771134,
+ "gamma_dfa_per_layer": [
+ -0.002933461917564273,
+ 0.001698363572359085,
+ 3.748677045223303e-05,
+ -0.0001932155864778906
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.0345935821533203,
+ "epoch": 42
+ },
+ {
+ "hidden_norms_cls": [
+ 46.42340087890625,
+ 27399134.0,
+ 31821602.0,
+ 34474508.0,
+ 38109560.0
+ ],
+ "hidden_norms_avg": [
+ 1108.236328125,
+ 21543940.0,
+ 27684760.0,
+ 32082502.0,
+ 38718660.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000570801377762109,
+ 3.5802838471710174e-10,
+ 2.990230563160168e-10,
+ 2.9852947891484405e-10,
+ 2.9978877713610075e-10
+ ],
+ "bp_grad_F": [
+ 0.173945352435112,
+ 2.9223572255432373e-06,
+ 1.2221713419080515e-08,
+ 1.1539666999738074e-08,
+ 1.0805790928714032e-08
+ ],
+ "gamma_dfa": -5.9806044191645924e-05,
+ "gamma_dfa_per_layer": [
+ -0.001857165014371276,
+ 0.0017762510105967522,
+ 3.49261645169463e-05,
+ -0.00019323633750900626
+ ],
+ "acc_eval": 0.2412109375,
+ "loss_eval": 2.043308734893799,
+ "epoch": 43
+ },
+ {
+ "hidden_norms_cls": [
+ 46.619728088378906,
+ 31052948.0,
+ 36542220.0,
+ 39935176.0,
+ 42316204.0
+ ],
+ "hidden_norms_avg": [
+ 1113.68896484375,
+ 22679808.0,
+ 29079456.0,
+ 33751472.0,
+ 40006012.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046165595995262265,
+ 3.339039600369631e-10,
+ 2.9132621315319795e-10,
+ 2.9080904351275194e-10,
+ 2.9134980539247124e-10
+ ],
+ "bp_grad_F": [
+ 0.08871550858020782,
+ 1.195927779917838e-05,
+ 1.2490571243972681e-08,
+ 1.2371740965022582e-08,
+ 1.015614703447909e-08
+ ],
+ "gamma_dfa": -0.0003672020420708577,
+ "gamma_dfa_per_layer": [
+ -0.002894133096560836,
+ 0.0016025153454393148,
+ 2.5333010853501037e-05,
+ -0.0002025234280154109
+ ],
+ "acc_eval": 0.244140625,
+ "loss_eval": 2.029773473739624,
+ "epoch": 44
+ },
+ {
+ "hidden_norms_cls": [
+ 46.796348571777344,
+ 30912490.0,
+ 36281496.0,
+ 39245376.0,
+ 41656108.0
+ ],
+ "hidden_norms_avg": [
+ 1118.38134765625,
+ 23560890.0,
+ 29646840.0,
+ 34192144.0,
+ 40581760.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005251869442872703,
+ 3.3097524720915317e-10,
+ 2.891357153700369e-10,
+ 2.8932781170887267e-10,
+ 2.8904145743524623e-10
+ ],
+ "bp_grad_F": [
+ 0.09888254106044769,
+ 4.3903874029638246e-06,
+ 1.0815308648659538e-08,
+ 1.040402519691952e-08,
+ 1.0228043301196976e-08
+ ],
+ "gamma_dfa": -0.00037046667421236634,
+ "gamma_dfa_per_layer": [
+ -0.002757731592282653,
+ 0.0014231146778911352,
+ 3.9225356886163354e-05,
+ -0.00018647513934411108
+ ],
+ "acc_eval": 0.234375,
+ "loss_eval": 2.0383992195129395,
+ "epoch": 45
+ },
+ {
+ "hidden_norms_cls": [
+ 46.95427322387695,
+ 31720426.0,
+ 37234788.0,
+ 40129424.0,
+ 42928428.0
+ ],
+ "hidden_norms_avg": [
+ 1122.57470703125,
+ 22583276.0,
+ 28617936.0,
+ 33269996.0,
+ 40462568.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004295881371945143,
+ 3.419305394380956e-10,
+ 2.8222821302215095e-10,
+ 2.8184321543278656e-10,
+ 2.8312005517783234e-10
+ ],
+ "bp_grad_F": [
+ 0.5366736650466919,
+ 2.256676998513285e-05,
+ 1.1914533359913548e-08,
+ 1.1219233542192342e-08,
+ 1.004730165732326e-08
+ ],
+ "gamma_dfa": 0.00015619578334735706,
+ "gamma_dfa_per_layer": [
+ -0.0010500183561816812,
+ 0.001834970898926258,
+ 3.652184386737645e-05,
+ -0.00019669125322252512
+ ],
+ "acc_eval": 0.2431640625,
+ "loss_eval": 2.039337396621704,
+ "epoch": 46
+ },
+ {
+ "hidden_norms_cls": [
+ 47.09259796142578,
+ 32824944.0,
+ 38341332.0,
+ 41754692.0,
+ 44005196.0
+ ],
+ "hidden_norms_avg": [
+ 1126.26953125,
+ 24313264.0,
+ 30669532.0,
+ 35293632.0,
+ 41785680.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0005083036958239973,
+ 3.2607763711389737e-10,
+ 2.8033902976787317e-10,
+ 2.7943025671106625e-10,
+ 2.7980692762774595e-10
+ ],
+ "bp_grad_F": [
+ 0.06971772015094757,
+ 2.262569068989251e-06,
+ 1.0069017619684928e-08,
+ 9.845756210324907e-09,
+ 9.862499261714675e-09
+ ],
+ "gamma_dfa": 0.0007457349984179018,
+ "gamma_dfa_per_layer": [
+ 0.0015201317146420479,
+ 0.0016060702037066221,
+ 3.652479063021019e-05,
+ -0.00017978671530727297
+ ],
+ "acc_eval": 0.25,
+ "loss_eval": 2.0368857383728027,
+ "epoch": 47
+ },
+ {
+ "hidden_norms_cls": [
+ 47.21082305908203,
+ 33649040.0,
+ 39036836.0,
+ 42500816.0,
+ 44653764.0
+ ],
+ "hidden_norms_avg": [
+ 1129.5389404296875,
+ 24447482.0,
+ 30689206.0,
+ 35330028.0,
+ 42064012.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046678923536092043,
+ 3.204189136241098e-10,
+ 2.755325689829391e-10,
+ 2.7554050707756517e-10,
+ 2.7654081802275243e-10
+ ],
+ "bp_grad_F": [
+ 0.07496139407157898,
+ 2.2861270281282486e-06,
+ 9.997683569906712e-09,
+ 9.715622084627284e-09,
+ 9.736355721656764e-09
+ ],
+ "gamma_dfa": 0.0006021281524226652,
+ "gamma_dfa_per_layer": [
+ 0.0007927162805572152,
+ 0.001763419946655631,
+ 3.104796996922232e-05,
+ -0.000178671587491408
+ ],
+ "acc_eval": 0.259765625,
+ "loss_eval": 2.0324196815490723,
+ "epoch": 48
+ },
+ {
+ "hidden_norms_cls": [
+ 47.315826416015625,
+ 34514608.0,
+ 40222940.0,
+ 43606628.0,
+ 45508540.0
+ ],
+ "hidden_norms_avg": [
+ 1132.157958984375,
+ 24487910.0,
+ 30821460.0,
+ 35505456.0,
+ 42327908.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00041785358916968107,
+ 3.3263317100740153e-10,
+ 2.696754763942266e-10,
+ 2.701733836651954e-10,
+ 2.71275196750409e-10
+ ],
+ "bp_grad_F": [
+ 0.08130628615617752,
+ 3.3661247016425477e-06,
+ 1.078094857831502e-08,
+ 9.643851939244996e-09,
+ 9.617946439277603e-09
+ ],
+ "gamma_dfa": 0.0005021913366363151,
+ "gamma_dfa_per_layer": [
+ 0.00036606384674087167,
+ 0.0017899572849273682,
+ 2.7483671146910638e-05,
+ -0.00017473945626989007
+ ],
+ "acc_eval": 0.2626953125,
+ "loss_eval": 2.028841495513916,
+ "epoch": 49
+ },
+ {
+ "hidden_norms_cls": [
+ 47.388946533203125,
+ 35118772.0,
+ 40722008.0,
+ 44347232.0,
+ 46331384.0
+ ],
+ "hidden_norms_avg": [
+ 1134.3621826171875,
+ 24821028.0,
+ 31074444.0,
+ 35754528.0,
+ 42627356.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00043533919961191714,
+ 3.173189211391758e-10,
+ 2.687766953446413e-10,
+ 2.68161992611482e-10,
+ 2.690903055935223e-10
+ ],
+ "bp_grad_F": [
+ 0.09458157420158386,
+ 1.9965789306297665e-06,
+ 1.025628915130028e-08,
+ 9.58252854843522e-09,
+ 9.523047239667903e-09
+ ],
+ "gamma_dfa": 0.00038969498109509004,
+ "gamma_dfa_per_layer": [
+ -0.00010247333557344973,
+ 0.0018051008228212595,
+ 3.0877545214025304e-05,
+ -0.0001747251080814749
+ ],
+ "acc_eval": 0.2548828125,
+ "loss_eval": 2.0298049449920654,
+ "epoch": 50
+ },
+ {
+ "hidden_norms_cls": [
+ 47.4621696472168,
+ 34836160.0,
+ 40469796.0,
+ 44120564.0,
+ 46361016.0
+ ],
+ "hidden_norms_avg": [
+ 1136.3079833984375,
+ 24152832.0,
+ 30436140.0,
+ 35273740.0,
+ 42621312.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.000491869286634028,
+ 3.2774055691575654e-10,
+ 2.667974174919152e-10,
+ 2.669577336966711e-10,
+ 2.680060617876734e-10
+ ],
+ "bp_grad_F": [
+ 0.0854402706027031,
+ 1.6183460047614062e-06,
+ 9.980491100236577e-09,
+ 9.461099459429079e-09,
+ 9.473674289495193e-09
+ ],
+ "gamma_dfa": 0.0005695745421689935,
+ "gamma_dfa_per_layer": [
+ 0.0004214277723804116,
+ 0.001994946738705039,
+ 3.653779276646674e-05,
+ -0.00017461413517594337
+ ],
+ "acc_eval": 0.23828125,
+ "loss_eval": 2.024928092956543,
+ "epoch": 51
+ },
+ {
+ "hidden_norms_cls": [
+ 47.52342224121094,
+ 36446320.0,
+ 42468064.0,
+ 46175108.0,
+ 47947040.0
+ ],
+ "hidden_norms_avg": [
+ 1137.8057861328125,
+ 25400616.0,
+ 31703746.0,
+ 36432956.0,
+ 43307828.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00034005154157057405,
+ 3.121023717245208e-10,
+ 2.6523216956064743e-10,
+ 2.6489818671926457e-10,
+ 2.649658548126155e-10
+ ],
+ "bp_grad_F": [
+ 0.10125189274549484,
+ 4.0649438233231194e-06,
+ 9.830144698241838e-09,
+ 9.345456852827283e-09,
+ 9.317212779080819e-09
+ ],
+ "gamma_dfa": 0.0005080709906906122,
+ "gamma_dfa_per_layer": [
+ 0.00023581110872328281,
+ 0.0019333910895511508,
+ 3.0449831683654338e-05,
+ -0.00016736806719563901
+ ],
+ "acc_eval": 0.251953125,
+ "loss_eval": 2.0343496799468994,
+ "epoch": 52
+ },
+ {
+ "hidden_norms_cls": [
+ 47.567466735839844,
+ 35483484.0,
+ 41150516.0,
+ 44742840.0,
+ 47102380.0
+ ],
+ "hidden_norms_avg": [
+ 1139.05029296875,
+ 25225282.0,
+ 31585082.0,
+ 36363108.0,
+ 43411416.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00046872245729900897,
+ 3.1678357159670156e-10,
+ 2.6331647973165673e-10,
+ 2.64141680750285e-10,
+ 2.646937946604311e-10
+ ],
+ "bp_grad_F": [
+ 0.08037562668323517,
+ 2.9532295684475685e-06,
+ 9.44631484145475e-09,
+ 9.393840372240447e-09,
+ 9.41009226096412e-09
+ ],
+ "gamma_dfa": 0.0005205844290685491,
+ "gamma_dfa_per_layer": [
+ 0.0003642886003945023,
+ 0.0018537556752562523,
+ 3.766161171370186e-05,
+ -0.00017336817109026015
+ ],
+ "acc_eval": 0.2392578125,
+ "loss_eval": 2.02734375,
+ "epoch": 53
+ },
+ {
+ "hidden_norms_cls": [
+ 47.602928161621094,
+ 35582280.0,
+ 41200288.0,
+ 44686488.0,
+ 47126900.0
+ ],
+ "hidden_norms_avg": [
+ 1139.965087890625,
+ 25657812.0,
+ 31984420.0,
+ 36722060.0,
+ 43681628.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047245126916095614,
+ 3.1708738412739024e-10,
+ 2.6278745846042284e-10,
+ 2.6274540876336516e-10,
+ 2.6386243190401615e-10
+ ],
+ "bp_grad_F": [
+ 0.08141150325536728,
+ 1.0596501851978246e-05,
+ 1.0370135861137442e-08,
+ 1.0129613592368969e-08,
+ 9.407171930320146e-09
+ ],
+ "gamma_dfa": 0.00048223476824205136,
+ "gamma_dfa_per_layer": [
+ 0.00032963097328320146,
+ 0.00173661345615983,
+ 3.3767075365176424e-05,
+ -0.00017107243184000254
+ ],
+ "acc_eval": 0.251953125,
+ "loss_eval": 2.0290825366973877,
+ "epoch": 54
+ },
+ {
+ "hidden_norms_cls": [
+ 47.62870788574219,
+ 36373308.0,
+ 42049216.0,
+ 45803868.0,
+ 47955172.0
+ ],
+ "hidden_norms_avg": [
+ 1140.6492919921875,
+ 25698864.0,
+ 31990548.0,
+ 36707920.0,
+ 43700336.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004157091898377985,
+ 3.1451533044624114e-10,
+ 2.6160756894100246e-10,
+ 2.62937283057596e-10,
+ 2.633904483406724e-10
+ ],
+ "bp_grad_F": [
+ 0.28710466623306274,
+ 2.876764028769685e-06,
+ 9.405439982401731e-09,
+ 9.308096515781017e-09,
+ 9.319982119393444e-09
+ ],
+ "gamma_dfa": 0.00045457817577698734,
+ "gamma_dfa_per_layer": [
+ 0.00011597995762713253,
+ 0.0018383568385615945,
+ 3.561873018043116e-05,
+ -0.00017164282326120883
+ ],
+ "acc_eval": 0.2509765625,
+ "loss_eval": 2.0309882164001465,
+ "epoch": 55
+ },
+ {
+ "hidden_norms_cls": [
+ 47.646034240722656,
+ 35748556.0,
+ 41284136.0,
+ 44861788.0,
+ 47367128.0
+ ],
+ "hidden_norms_avg": [
+ 1141.1492919921875,
+ 25812252.0,
+ 32106642.0,
+ 36789100.0,
+ 43809728.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004877470782957971,
+ 3.1724206595029614e-10,
+ 2.6251881224403917e-10,
+ 2.627319750647672e-10,
+ 2.634734097561875e-10
+ ],
+ "bp_grad_F": [
+ 0.08355043828487396,
+ 2.428784682706464e-06,
+ 9.579466109244095e-09,
+ 9.378172016738517e-09,
+ 9.3862775329967e-09
+ ],
+ "gamma_dfa": 0.0006408758436009521,
+ "gamma_dfa_per_layer": [
+ 0.0009491340606473386,
+ 0.0017479720991104841,
+ 4.02485384256579e-05,
+ -0.00017385132377967238
+ ],
+ "acc_eval": 0.2451171875,
+ "loss_eval": 2.030231475830078,
+ "epoch": 56
+ },
+ {
+ "hidden_norms_cls": [
+ 47.65734100341797,
+ 35952124.0,
+ 41526152.0,
+ 45192104.0,
+ 47596588.0
+ ],
+ "hidden_norms_avg": [
+ 1141.4708251953125,
+ 25858530.0,
+ 32145604.0,
+ 36816776.0,
+ 43830904.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004684069426730275,
+ 3.1406693912217065e-10,
+ 2.6245111639511265e-10,
+ 2.628100792545496e-10,
+ 2.632017381820617e-10
+ ],
+ "bp_grad_F": [
+ 0.16165603697299957,
+ 3.1715710520074936e-06,
+ 1.017021755700398e-08,
+ 9.52006651289139e-09,
+ 9.360165087457517e-09
+ ],
+ "gamma_dfa": 0.0005993541035422822,
+ "gamma_dfa_per_layer": [
+ 0.0007396150031127036,
+ 0.0017993964720517397,
+ 3.345730510773137e-05,
+ -0.00017505236610304564
+ ],
+ "acc_eval": 0.2529296875,
+ "loss_eval": 2.030412197113037,
+ "epoch": 57
+ },
+ {
+ "hidden_norms_cls": [
+ 47.6636962890625,
+ 36249912.0,
+ 41976852.0,
+ 45623612.0,
+ 47785064.0
+ ],
+ "hidden_norms_avg": [
+ 1141.6495361328125,
+ 25785932.0,
+ 32065610.0,
+ 36745760.0,
+ 43805624.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047133295447565615,
+ 3.155541938859585e-10,
+ 2.617887573386213e-10,
+ 2.615481442536094e-10,
+ 2.6276933406954583e-10
+ ],
+ "bp_grad_F": [
+ 0.09146469831466675,
+ 1.8705788988881977e-06,
+ 9.432087999527994e-09,
+ 9.323818161988129e-09,
+ 9.325629157785897e-09
+ ],
+ "gamma_dfa": 0.0005754136018367717,
+ "gamma_dfa_per_layer": [
+ 0.0005892712506465614,
+ 0.0018461447907611728,
+ 3.762807318707928e-05,
+ -0.00017138970724772662
+ ],
+ "acc_eval": 0.251953125,
+ "loss_eval": 2.031130790710449,
+ "epoch": 58
+ },
+ {
+ "hidden_norms_cls": [
+ 47.66678237915039,
+ 36057328.0,
+ 41647260.0,
+ 45391196.0,
+ 47626604.0
+ ],
+ "hidden_norms_avg": [
+ 1141.7391357421875,
+ 25717830.0,
+ 31995718.0,
+ 36684084.0,
+ 43781820.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.00047832890413701534,
+ 3.149952798597866e-10,
+ 2.614737593109595e-10,
+ 2.6173804790197153e-10,
+ 2.6257329643897265e-10
+ ],
+ "bp_grad_F": [
+ 0.16335515677928925,
+ 1.6483251101817586e-06,
+ 9.493151154060797e-09,
+ 9.393547273361946e-09,
+ 9.338456230523207e-09
+ ],
+ "gamma_dfa": 0.0005906115802645218,
+ "gamma_dfa_per_layer": [
+ 0.0007219060207717121,
+ 0.0017734188586473465,
+ 3.73886723536998e-05,
+ -0.00017026723071467131
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.0293946266174316,
+ "epoch": 59
+ },
+ {
+ "hidden_norms_cls": [
+ 47.666595458984375,
+ 36029164.0,
+ 41621316.0,
+ 45328004.0,
+ 47606828.0
+ ],
+ "hidden_norms_avg": [
+ 1141.736328125,
+ 25716872.0,
+ 31991962.0,
+ 36680384.0,
+ 43781988.0
+ ],
+ "bp_grad_per_sample_l2_med": [
+ 0.0004811616672668606,
+ 3.1537170097628575e-10,
+ 2.6223428983840336e-10,
+ 2.6155200227861997e-10,
+ 2.6258059615535956e-10
+ ],
+ "bp_grad_F": [
+ 0.0951727032661438,
+ 1.623439857212361e-06,
+ 9.415242807619961e-09,
+ 9.343901652414388e-09,
+ 9.342033813197759e-09
+ ],
+ "gamma_dfa": 0.000660182828141842,
+ "gamma_dfa_per_layer": [
+ 0.0009655870962888002,
+ 0.0018112185643985868,
+ 3.598399052862078e-05,
+ -0.00017205833864863962
+ ],
+ "acc_eval": 0.255859375,
+ "loss_eval": 2.029409408569336,
+ "epoch": 60
+ }
+ ]
+} \ No newline at end of file