diff options
Diffstat (limited to 'results/snapshot_vit_v1/snapshot_vit_s42.json')
| -rw-r--r-- | results/snapshot_vit_v1/snapshot_vit_s42.json | 4594 |
1 files changed, 4594 insertions, 0 deletions
diff --git a/results/snapshot_vit_v1/snapshot_vit_s42.json b/results/snapshot_vit_v1/snapshot_vit_s42.json new file mode 100644 index 0000000..569af46 --- /dev/null +++ b/results/snapshot_vit_v1/snapshot_vit_s42.json @@ -0,0 +1,4594 @@ +{ + "config": { + "output_dir": "results/snapshot_vit_v1", + "epochs": 60, + "lr": 0.001, + "wd": 0.05, + "seed": 42, + "depth": 4, + "d_model": 128, + "n_heads": 4 + }, + "depth": 4, + "d_model": 128, + "architecture": "ViTMini", + "bp_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "hidden_norms_avg": [ + 6.008513927459717, + 7.034290313720703, + 7.942849636077881, + 8.915729522705078, + 9.635361671447754 + ], + "bp_grad_per_sample_l2_med": [ + 0.004442029166966677, + 0.0012008437188342214, + 0.0009976272704079747, + 0.0009104337659664452, + 0.0008558662957511842 + ], + "bp_grad_F": [ + 0.18535660207271576, + 0.03968670591711998, + 0.032604776322841644, + 0.029427478089928627, + 0.02746850810945034 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.1376953125, + "loss_eval": 2.35188627243042, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 0.511958122253418, + 12.453446388244629, + 18.366989135742188, + 25.54116439819336, + 31.80699348449707 + ], + "hidden_norms_avg": [ + 4.10694694519043, + 10.166566848754883, + 14.66998291015625, + 19.93342399597168, + 25.32619857788086 + ], + "bp_grad_per_sample_l2_med": [ + 0.0019771556835621595, + 0.00022324378369376063, + 0.00016308785416185856, + 0.00014621105219703168, + 0.0001451292191632092 + ], + "bp_grad_F": [ + 0.11066891252994537, + 0.01034498494118452, + 0.006372526753693819, + 0.0052248528227210045, + 0.005017552524805069 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.4501953125, + "loss_eval": 1.5154438018798828, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 0.6518111824989319, + 13.549692153930664, + 20.607715606689453, + 27.90418243408203, + 32.70498275756836 + ], + "hidden_norms_avg": [ + 4.0909905433654785, + 11.942686080932617, + 17.39116096496582, + 22.200014114379883, + 26.230010986328125 + ], + "bp_grad_per_sample_l2_med": [ + 0.0017800139030441642, + 0.00026728332159109414, + 0.0001720335567370057, + 0.0001423172070644796, + 0.00013423117343336344 + ], + "bp_grad_F": [ + 0.08781559765338898, + 0.010987765155732632, + 0.0064147054217755795, + 0.0050079175271093845, + 0.004637593869119883 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.494140625, + "loss_eval": 1.3824832439422607, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 0.755299985408783, + 11.224863052368164, + 19.053363800048828, + 27.303081512451172, + 33.078182220458984 + ], + "hidden_norms_avg": [ + 4.027151584625244, + 12.449769973754883, + 17.769508361816406, + 22.97556495666504, + 27.065759658813477 + ], + "bp_grad_per_sample_l2_med": [ + 0.0018998769810423255, + 0.00030996452551335096, + 0.00018013815861195326, + 0.0001340982416877523, + 0.00012205552775412798 + ], + "bp_grad_F": [ + 0.09037011116743088, + 0.013488140888512135, + 0.007346263621002436, + 0.0051797907799482346, + 0.004589984193444252 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.5439453125, + "loss_eval": 1.2540550231933594, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 0.844818651676178, + 13.648336410522461, + 20.277976989746094, + 28.240915298461914, + 33.095726013183594 + ], + "hidden_norms_avg": [ + 4.036877632141113, + 12.003630638122559, + 17.05451011657715, + 22.15869903564453, + 25.917491912841797 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016167981084436178, + 0.00028610811568796635, + 0.0001777650322765112, + 0.00012878721463494003, + 0.0001112063619075343 + ], + "bp_grad_F": [ + 0.07410340011119843, + 0.012637714855372906, + 0.007633093744516373, + 0.005242784973233938, + 0.004431390203535557 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.1045944690704346, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 0.9051892161369324, + 12.476008415222168, + 19.24710464477539, + 27.6123046875, + 32.35737609863281 + ], + "hidden_norms_avg": [ + 4.138596057891846, + 12.409324645996094, + 17.427003860473633, + 22.245147705078125, + 25.471385955810547 + ], + "bp_grad_per_sample_l2_med": [ + 0.0016044765943661332, + 0.00030248358962126076, + 0.00018807635933626443, + 0.00013626758300233632, + 0.00011398641800042242 + ], + "bp_grad_F": [ + 0.08322811126708984, + 0.01390017382800579, + 0.008505746722221375, + 0.005747759714722633, + 0.004776888992637396 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.1296963691711426, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 0.9687634110450745, + 11.625859260559082, + 18.38014793395996, + 26.869504928588867, + 31.455507278442383 + ], + "hidden_norms_avg": [ + 4.263001441955566, + 13.1234769821167, + 17.853057861328125, + 22.476547241210938, + 25.29656410217285 + ], + "bp_grad_per_sample_l2_med": [ + 0.0015340449754148722, + 0.00033552697277627885, + 0.00021536082203965634, + 0.00015067037020344287, + 0.00012220896314829588 + ], + "bp_grad_F": [ + 0.07571946829557419, + 0.015132292173802853, + 0.009512492455542088, + 0.006373303942382336, + 0.005029390100389719 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.603515625, + "loss_eval": 1.0963702201843262, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 1.0029383897781372, + 12.687585830688477, + 19.734830856323242, + 28.174379348754883, + 32.5982780456543 + ], + "hidden_norms_avg": [ + 4.357974052429199, + 13.182960510253906, + 17.720989227294922, + 21.832895278930664, + 24.934776306152344 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013370191445574164, + 0.00026788320974446833, + 0.00018144956266041845, + 0.00013219293032307178, + 0.00010196284711128101 + ], + "bp_grad_F": [ + 0.06996501982212067, + 0.013071151450276375, + 0.008477694354951382, + 0.0061036222614347935, + 0.004761465825140476 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6416015625, + "loss_eval": 0.9737913012504578, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 1.043707013130188, + 12.487404823303223, + 18.845643997192383, + 26.870864868164062, + 31.145292282104492 + ], + "hidden_norms_avg": [ + 4.454991340637207, + 13.503378868103027, + 18.694488525390625, + 23.029804229736328, + 25.810880661010742 + ], + "bp_grad_per_sample_l2_med": [ + 0.0013130803126841784, + 0.00029930632445029914, + 0.0002022052649408579, + 0.0001383959170198068, + 0.00010439592006150633 + ], + "bp_grad_F": [ + 0.0743240937590599, + 0.015402271412312984, + 0.009977605193853378, + 0.006877230014652014, + 0.005202346481382847 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.666015625, + "loss_eval": 0.9317076206207275, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 1.0887501239776611, + 12.662396430969238, + 18.622724533081055, + 26.599454879760742, + 31.788663864135742 + ], + "hidden_norms_avg": [ + 4.529710292816162, + 13.683384895324707, + 18.47463607788086, + 22.395898818969727, + 25.244558334350586 + ], + "bp_grad_per_sample_l2_med": [ + 0.0012017677072435617, + 0.0002972102665808052, + 0.00019775003602262586, + 0.00013734954700339586, + 9.880279685603455e-05 + ], + "bp_grad_F": [ + 0.0661192312836647, + 0.01516024675220251, + 0.010001113638281822, + 0.006893018260598183, + 0.0051134442910552025 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6669921875, + "loss_eval": 0.9026263952255249, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 1.1163448095321655, + 12.711283683776855, + 18.790128707885742, + 26.846359252929688, + 31.663158416748047 + ], + "hidden_norms_avg": [ + 4.502295970916748, + 13.801639556884766, + 18.488975524902344, + 22.378704071044922, + 25.22056007385254 + ], + "bp_grad_per_sample_l2_med": [ + 0.0011062510311603546, + 0.00029147896566428244, + 0.0001970102748600766, + 0.00013174059859011322, + 0.0001037597976392135 + ], + "bp_grad_F": [ + 0.06217500939965248, + 0.014721231535077095, + 0.00993143580853939, + 0.006723989732563496, + 0.005166618153452873 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.6845703125, + "loss_eval": 0.8660677671432495, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 1.1505078077316284, + 12.160571098327637, + 18.15353012084961, + 25.762012481689453, + 31.478300094604492 + ], + "hidden_norms_avg": [ + 4.5605149269104, + 13.918573379516602, + 18.88881492614746, + 22.79344940185547, + 25.800094604492188 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009689349099062383, + 0.0002486997109372169, + 0.0001736732665449381, + 0.00011473154881969094, + 8.573567902203649e-05 + ], + "bp_grad_F": [ + 0.06455213576555252, + 0.01547171175479889, + 0.010573537088930607, + 0.0071961241774261, + 0.005212985444813967 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.71484375, + "loss_eval": 0.812907874584198, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 1.1844152212142944, + 11.332664489746094, + 16.57625961303711, + 23.82307243347168, + 28.492321014404297 + ], + "hidden_norms_avg": [ + 4.602160453796387, + 13.876313209533691, + 17.891036987304688, + 21.410982131958008, + 23.97108268737793 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009290817542932928, + 0.0002613075776025653, + 0.0001877332106232643, + 0.0001262558507733047, + 9.168039832729846e-05 + ], + "bp_grad_F": [ + 0.06392678618431091, + 0.01674485206604004, + 0.011727217584848404, + 0.007738997228443623, + 0.005730107892304659 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7197265625, + "loss_eval": 0.7641609907150269, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 1.2184560298919678, + 12.450925827026367, + 18.076860427856445, + 25.162586212158203, + 30.365047454833984 + ], + "hidden_norms_avg": [ + 4.7080278396606445, + 13.851634979248047, + 18.517131805419922, + 22.074214935302734, + 24.72054100036621 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009277731878682971, + 0.00024563330225646496, + 0.00017736255540512502, + 0.00012202116340631619, + 8.748921391088516e-05 + ], + "bp_grad_F": [ + 0.06389915198087692, + 0.016115156933665276, + 0.0110858753323555, + 0.0076499818824231625, + 0.005541808437556028 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.697265625, + "loss_eval": 0.8037601113319397, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 1.243064045906067, + 11.932015419006348, + 17.215856552124023, + 24.764291763305664, + 29.49314308166504 + ], + "hidden_norms_avg": [ + 4.651937961578369, + 13.890728950500488, + 18.2476749420166, + 21.80103302001953, + 24.145692825317383 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009111211402341723, + 0.000253814272582531, + 0.00018247529806103557, + 0.00011639296280918643, + 8.364167297258973e-05 + ], + "bp_grad_F": [ + 0.06324896216392517, + 0.016394753009080887, + 0.01153184287250042, + 0.007614497095346451, + 0.0056136660277843475 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.728515625, + "loss_eval": 0.7384279370307922, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 1.2652677297592163, + 11.532588005065918, + 16.7224178314209, + 23.326444625854492, + 28.03766441345215 + ], + "hidden_norms_avg": [ + 4.652615547180176, + 13.981542587280273, + 17.984512329101562, + 21.317432403564453, + 23.233760833740234 + ], + "bp_grad_per_sample_l2_med": [ + 0.0008032417972572148, + 0.00022395161795429885, + 0.00016904002404771745, + 0.0001078559216693975, + 7.841538899810985e-05 + ], + "bp_grad_F": [ + 0.06386830657720566, + 0.016731705516576767, + 0.012135310098528862, + 0.008108492009341717, + 0.006046997383236885 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7333984375, + "loss_eval": 0.7387630939483643, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 1.2944419384002686, + 11.34481430053711, + 16.45362091064453, + 22.63861846923828, + 28.011232376098633 + ], + "hidden_norms_avg": [ + 4.738389015197754, + 13.769956588745117, + 17.63072395324707, + 21.14189338684082, + 23.455045700073242 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007927753031253815, + 0.0002345799293834716, + 0.00016934113227762282, + 0.00011508075840538368, + 7.966109114931896e-05 + ], + "bp_grad_F": [ + 0.0655454769730568, + 0.01815187744796276, + 0.013005951419472694, + 0.008820701390504837, + 0.006184164900332689 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7255859375, + "loss_eval": 0.7302451133728027, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 1.3085625171661377, + 11.323317527770996, + 15.866230964660645, + 21.746976852416992, + 27.081127166748047 + ], + "hidden_norms_avg": [ + 4.687533855438232, + 13.471115112304688, + 17.396968841552734, + 20.327377319335938, + 22.58539581298828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006625292589887977, + 0.00019486426026560366, + 0.00014659677981399, + 9.787825547391549e-05, + 6.321907130768523e-05 + ], + "bp_grad_F": [ + 0.07393868267536163, + 0.020178642123937607, + 0.014442694373428822, + 0.009784683585166931, + 0.00656729843467474 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7412109375, + "loss_eval": 0.7063955068588257, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 1.3433176279067993, + 10.762125968933105, + 15.129413604736328, + 21.06867790222168, + 26.1944522857666 + ], + "hidden_norms_avg": [ + 4.709607124328613, + 13.69739055633545, + 17.006061553955078, + 19.97213363647461, + 22.212177276611328 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006978239398449659, + 0.00021396303782239556, + 0.00016030693950597197, + 0.00010856003791559488, + 6.917239079484716e-05 + ], + "bp_grad_F": [ + 0.06653428077697754, + 0.019508732482790947, + 0.014456766657531261, + 0.010107609443366528, + 0.006681134924292564 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.75, + "loss_eval": 0.6990396976470947, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 1.3607734441757202, + 10.718966484069824, + 15.383923530578613, + 21.34387969970703, + 26.49329376220703 + ], + "hidden_norms_avg": [ + 4.7122907638549805, + 13.804581642150879, + 17.532636642456055, + 20.843929290771484, + 23.01592254638672 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007053805165924132, + 0.0002122409496223554, + 0.00016182110994122922, + 0.00011085433652624488, + 7.204789289971814e-05 + ], + "bp_grad_F": [ + 0.06105736270546913, + 0.017779415473341942, + 0.013269647024571896, + 0.009227588772773743, + 0.006410240661352873 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.6498311758041382, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 1.3752704858779907, + 10.530582427978516, + 14.803340911865234, + 20.217910766601562, + 25.20522689819336 + ], + "hidden_norms_avg": [ + 4.7595720291137695, + 13.601245880126953, + 17.491943359375, + 20.960437774658203, + 22.910301208496094 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006476694834418595, + 0.00020479912927839905, + 0.0001524801627965644, + 0.00010630583710735664, + 6.906194903422147e-05 + ], + "bp_grad_F": [ + 0.06572327762842178, + 0.019566379487514496, + 0.01484121847897768, + 0.010426007211208344, + 0.006943442393094301 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.763671875, + "loss_eval": 0.6451045274734497, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 1.394100546836853, + 9.805717468261719, + 14.102628707885742, + 19.18745231628418, + 24.205224990844727 + ], + "hidden_norms_avg": [ + 4.746951580047607, + 13.343804359436035, + 16.609134674072266, + 19.829851150512695, + 21.580671310424805 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006192427244968712, + 0.0002108582411892712, + 0.0001636892993701622, + 0.0001098570428439416, + 6.864540046080947e-05 + ], + "bp_grad_F": [ + 0.06809430569410324, + 0.02151457779109478, + 0.01606965810060501, + 0.011247958056628704, + 0.007375919260084629 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7705078125, + "loss_eval": 0.6522111892700195, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 1.4160058498382568, + 9.728543281555176, + 13.389554977416992, + 18.542705535888672, + 23.791994094848633 + ], + "hidden_norms_avg": [ + 4.738738536834717, + 13.15449333190918, + 16.28533172607422, + 19.581254959106445, + 21.488550186157227 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006278376094996929, + 0.00020051853789482266, + 0.00015803576388861984, + 0.0001043542506522499, + 6.271857273532078e-05 + ], + "bp_grad_F": [ + 0.07535671442747116, + 0.02472539246082306, + 0.01880054548382759, + 0.012977317906916142, + 0.007879889570176601 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.767578125, + "loss_eval": 0.6732022762298584, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 1.4301073551177979, + 9.656251907348633, + 13.501574516296387, + 18.518707275390625, + 23.49370574951172 + ], + "hidden_norms_avg": [ + 4.7338972091674805, + 12.90231704711914, + 15.899849891662598, + 18.982860565185547, + 20.785310745239258 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005697127780877054, + 0.00018775691569317132, + 0.00014216902491170913, + 9.182754729408771e-05, + 5.984708695905283e-05 + ], + "bp_grad_F": [ + 0.07130222022533417, + 0.023520665243268013, + 0.017786188051104546, + 0.012143870815634727, + 0.007813607342541218 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7763671875, + "loss_eval": 0.6380050182342529, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 1.4623057842254639, + 10.028787612915039, + 13.687016487121582, + 18.426584243774414, + 23.602413177490234 + ], + "hidden_norms_avg": [ + 4.807516574859619, + 12.739899635314941, + 16.150466918945312, + 19.439754486083984, + 21.316791534423828 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005416463245637715, + 0.00019103426893707365, + 0.00014568559709005058, + 9.899997530737892e-05, + 6.29485584795475e-05 + ], + "bp_grad_F": [ + 0.07191846519708633, + 0.023787740617990494, + 0.01782786287367344, + 0.012350695207715034, + 0.007955120876431465 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7841796875, + "loss_eval": 0.6439570784568787, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 1.4565976858139038, + 9.294268608093262, + 12.656200408935547, + 17.385971069335938, + 21.959299087524414 + ], + "hidden_norms_avg": [ + 4.774696350097656, + 12.394432067871094, + 15.230389595031738, + 18.10796356201172, + 19.88006591796875 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005462650442495942, + 0.00019751323270611465, + 0.00015244862879626453, + 0.00010562407260295004, + 6.40779035165906e-05 + ], + "bp_grad_F": [ + 0.07698184996843338, + 0.026412304490804672, + 0.02022000029683113, + 0.013991317711770535, + 0.008763212710618973 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7568359375, + "loss_eval": 0.6531677842140198, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 1.4813296794891357, + 9.043482780456543, + 12.308734893798828, + 16.513948440551758, + 21.061283111572266 + ], + "hidden_norms_avg": [ + 4.7356462478637695, + 12.33294677734375, + 15.104657173156738, + 17.771398544311523, + 19.526002883911133 + ], + "bp_grad_per_sample_l2_med": [ + 0.000557436200324446, + 0.0002021614054683596, + 0.0001567570143379271, + 0.00010984922846546397, + 6.634221062995493e-05 + ], + "bp_grad_F": [ + 0.07777652144432068, + 0.027695877477526665, + 0.021396547555923462, + 0.015052770264446735, + 0.009372876025736332 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7744140625, + "loss_eval": 0.6539995074272156, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 1.4828969240188599, + 8.677760124206543, + 12.009501457214355, + 16.262908935546875, + 20.79404067993164 + ], + "hidden_norms_avg": [ + 4.744379043579102, + 12.125540733337402, + 14.89413833618164, + 17.47431182861328, + 18.953710556030273 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005026232684031129, + 0.00019721532589755952, + 0.00014348917466122657, + 0.00010225686855847016, + 5.8645866374718025e-05 + ], + "bp_grad_F": [ + 0.0830698236823082, + 0.03011341392993927, + 0.023107260465621948, + 0.016188694164156914, + 0.00968033168464899 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7744140625, + "loss_eval": 0.6444424390792847, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 1.5019822120666504, + 9.1107816696167, + 12.172623634338379, + 16.5975341796875, + 20.453947067260742 + ], + "hidden_norms_avg": [ + 4.741573333740234, + 12.045503616333008, + 14.836026191711426, + 17.666833877563477, + 19.175966262817383 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005040269461460412, + 0.00019225970027036965, + 0.0001496450131526217, + 0.00010478955664439127, + 6.137428135843948e-05 + ], + "bp_grad_F": [ + 0.07822537422180176, + 0.02863621897995472, + 0.022284477949142456, + 0.01552330981940031, + 0.009474868886172771 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.6074927449226379, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 1.5009087324142456, + 8.223862648010254, + 11.225082397460938, + 15.531359672546387, + 19.848068237304688 + ], + "hidden_norms_avg": [ + 4.69788122177124, + 11.848491668701172, + 14.342337608337402, + 16.882020950317383, + 18.197385787963867 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004685261519625783, + 0.00017912790644913912, + 0.00013862684136256576, + 9.223359666066244e-05, + 5.140554640092887e-05 + ], + "bp_grad_F": [ + 0.09127916395664215, + 0.03443564847111702, + 0.026544470340013504, + 0.01809101179242134, + 0.010493002831935883 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.6329880952835083, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 1.509100079536438, + 8.238924980163574, + 10.995248794555664, + 14.927000045776367, + 19.032428741455078 + ], + "hidden_norms_avg": [ + 4.678654193878174, + 11.513160705566406, + 14.12202262878418, + 16.704364776611328, + 18.131078720092773 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004594121128320694, + 0.00018182865460403264, + 0.000145129015436396, + 0.00010142508108401671, + 5.208289803704247e-05 + ], + "bp_grad_F": [ + 0.09080124646425247, + 0.03489048779010773, + 0.027099598199129105, + 0.018760183826088905, + 0.010796112939715385 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7822265625, + "loss_eval": 0.625268816947937, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 1.503785252571106, + 7.896090030670166, + 10.495330810546875, + 14.530640602111816, + 18.728647232055664 + ], + "hidden_norms_avg": [ + 4.70166540145874, + 11.420204162597656, + 13.774767875671387, + 16.2652530670166, + 17.631481170654297 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043488750816322863, + 0.00017315168224740773, + 0.0001335645210929215, + 8.99006481631659e-05, + 5.126056930748746e-05 + ], + "bp_grad_F": [ + 0.10076858103275299, + 0.039271026849746704, + 0.0300181582570076, + 0.020545953884720802, + 0.011564387008547783 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.771484375, + "loss_eval": 0.6479744911193848, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 1.505173921585083, + 7.728392124176025, + 10.420252799987793, + 14.133453369140625, + 18.110719680786133 + ], + "hidden_norms_avg": [ + 4.7109880447387695, + 11.242951393127441, + 13.997397422790527, + 16.60598373413086, + 17.915313720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00040974540752358735, + 0.0001792571711121127, + 0.00014464404375758022, + 9.883226448437199e-05, + 5.038536983192898e-05 + ], + "bp_grad_F": [ + 0.09923475980758667, + 0.039516862481832504, + 0.03056514263153076, + 0.021311543881893158, + 0.011838918551802635 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7880859375, + "loss_eval": 0.6011433601379395, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 1.5013800859451294, + 7.8755106925964355, + 10.452071189880371, + 14.013816833496094, + 17.622900009155273 + ], + "hidden_norms_avg": [ + 4.662457466125488, + 11.018245697021484, + 13.179399490356445, + 15.56103515625, + 16.739452362060547 + ], + "bp_grad_per_sample_l2_med": [ + 0.00033098450512625277, + 0.0001421417691744864, + 0.00011021740647265688, + 7.645406731171533e-05, + 4.017115134047344e-05 + ], + "bp_grad_F": [ + 0.09463275969028473, + 0.03948793560266495, + 0.03067062795162201, + 0.021538278087973595, + 0.012101472355425358 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8076171875, + "loss_eval": 0.5846524238586426, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 1.5032685995101929, + 7.549060344696045, + 10.04562759399414, + 13.609556198120117, + 17.36180877685547 + ], + "hidden_norms_avg": [ + 4.688360214233398, + 11.03510856628418, + 13.660865783691406, + 16.024188995361328, + 17.242145538330078 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003352685598656535, + 0.0001500560319982469, + 0.000116633229481522, + 8.394405449507758e-05, + 4.0652244933880866e-05 + ], + "bp_grad_F": [ + 0.10540100187063217, + 0.044482193887233734, + 0.03421863541007042, + 0.023781608790159225, + 0.012753129936754704 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7861328125, + "loss_eval": 0.5960580110549927, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 1.5032752752304077, + 7.387601375579834, + 9.652260780334473, + 13.042936325073242, + 16.688335418701172 + ], + "hidden_norms_avg": [ + 4.644099235534668, + 10.739524841308594, + 13.165095329284668, + 15.435381889343262, + 16.59172248840332 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003447248600423336, + 0.0001518868375569582, + 0.00012246235564816743, + 8.41514120111242e-05, + 4.193704080535099e-05 + ], + "bp_grad_F": [ + 0.11063266545534134, + 0.04730832949280739, + 0.03743334487080574, + 0.02577192150056362, + 0.01377912238240242 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.78515625, + "loss_eval": 0.652167797088623, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 1.4935848712921143, + 7.262828826904297, + 9.431328773498535, + 12.742668151855469, + 16.348758697509766 + ], + "hidden_norms_avg": [ + 4.6145453453063965, + 10.670759201049805, + 12.641580581665039, + 14.64714241027832, + 15.685794830322266 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003325030847918242, + 0.00014367286348715425, + 0.00011324919614708051, + 7.871988782426342e-05, + 4.058879494550638e-05 + ], + "bp_grad_F": [ + 0.11436768621206284, + 0.04893247410655022, + 0.03840672969818115, + 0.02707456797361374, + 0.014087510295212269 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7978515625, + "loss_eval": 0.6156834363937378, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 1.4897189140319824, + 7.156031608581543, + 9.365946769714355, + 12.499292373657227, + 15.942588806152344 + ], + "hidden_norms_avg": [ + 4.635710716247559, + 10.602685928344727, + 12.637743949890137, + 14.74621868133545, + 15.834792137145996 + ], + "bp_grad_per_sample_l2_med": [ + 0.000299928622553125, + 0.00013245265290606767, + 0.00010241761629004031, + 7.247657049447298e-05, + 3.780105180339888e-05 + ], + "bp_grad_F": [ + 0.11267601698637009, + 0.0501401461660862, + 0.03941003605723381, + 0.0279407799243927, + 0.014723201282322407 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.80078125, + "loss_eval": 0.5903886556625366, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 1.4791479110717773, + 7.027911186218262, + 9.0321044921875, + 12.123476028442383, + 15.987238883972168 + ], + "hidden_norms_avg": [ + 4.5436177253723145, + 10.157598495483398, + 12.115620613098145, + 14.023022651672363, + 15.130277633666992 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002464659046381712, + 0.00011603213351918384, + 9.401622082805261e-05, + 6.44488463876769e-05, + 2.8129303245805204e-05 + ], + "bp_grad_F": [ + 0.1319781094789505, + 0.05854209512472153, + 0.04639327526092529, + 0.03260229155421257, + 0.01578359492123127 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7841796875, + "loss_eval": 0.6532921195030212, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 1.4722236394882202, + 6.847982406616211, + 9.039284706115723, + 11.94421672821045, + 15.479789733886719 + ], + "hidden_norms_avg": [ + 4.536457538604736, + 10.0848388671875, + 11.944480895996094, + 13.931117057800293, + 15.018562316894531 + ], + "bp_grad_per_sample_l2_med": [ + 0.00023636725381948054, + 0.00011084756260970607, + 8.837366476655006e-05, + 6.370043411152437e-05, + 3.0101380616542883e-05 + ], + "bp_grad_F": [ + 0.1352969855070114, + 0.06069062277674675, + 0.04737559333443642, + 0.03317096084356308, + 0.016367904841899872 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7783203125, + "loss_eval": 0.6675163507461548, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 1.4741134643554688, + 6.7887864112854, + 8.833945274353027, + 11.777705192565918, + 15.091635704040527 + ], + "hidden_norms_avg": [ + 4.546427249908447, + 10.082904815673828, + 11.992964744567871, + 14.035684585571289, + 15.085047721862793 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002497230307199061, + 0.00011889061715919524, + 9.627552208257839e-05, + 6.80557859595865e-05, + 3.187589391018264e-05 + ], + "bp_grad_F": [ + 0.13283543288707733, + 0.06097453087568283, + 0.047521013766527176, + 0.033583469688892365, + 0.016502397134900093 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7998046875, + "loss_eval": 0.6332878470420837, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 1.4732073545455933, + 6.690948009490967, + 8.623305320739746, + 11.383458137512207, + 14.868409156799316 + ], + "hidden_norms_avg": [ + 4.510478973388672, + 9.772372245788574, + 11.55829906463623, + 13.379657745361328, + 14.343344688415527 + ], + "bp_grad_per_sample_l2_med": [ + 0.00019870084361173213, + 0.00010116927296621725, + 8.329773845616728e-05, + 6.15280878264457e-05, + 2.8435944841476157e-05 + ], + "bp_grad_F": [ + 0.13917136192321777, + 0.06636927276849747, + 0.05231080949306488, + 0.0366261750459671, + 0.017451239749789238 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8017578125, + "loss_eval": 0.6271109580993652, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 1.4620546102523804, + 6.489831924438477, + 8.487679481506348, + 11.202116966247559, + 14.761962890625 + ], + "hidden_norms_avg": [ + 4.5009870529174805, + 9.717012405395508, + 11.480990409851074, + 13.235471725463867, + 14.178875923156738 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015383858408313245, + 8.131976937875152e-05, + 6.472255336120725e-05, + 4.378501034807414e-05, + 1.9541592337191105e-05 + ], + "bp_grad_F": [ + 0.1546960175037384, + 0.07402726262807846, + 0.058267489075660706, + 0.041084613651037216, + 0.018521569669246674 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.794921875, + "loss_eval": 0.6767467260360718, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 1.4651520252227783, + 6.564362525939941, + 8.296653747558594, + 11.014183044433594, + 14.418519973754883 + ], + "hidden_norms_avg": [ + 4.483984470367432, + 9.593335151672363, + 11.23758316040039, + 13.036303520202637, + 14.015531539916992 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002037636877503246, + 0.00010235400259261951, + 8.395169425057247e-05, + 5.674947897205129e-05, + 2.5295201339758933e-05 + ], + "bp_grad_F": [ + 0.15471766889095306, + 0.07422170042991638, + 0.05941145122051239, + 0.04111991077661514, + 0.018912144005298615 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8037109375, + "loss_eval": 0.6682149171829224, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 1.457137107849121, + 6.368557929992676, + 8.152215957641602, + 10.783031463623047, + 14.167640686035156 + ], + "hidden_norms_avg": [ + 4.462830066680908, + 9.585762977600098, + 11.208064079284668, + 13.065739631652832, + 13.993027687072754 + ], + "bp_grad_per_sample_l2_med": [ + 0.00016671593766659498, + 8.65811962285079e-05, + 7.217681559268385e-05, + 5.042032353230752e-05, + 2.1260022549540736e-05 + ], + "bp_grad_F": [ + 0.15730538964271545, + 0.07605564594268799, + 0.06052647903561592, + 0.04247846081852913, + 0.01923321560025215 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8134765625, + "loss_eval": 0.6757298111915588, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 1.4529122114181519, + 6.260828018188477, + 8.032843589782715, + 10.586301803588867, + 13.950445175170898 + ], + "hidden_norms_avg": [ + 4.4613800048828125, + 9.4591646194458, + 11.012088775634766, + 12.760184288024902, + 13.692852973937988 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001344321499345824, + 6.65406696498394e-05, + 5.5920852901181206e-05, + 3.9107719203457236e-05, + 1.5611329217790626e-05 + ], + "bp_grad_F": [ + 0.1660272479057312, + 0.08182978630065918, + 0.06507853418588638, + 0.046549297869205475, + 0.020592277869582176 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.806640625, + "loss_eval": 0.685518205165863, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 1.4509673118591309, + 6.163156032562256, + 7.82518196105957, + 10.378498077392578, + 13.96407699584961 + ], + "hidden_norms_avg": [ + 4.434635162353516, + 9.335474967956543, + 10.857998847961426, + 12.551763534545898, + 13.511585235595703 + ], + "bp_grad_per_sample_l2_med": [ + 0.00011230952804908156, + 5.540825441130437e-05, + 4.5063996367389336e-05, + 2.9814285881002434e-05, + 1.1903831364179496e-05 + ], + "bp_grad_F": [ + 0.1772848516702652, + 0.08942516893148422, + 0.07126298546791077, + 0.04956020042300224, + 0.021146513521671295 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7958984375, + "loss_eval": 0.69295334815979, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 1.4527415037155151, + 6.165233612060547, + 7.756027698516846, + 10.242467880249023, + 13.45471477508545 + ], + "hidden_norms_avg": [ + 4.438976287841797, + 9.343517303466797, + 10.836493492126465, + 12.435514450073242, + 13.287426948547363 + ], + "bp_grad_per_sample_l2_med": [ + 0.0001074640967999585, + 5.268112363410182e-05, + 4.352951145847328e-05, + 3.164535519317724e-05, + 1.2792614143108949e-05 + ], + "bp_grad_F": [ + 0.17606250941753387, + 0.08888891339302063, + 0.07090400159358978, + 0.05056491121649742, + 0.021766021847724915 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.806640625, + "loss_eval": 0.6969807147979736, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 1.4455187320709229, + 6.104230880737305, + 7.606966972351074, + 10.056215286254883, + 13.531522750854492 + ], + "hidden_norms_avg": [ + 4.394144535064697, + 9.197455406188965, + 10.598797798156738, + 12.198134422302246, + 13.1181001663208 + ], + "bp_grad_per_sample_l2_med": [ + 9.084033081308007e-05, + 4.605063077178784e-05, + 3.957438457291573e-05, + 2.727917853917461e-05, + 1.0920393833657727e-05 + ], + "bp_grad_F": [ + 0.1919114887714386, + 0.09742862731218338, + 0.07786751538515091, + 0.05414625629782677, + 0.022070109844207764 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.810546875, + "loss_eval": 0.713995635509491, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 1.4383388757705688, + 6.067695617675781, + 7.595578670501709, + 9.960418701171875, + 13.367838859558105 + ], + "hidden_norms_avg": [ + 4.4121479988098145, + 9.207226753234863, + 10.62590217590332, + 12.186077117919922, + 13.054762840270996 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010577002831269056, + 5.2172203140798956e-05, + 4.119141885894351e-05, + 2.997498268086929e-05, + 1.1721556802513078e-05 + ], + "bp_grad_F": [ + 0.19711492955684662, + 0.09961695969104767, + 0.07941404730081558, + 0.05621125549077988, + 0.02285071834921837 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7998046875, + "loss_eval": 0.7457866668701172, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 1.438454270362854, + 6.097946643829346, + 7.5858659744262695, + 9.956851959228516, + 13.270756721496582 + ], + "hidden_norms_avg": [ + 4.392654895782471, + 9.144302368164062, + 10.536030769348145, + 12.092294692993164, + 12.985077857971191 + ], + "bp_grad_per_sample_l2_med": [ + 0.00010758326970972121, + 5.274294744594954e-05, + 4.421125413500704e-05, + 3.0753104510949925e-05, + 1.1889996130776126e-05 + ], + "bp_grad_F": [ + 0.19883227348327637, + 0.1017213836312294, + 0.0807848572731018, + 0.056292060762643814, + 0.022987989708781242 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7998046875, + "loss_eval": 0.7402137517929077, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 1.4367005825042725, + 6.004332542419434, + 7.504194259643555, + 9.782310485839844, + 13.125389099121094 + ], + "hidden_norms_avg": [ + 4.3845720291137695, + 9.06988525390625, + 10.41169548034668, + 11.905806541442871, + 12.784433364868164 + ], + "bp_grad_per_sample_l2_med": [ + 9.236831829184666e-05, + 4.803440242540091e-05, + 3.901722448063083e-05, + 2.752364525804296e-05, + 1.1449340490798932e-05 + ], + "bp_grad_F": [ + 0.19664740562438965, + 0.10213448107242584, + 0.08124449104070663, + 0.05709528177976608, + 0.023260990157723427 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8017578125, + "loss_eval": 0.732274055480957, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 1.4371269941329956, + 5.965888500213623, + 7.401495933532715, + 9.748833656311035, + 13.274619102478027 + ], + "hidden_norms_avg": [ + 4.380629539489746, + 9.019668579101562, + 10.396828651428223, + 11.923394203186035, + 12.77461051940918 + ], + "bp_grad_per_sample_l2_med": [ + 7.760760490782559e-05, + 4.048245318699628e-05, + 3.216555342078209e-05, + 2.2310470740194432e-05, + 8.838631401886232e-06 + ], + "bp_grad_F": [ + 0.20731569826602936, + 0.10790340602397919, + 0.08557390421628952, + 0.059937626123428345, + 0.023827020078897476 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8046875, + "loss_eval": 0.7751725316047668, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 1.4341260194778442, + 5.9393768310546875, + 7.411903381347656, + 9.739734649658203, + 13.19786548614502 + ], + "hidden_norms_avg": [ + 4.378067493438721, + 8.986294746398926, + 10.316237449645996, + 11.792922019958496, + 12.673585891723633 + ], + "bp_grad_per_sample_l2_med": [ + 6.968516390770674e-05, + 3.471451054792851e-05, + 2.8814916731789708e-05, + 1.9318980776006356e-05, + 7.639268915227149e-06 + ], + "bp_grad_F": [ + 0.2137812376022339, + 0.11110929399728775, + 0.08847261965274811, + 0.06186935305595398, + 0.024307044222950935 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8056640625, + "loss_eval": 0.764312744140625, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 1.4324616193771362, + 5.883492469787598, + 7.319663047790527, + 9.547243118286133, + 13.008822441101074 + ], + "hidden_norms_avg": [ + 4.376597881317139, + 8.99113941192627, + 10.321625709533691, + 11.771256446838379, + 12.628817558288574 + ], + "bp_grad_per_sample_l2_med": [ + 7.972177991177887e-05, + 3.871036460623145e-05, + 3.142197601846419e-05, + 2.2371379600372165e-05, + 8.571933904022444e-06 + ], + "bp_grad_F": [ + 0.21534259617328644, + 0.11241323500871658, + 0.08915204554796219, + 0.06287811696529388, + 0.024627922102808952 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7958984375, + "loss_eval": 0.7731261253356934, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 1.4321078062057495, + 5.858248710632324, + 7.306819915771484, + 9.56387996673584, + 13.071084022521973 + ], + "hidden_norms_avg": [ + 4.371452808380127, + 8.94082260131836, + 10.26811695098877, + 11.765360832214355, + 12.617104530334473 + ], + "bp_grad_per_sample_l2_med": [ + 7.236401870613918e-05, + 3.8528516597580165e-05, + 3.0984694603830576e-05, + 2.1565809220192023e-05, + 7.989257937879302e-06 + ], + "bp_grad_F": [ + 0.2197490781545639, + 0.1155213937163353, + 0.09188564866781235, + 0.06453806161880493, + 0.024861471727490425 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.7958984375, + "loss_eval": 0.7778797149658203, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 1.4319349527359009, + 5.846956253051758, + 7.283481121063232, + 9.520010948181152, + 13.023626327514648 + ], + "hidden_norms_avg": [ + 4.372097969055176, + 8.950923919677734, + 10.25277328491211, + 11.715353012084961, + 12.572748184204102 + ], + "bp_grad_per_sample_l2_med": [ + 6.399707490345463e-05, + 3.384953743079677e-05, + 2.7512824090081267e-05, + 1.8538266886025667e-05, + 7.2009356699709315e-06 + ], + "bp_grad_F": [ + 0.21942120790481567, + 0.11553706228733063, + 0.09221186488866806, + 0.06456339359283447, + 0.024819573387503624 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.798828125, + "loss_eval": 0.7808230519294739, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 1.4311723709106445, + 5.84969425201416, + 7.275974273681641, + 9.513206481933594, + 12.99256420135498 + ], + "hidden_norms_avg": [ + 4.37282133102417, + 8.946002006530762, + 10.248116493225098, + 11.702008247375488, + 12.54873275756836 + ], + "bp_grad_per_sample_l2_med": [ + 6.404191663023084e-05, + 3.509471571305767e-05, + 2.9476050258381292e-05, + 1.9310447896714322e-05, + 7.2306984293391e-06 + ], + "bp_grad_F": [ + 0.22379544377326965, + 0.11763197183609009, + 0.09364764392375946, + 0.06539658457040787, + 0.02503892220556736 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.80078125, + "loss_eval": 0.7862963080406189, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 1.4306355714797974, + 5.837501049041748, + 7.250905990600586, + 9.502866744995117, + 13.022948265075684 + ], + "hidden_norms_avg": [ + 4.368107795715332, + 8.927281379699707, + 10.20923900604248, + 11.650206565856934, + 12.504077911376953 + ], + "bp_grad_per_sample_l2_med": [ + 7.216054655145854e-05, + 3.7455520214280114e-05, + 3.0207094823708758e-05, + 2.1436455426737666e-05, + 7.401154562103329e-06 + ], + "bp_grad_F": [ + 0.22603340446949005, + 0.11918352544307709, + 0.0947541669011116, + 0.06624340265989304, + 0.02514214999973774 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.8017578125, + "loss_eval": 0.7883187532424927, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 1.4303507804870605, + 5.833686351776123, + 7.24592399597168, + 9.48628044128418, + 12.962425231933594 + ], + "hidden_norms_avg": [ + 4.368690013885498, + 8.926249504089355, + 10.21507453918457, + 11.65561294555664, + 12.507142066955566 + ], + "bp_grad_per_sample_l2_med": [ + 6.914411642355844e-05, + 3.7666370189981535e-05, + 3.0613842682214454e-05, + 2.0578616386046633e-05, + 7.153785645641619e-06 + ], + "bp_grad_F": [ + 0.22665317356586456, + 0.1197197362780571, + 0.09526386857032776, + 0.06651060283184052, + 0.02521701157093048 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.798828125, + "loss_eval": 0.7879265546798706, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 1.430293083190918, + 5.832674026489258, + 7.243373394012451, + 9.484408378601074, + 12.968917846679688 + ], + "hidden_norms_avg": [ + 4.368374347686768, + 8.92542552947998, + 10.214056015014648, + 11.65438175201416, + 12.507084846496582 + ], + "bp_grad_per_sample_l2_med": [ + 6.862521695438772e-05, + 3.740868851309642e-05, + 3.050716986763291e-05, + 2.0533103452180512e-05, + 7.137502961995779e-06 + ], + "bp_grad_F": [ + 0.22697713971138, + 0.11988355964422226, + 0.09540446847677231, + 0.06659507006406784, + 0.025233659893274307 + ], + "gamma_dfa": NaN, + "gamma_dfa_per_layer": [], + "acc_eval": 0.798828125, + "loss_eval": 0.7890625, + "epoch": 60 + } + ], + "dfa_log": [ + { + "hidden_norms_cls": [ + 0.31052109599113464, + 3.2536301612854004, + 4.7681732177734375, + 6.129599571228027, + 7.124356746673584 + ], + "hidden_norms_avg": [ + 6.008513927459717, + 7.034290313720703, + 7.942849636077881, + 8.915729522705078, + 9.635361671447754 + ], + "bp_grad_per_sample_l2_med": [ + 0.004442029166966677, + 0.0012008437188342214, + 0.0009976272704079747, + 0.0009104337659664452, + 0.0008558662957511842 + ], + "bp_grad_F": [ + 0.18535660207271576, + 0.03968670591711998, + 0.032604776322841644, + 0.029427478089928627, + 0.02746850810945034 + ], + "gamma_dfa": 0.003905070887412876, + "gamma_dfa_per_layer": [ + 0.004920602310448885, + 0.005249542184174061, + 0.0038580193649977446, + 0.0015921196900308132 + ], + "acc_eval": 0.1376953125, + "loss_eval": 2.35188627243042, + "epoch": 0 + }, + { + "hidden_norms_cls": [ + 1.969543218612671, + 2409.528564453125, + 2965.8515625, + 5388.57568359375, + 10078.4892578125 + ], + "hidden_norms_avg": [ + 45.02196502685547, + 4042.294189453125, + 10780.892578125, + 14336.607421875, + 18185.720703125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00021220046619419008, + 6.587009124814358e-07, + 6.152115474833408e-07, + 6.009134381201875e-07, + 6.002246095704322e-07 + ], + "bp_grad_F": [ + 0.327708899974823, + 5.584151222137734e-05, + 3.1912604754325e-05, + 2.0850193322985433e-05, + 2.061383202089928e-05 + ], + "gamma_dfa": 0.0062168055737856776, + "gamma_dfa_per_layer": [ + 0.0034891567192971706, + 0.014096655882894993, + 0.008750341832637787, + -0.0014689321396872401 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0569005012512207, + "epoch": 1 + }, + { + "hidden_norms_cls": [ + 4.063174247741699, + 6453.43212890625, + 10849.3359375, + 13374.7021484375, + 36052.8046875 + ], + "hidden_norms_avg": [ + 93.43009185791016, + 12578.36328125, + 48372.984375, + 57469.9609375, + 73801.421875 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015539559535682201, + 2.588524239399703e-07, + 1.9553621655177267e-07, + 1.8433813409046707e-07, + 1.781664309419284e-07 + ], + "bp_grad_F": [ + 0.09239349514245987, + 5.2396142564248294e-05, + 9.398144356964622e-06, + 6.586112704098923e-06, + 6.009819117025472e-06 + ], + "gamma_dfa": 0.009027999331010506, + "gamma_dfa_per_layer": [ + 0.010615326464176178, + 0.014681536704301834, + 0.012467417865991592, + -0.0016522837104275823 + ], + "acc_eval": 0.2236328125, + "loss_eval": 2.0732030868530273, + "epoch": 2 + }, + { + "hidden_norms_cls": [ + 6.139724254608154, + 13514.7626953125, + 22634.615234375, + 30011.625, + 105646.9140625 + ], + "hidden_norms_avg": [ + 140.93157958984375, + 27337.47265625, + 105659.2734375, + 131533.03125, + 178079.78125 + ], + "bp_grad_per_sample_l2_med": [ + 0.00013191952893976122, + 1.5711624712366756e-07, + 6.783211148331247e-08, + 6.273136676782087e-08, + 6.216072989673194e-08 + ], + "bp_grad_F": [ + 0.15658611059188843, + 2.8997201297897846e-05, + 2.6110699309356278e-06, + 2.0865154510829598e-06, + 2.029548568316386e-06 + ], + "gamma_dfa": 0.0068359210272319615, + "gamma_dfa_per_layer": [ + 0.01239929161965847, + 0.008297638036310673, + 0.009697571396827698, + -0.0030508169438689947 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.0859451293945312, + "epoch": 3 + }, + { + "hidden_norms_cls": [ + 8.060498237609863, + 26771.85546875, + 47700.99609375, + 65194.9375, + 243467.953125 + ], + "hidden_norms_avg": [ + 189.60569763183594, + 53537.2734375, + 224677.375, + 271932.0625, + 380665.78125 + ], + "bp_grad_per_sample_l2_med": [ + 6.88996515236795e-05, + 7.635610188572173e-08, + 3.178359264666142e-08, + 2.8310823907418126e-08, + 2.8113991135114702e-08 + ], + "bp_grad_F": [ + 0.18565885722637177, + 2.3117625460145064e-05, + 1.2200183618915617e-06, + 1.0046638863059343e-06, + 9.67514324656804e-07 + ], + "gamma_dfa": 0.00588334770873189, + "gamma_dfa_per_layer": [ + 0.012929551303386688, + 0.005936518311500549, + 0.009927853010594845, + -0.0052605317905545235 + ], + "acc_eval": 0.216796875, + "loss_eval": 2.1008124351501465, + "epoch": 4 + }, + { + "hidden_norms_cls": [ + 9.924980163574219, + 45836.29296875, + 86015.5546875, + 115240.734375, + 396649.5625 + ], + "hidden_norms_avg": [ + 236.08885192871094, + 94806.203125, + 447709.03125, + 539570.125, + 680795.4375 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014524323341902345, + 3.066869780354864e-08, + 1.9569522891060842e-08, + 1.7725259482404e-08, + 1.7704602228718613e-08 + ], + "bp_grad_F": [ + 0.21425659954547882, + 1.3653657333634328e-05, + 6.662682494606997e-07, + 5.818570798510336e-07, + 5.813048460368009e-07 + ], + "gamma_dfa": 0.006635856116190553, + "gamma_dfa_per_layer": [ + 0.010879420675337315, + 0.013957185670733452, + 0.00779206957668066, + -0.006085251457989216 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.1039814949035645, + "epoch": 5 + }, + { + "hidden_norms_cls": [ + 11.746355056762695, + 70552.8046875, + 256103.15625, + 694951.625, + 808366.5625 + ], + "hidden_norms_avg": [ + 279.4807434082031, + 128343.046875, + 645095.375, + 810123.8125, + 959871.0 + ], + "bp_grad_per_sample_l2_med": [ + 6.159865733934566e-05, + 2.1975946395969004e-08, + 1.1060357074654803e-08, + 9.967390468546e-09, + 1.011228256686536e-08 + ], + "bp_grad_F": [ + 0.09021499752998352, + 5.0024723350361455e-06, + 4.539916176327097e-07, + 3.891582309734076e-07, + 3.9641980720261927e-07 + ], + "gamma_dfa": 0.003665695490781218, + "gamma_dfa_per_layer": [ + 0.009222292341291904, + 0.0031545532401651144, + 0.00775552075356245, + -0.005469584371894598 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.1214356422424316, + "epoch": 6 + }, + { + "hidden_norms_cls": [ + 13.500020980834961, + 102720.734375, + 194937.703125, + 291956.1875, + 801362.9375 + ], + "hidden_norms_avg": [ + 321.6004943847656, + 208601.421875, + 1002364.1875, + 1189027.25, + 1448220.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.00014696457947138697, + 1.642234792598174e-08, + 8.907985460382406e-09, + 8.127726935924784e-09, + 8.014287011803845e-09 + ], + "bp_grad_F": [ + 0.06841801106929779, + 4.044012712256517e-06, + 3.4213746857858496e-07, + 2.990170742123155e-07, + 2.988945198012516e-07 + ], + "gamma_dfa": 0.004651258233934641, + "gamma_dfa_per_layer": [ + 0.007132797501981258, + 0.010231958702206612, + 0.006907162256538868, + -0.0056668855249881744 + ], + "acc_eval": 0.2099609375, + "loss_eval": 2.0963404178619385, + "epoch": 7 + }, + { + "hidden_norms_cls": [ + 15.302024841308594, + 160872.96875, + 604043.4375, + 1296474.125, + 1546227.0 + ], + "hidden_norms_avg": [ + 359.47259521484375, + 298263.5, + 1317573.75, + 1553171.25, + 1878602.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000136460512294434, + 1.0422226637274434e-08, + 5.898865396147812e-09, + 5.4856741371622775e-09, + 5.4926698744850455e-09 + ], + "bp_grad_F": [ + 0.07932842522859573, + 2.1081664272060152e-06, + 2.560300345066935e-07, + 2.2075181504987995e-07, + 2.2043255398784822e-07 + ], + "gamma_dfa": 0.004627774120308459, + "gamma_dfa_per_layer": [ + 0.006024104077368975, + 0.01116865873336792, + 0.005747191607952118, + -0.004428857937455177 + ], + "acc_eval": 0.220703125, + "loss_eval": 2.0744481086730957, + "epoch": 8 + }, + { + "hidden_norms_cls": [ + 17.009462356567383, + 204948.671875, + 405065.21875, + 549855.3125, + 1400973.875 + ], + "hidden_norms_avg": [ + 396.66558837890625, + 480022.3125, + 2019487.75, + 2350966.75, + 2708745.25 + ], + "bp_grad_per_sample_l2_med": [ + 0.00026586122112348676, + 1.0135083883255902e-08, + 6.120911777429683e-09, + 5.8359819199438334e-09, + 5.662275093243352e-09 + ], + "bp_grad_F": [ + 0.37594228982925415, + 1.2430107744876295e-05, + 2.3164905371686473e-07, + 2.0265188993562333e-07, + 2.001279000296563e-07 + ], + "gamma_dfa": 0.004862090456299484, + "gamma_dfa_per_layer": [ + 0.006278482731431723, + 0.012495312839746475, + 0.005351733416318893, + -0.004677167162299156 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0641043186187744, + "epoch": 9 + }, + { + "hidden_norms_cls": [ + 18.669273376464844, + 316404.0625, + 619048.375, + 804163.5, + 1798441.0 + ], + "hidden_norms_avg": [ + 434.9389343261719, + 650998.25, + 2437815.25, + 2802479.0, + 3269810.75 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003605277743190527, + 6.009571951182124e-09, + 4.676837139783174e-09, + 4.657723096102018e-09, + 4.49635484400801e-09 + ], + "bp_grad_F": [ + 0.14846132695674896, + 4.3979816837236285e-06, + 1.7215310776919068e-07, + 1.581869213396203e-07, + 1.561998885790672e-07 + ], + "gamma_dfa": 0.004480502451770008, + "gamma_dfa_per_layer": [ + 0.006086423061788082, + 0.010957473888993263, + 0.004586817231029272, + -0.003708704374730587 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0591208934783936, + "epoch": 10 + }, + { + "hidden_norms_cls": [ + 20.326766967773438, + 443508.46875, + 899668.0625, + 1131299.375, + 2182177.5 + ], + "hidden_norms_avg": [ + 473.4957275390625, + 854388.9375, + 2926402.0, + 3295286.75, + 3825241.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005711699486710131, + 4.8561932253221585e-09, + 3.871160725310574e-09, + 3.833432238309342e-09, + 3.74674646863582e-09 + ], + "bp_grad_F": [ + 1.0882306098937988, + 3.257442813264788e-06, + 1.6311048511852277e-07, + 1.3397652764979284e-07, + 1.326638283671855e-07 + ], + "gamma_dfa": 0.00462920154677704, + "gamma_dfa_per_layer": [ + 0.008616073988378048, + 0.009468363597989082, + 0.003528183326125145, + -0.003095814725384116 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0471031665802, + "epoch": 11 + }, + { + "hidden_norms_cls": [ + 21.944751739501953, + 581616.1875, + 1205317.625, + 1456984.375, + 2587496.75 + ], + "hidden_norms_avg": [ + 511.203125, + 1119566.25, + 3562080.25, + 3992681.5, + 4538977.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009346234728582203, + 4.117307383921798e-09, + 3.257990321969828e-09, + 3.2349201095627222e-09, + 3.1638915931608835e-09 + ], + "bp_grad_F": [ + 0.42184242606163025, + 2.2249487301451154e-06, + 1.2586481545895367e-07, + 1.1919513553948491e-07, + 1.181974553787768e-07 + ], + "gamma_dfa": 0.0034259117674082518, + "gamma_dfa_per_layer": [ + 0.00526365265250206, + 0.008116653189063072, + 0.0030386103317141533, + -0.0027152691036462784 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.0867815017700195, + "epoch": 12 + }, + { + "hidden_norms_cls": [ + 23.46192741394043, + 733909.875, + 1508464.125, + 1841074.875, + 3055228.75 + ], + "hidden_norms_avg": [ + 546.8953247070312, + 1235037.0, + 3742642.75, + 4200378.0, + 4892382.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009773626225069165, + 3.5754739169391314e-09, + 2.9525657474493983e-09, + 2.9297144710227485e-09, + 2.8955173814182444e-09 + ], + "bp_grad_F": [ + 0.15538839995861053, + 2.0067516288690967e-06, + 1.1871279781416888e-07, + 1.046255491132797e-07, + 1.0416235340926505e-07 + ], + "gamma_dfa": 0.002340688748518005, + "gamma_dfa_per_layer": [ + 0.0019294173689559102, + 0.007100729271769524, + 0.0026949853636324406, + -0.0023623770102858543 + ], + "acc_eval": 0.232421875, + "loss_eval": 2.088564872741699, + "epoch": 13 + }, + { + "hidden_norms_cls": [ + 24.94734764099121, + 1151802.75, + 3671404.25, + 4625593.5, + 5052590.0 + ], + "hidden_norms_avg": [ + 582.0977172851562, + 1475600.75, + 4403784.0, + 5008330.0, + 5801902.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007562927203252912, + 2.676908916754428e-09, + 2.2055020032496486e-09, + 2.179777247590664e-09, + 2.173634161550808e-09 + ], + "bp_grad_F": [ + 0.36642539501190186, + 3.967601060139714e-06, + 8.444904864290947e-08, + 7.993684647544796e-08, + 7.900475651467787e-08 + ], + "gamma_dfa": 0.0017957038653548807, + "gamma_dfa_per_layer": [ + 0.0019046596717089415, + 0.005139546003192663, + 0.001759346341714263, + -0.0016207365551963449 + ], + "acc_eval": 0.2109375, + "loss_eval": 2.08038330078125, + "epoch": 14 + }, + { + "hidden_norms_cls": [ + 26.36701011657715, + 2210167.25, + 6804633.5, + 7592304.0, + 7772230.0 + ], + "hidden_norms_avg": [ + 615.4749145507812, + 1852637.875, + 5297662.0, + 6054509.0, + 6940769.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.0009053644607774913, + 2.014937106054049e-09, + 1.6813730407960747e-09, + 1.63718916201816e-09, + 1.6135126568173064e-09 + ], + "bp_grad_F": [ + 0.15154746174812317, + 3.760401341423858e-06, + 6.479213254806382e-08, + 6.350511227992683e-08, + 6.00040195308793e-08 + ], + "gamma_dfa": 0.00026495405472815037, + "gamma_dfa_per_layer": [ + -0.0023696955759078264, + 0.0033954931423068047, + 0.0012687842827290297, + -0.0012347656302154064 + ], + "acc_eval": 0.2333984375, + "loss_eval": 2.0685791969299316, + "epoch": 15 + }, + { + "hidden_norms_cls": [ + 27.747814178466797, + 2020373.25, + 6352088.0, + 7372759.0, + 7751557.0 + ], + "hidden_norms_avg": [ + 647.8715209960938, + 2166255.0, + 5964871.0, + 6820316.0, + 7888183.5 + ], + "bp_grad_per_sample_l2_med": [ + 0.000535959261469543, + 1.8833379300531305e-09, + 1.6251041623505103e-09, + 1.5936774122593533e-09, + 1.5920619267362213e-09 + ], + "bp_grad_F": [ + 0.06977186352014542, + 4.2289293560315855e-06, + 5.94431135425566e-08, + 5.634814925770115e-08, + 5.626874255426628e-08 + ], + "gamma_dfa": 0.0009004889943753369, + "gamma_dfa_per_layer": [ + 1.3074517482891679e-05, + 0.003544538514688611, + 0.0012792267370969057, + -0.0012348837917670608 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0676896572113037, + "epoch": 16 + }, + { + "hidden_norms_cls": [ + 29.053590774536133, + 3083884.0, + 8692576.0, + 10024582.0, + 10278143.0 + ], + "hidden_norms_avg": [ + 679.1322021484375, + 2750560.0, + 7205648.0, + 8204248.5, + 9336888.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006835769745521247, + 1.5781399520520267e-09, + 1.3378861352109084e-09, + 1.2995797771253592e-09, + 1.2820219330578198e-09 + ], + "bp_grad_F": [ + 0.25767308473587036, + 1.6246455061263987e-06, + 6.349461756371966e-08, + 6.242527206268278e-08, + 4.5665522918625356e-08 + ], + "gamma_dfa": 0.0003357882087584585, + "gamma_dfa_per_layer": [ + -0.001319598057307303, + 0.002733789850026369, + 0.0008947808528319001, + -0.0009658198105171323 + ], + "acc_eval": 0.23046875, + "loss_eval": 2.0777204036712646, + "epoch": 17 + }, + { + "hidden_norms_cls": [ + 30.246440887451172, + 3200014.0, + 8626485.0, + 9743865.0, + 10146681.0 + ], + "hidden_norms_avg": [ + 708.5135498046875, + 2989787.0, + 7458187.5, + 8607358.0, + 10070516.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005841738311573863, + 1.4247033552905464e-09, + 1.2406603522308046e-09, + 1.21434362565509e-09, + 1.217411615961339e-09 + ], + "bp_grad_F": [ + 0.08999939262866974, + 1.7538721976961824e-06, + 4.803559150445835e-08, + 4.36282370230856e-08, + 4.3068951072200434e-08 + ], + "gamma_dfa": -2.2506676032207906e-05, + "gamma_dfa_per_layer": [ + -0.002581980312243104, + 0.002518225461244583, + 0.0009317069780081511, + -0.0009579788311384618 + ], + "acc_eval": 0.2392578125, + "loss_eval": 2.0627658367156982, + "epoch": 18 + }, + { + "hidden_norms_cls": [ + 31.42615509033203, + 4556513.5, + 10711725.0, + 11956874.0, + 12318100.0 + ], + "hidden_norms_avg": [ + 737.157958984375, + 3520006.5, + 8303534.5, + 9571905.0, + 11293369.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007374613196589053, + 1.2111865954622658e-09, + 1.0633514069269268e-09, + 1.0194807220642588e-09, + 1.0034837405470398e-09 + ], + "bp_grad_F": [ + 0.12247106432914734, + 2.740941681622644e-06, + 4.6019909660799385e-08, + 4.372383344275477e-08, + 3.6865596797497346e-08 + ], + "gamma_dfa": 0.0005736843086197041, + "gamma_dfa_per_layer": [ + 0.0002251334663014859, + 0.0021776340436190367, + 0.0006795942317694426, + -0.0007876245072111487 + ], + "acc_eval": 0.22265625, + "loss_eval": 2.062939167022705, + "epoch": 19 + }, + { + "hidden_norms_cls": [ + 32.559165954589844, + 4224958.5, + 10227904.0, + 11507743.0, + 12041642.0 + ], + "hidden_norms_avg": [ + 765.5013427734375, + 3988012.5, + 8953060.0, + 10431809.0, + 12380471.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006474430556409061, + 1.179957687114097e-09, + 1.0031043773395254e-09, + 9.744786089171953e-10, + 9.782840093564005e-10 + ], + "bp_grad_F": [ + 0.12209221720695496, + 1.616509621271689e-06, + 3.8821241332698264e-08, + 3.6648025059093925e-08, + 3.527756931021031e-08 + ], + "gamma_dfa": -0.00019280995184089988, + "gamma_dfa_per_layer": [ + -0.002911232877522707, + 0.0022857212461531162, + 0.0006594176520593464, + -0.0008051458280533552 + ], + "acc_eval": 0.240234375, + "loss_eval": 2.0555338859558105, + "epoch": 20 + }, + { + "hidden_norms_cls": [ + 33.59370040893555, + 5323277.5, + 11855673.0, + 13697022.0, + 14246667.0 + ], + "hidden_norms_avg": [ + 789.9629516601562, + 4634178.0, + 10205192.0, + 11930021.0, + 13993152.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006352875498123467, + 1.0036302899862903e-09, + 8.794808215029093e-10, + 8.579849608558732e-10, + 8.574586596310496e-10 + ], + "bp_grad_F": [ + 0.09745635837316513, + 5.127232043378172e-07, + 3.342180221466151e-08, + 3.173540363832217e-08, + 3.091372491326183e-08 + ], + "gamma_dfa": -0.0006959605379961431, + "gamma_dfa_per_layer": [ + -0.004454955458641052, + 0.0018251645378768444, + 0.0005447655566968024, + -0.000698816787917167 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.056840181350708, + "epoch": 21 + }, + { + "hidden_norms_cls": [ + 34.583858489990234, + 6778143.0, + 13401385.0, + 15847366.0, + 16344266.0 + ], + "hidden_norms_avg": [ + 814.3038330078125, + 5395352.5, + 11137891.0, + 13094203.0, + 15406614.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0006492820102721453, + 8.925201688825268e-10, + 7.777718469270667e-10, + 7.627384279729199e-10, + 7.601627105557895e-10 + ], + "bp_grad_F": [ + 0.08801906555891037, + 1.8660392697711359e-06, + 3.472371190582635e-08, + 2.7845679539950652e-08, + 2.7135749647300145e-08 + ], + "gamma_dfa": -0.0012016263353871182, + "gamma_dfa_per_layer": [ + -0.006280785892158747, + 0.001651690574362874, + 0.0004266214673407376, + -0.0006040314910933375 + ], + "acc_eval": 0.2255859375, + "loss_eval": 2.0746021270751953, + "epoch": 22 + }, + { + "hidden_norms_cls": [ + 35.516666412353516, + 6985935.5, + 14020116.0, + 16575473.0, + 17109272.0 + ], + "hidden_norms_avg": [ + 838.5614013671875, + 6365095.0, + 12448551.0, + 14566203.0, + 16943832.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0007437304593622684, + 8.387662786546457e-10, + 7.299132409599451e-10, + 7.170505300635455e-10, + 7.115786293532267e-10 + ], + "bp_grad_F": [ + 0.1540054827928543, + 1.4262270724429982e-06, + 2.9031822279534936e-08, + 2.776059560005706e-08, + 2.5270722403547552e-08 + ], + "gamma_dfa": -0.00010950746218441054, + "gamma_dfa_per_layer": [ + -0.0017721566837280989, + 0.0015054477844387293, + 0.0003872170636896044, + -0.000558538013137877 + ], + "acc_eval": 0.2392578125, + "loss_eval": 2.065904140472412, + "epoch": 23 + }, + { + "hidden_norms_cls": [ + 36.39850997924805, + 7861434.0, + 14415042.0, + 16660478.0, + 17496562.0 + ], + "hidden_norms_avg": [ + 862.4805297851562, + 6600421.5, + 12694272.0, + 15043836.0, + 17968980.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005834798794239759, + 7.558619286029966e-10, + 6.530426754913776e-10, + 6.420492471015393e-10, + 6.389526685524061e-10 + ], + "bp_grad_F": [ + 0.09943251311779022, + 1.4788431599299656e-06, + 2.582997993272329e-08, + 2.3754548550414256e-08, + 2.322415859623561e-08 + ], + "gamma_dfa": -0.0009345750440843403, + "gamma_dfa_per_layer": [ + -0.005123761482536793, + 0.0015550897223874927, + 0.0003447675844654441, + -0.0005143960006535053 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.041043758392334, + "epoch": 24 + }, + { + "hidden_norms_cls": [ + 37.283199310302734, + 8933519.0, + 15359962.0, + 17441364.0, + 18346258.0 + ], + "hidden_norms_avg": [ + 883.0538330078125, + 7354756.0, + 13721222.0, + 16105006.0, + 19368310.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00026283934130333364, + 6.873029922971341e-10, + 6.058342161274766e-10, + 6.000055452481945e-10, + 5.98545990548871e-10 + ], + "bp_grad_F": [ + 0.11474847048521042, + 2.4628958271932788e-05, + 1.3788282160476228e-07, + 2.199209525599599e-08, + 2.15279509774291e-08 + ], + "gamma_dfa": -0.0014451614988502115, + "gamma_dfa_per_layer": [ + -0.006978219375014305, + 0.0013526652473956347, + 0.0002992081572301686, + -0.0004543000250123441 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.0492172241210938, + "epoch": 25 + }, + { + "hidden_norms_cls": [ + 38.11500930786133, + 10836846.0, + 17507178.0, + 19929002.0, + 20726542.0 + ], + "hidden_norms_avg": [ + 901.960205078125, + 8138403.5, + 14552406.0, + 17157852.0, + 20773122.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005291851703077555, + 6.35470620569123e-10, + 5.6208532273061e-10, + 5.496996191567405e-10, + 5.433966054901873e-10 + ], + "bp_grad_F": [ + 0.07972504198551178, + 1.2489309710872476e-06, + 2.2593511062041216e-08, + 2.1460177634935462e-08, + 1.941634231172884e-08 + ], + "gamma_dfa": -0.000788729106716346, + "gamma_dfa_per_layer": [ + -0.00451657734811306, + 0.0015372345224022865, + 0.00024382121046073735, + -0.00041939481161534786 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0669429302215576, + "epoch": 26 + }, + { + "hidden_norms_cls": [ + 38.87166213989258, + 11480826.0, + 18077316.0, + 20884150.0, + 22098916.0 + ], + "hidden_norms_avg": [ + 920.577880859375, + 8893063.0, + 15579717.0, + 18401958.0, + 22225722.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005104477168060839, + 5.858571405781277e-10, + 5.198571018105724e-10, + 5.114682011253535e-10, + 5.120092128052534e-10 + ], + "bp_grad_F": [ + 0.13577552139759064, + 2.0482397303567268e-05, + 2.1394010119024642e-08, + 2.0649670418038113e-08, + 1.8286096192809964e-08 + ], + "gamma_dfa": -0.0004262418224243447, + "gamma_dfa_per_layer": [ + -0.0029134145006537437, + 0.0013950758147984743, + 0.00018188939429819584, + -0.0003685179981403053 + ], + "acc_eval": 0.2490234375, + "loss_eval": 2.053382396697998, + "epoch": 27 + }, + { + "hidden_norms_cls": [ + 39.6179313659668, + 10591964.0, + 16346992.0, + 18847678.0, + 21847726.0 + ], + "hidden_norms_avg": [ + 937.9719848632812, + 9576851.0, + 16784906.0, + 19828342.0, + 23673520.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00023470228188671172, + 5.629120503058971e-10, + 5.04818964408571e-10, + 4.974847200855947e-10, + 4.968530586957343e-10 + ], + "bp_grad_F": [ + 0.03459252789616585, + 8.028884622035548e-06, + 1.9716548393944322e-08, + 1.807922522800709e-08, + 1.7913645677936074e-08 + ], + "gamma_dfa": -0.0018089709192281589, + "gamma_dfa_per_layer": [ + -0.008484212681651115, + 0.0014374498277902603, + 0.00020184949971735477, + -0.00039097032276913524 + ], + "acc_eval": 0.224609375, + "loss_eval": 2.0604443550109863, + "epoch": 28 + }, + { + "hidden_norms_cls": [ + 40.344242095947266, + 10467030.0, + 15235544.0, + 17027748.0, + 23281082.0 + ], + "hidden_norms_avg": [ + 954.3844604492188, + 10038487.0, + 16584430.0, + 19613710.0, + 24505476.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00015729073493275791, + 5.36418076624301e-10, + 4.5378717450361705e-10, + 4.4796202858243817e-10, + 4.477457571372412e-10 + ], + "bp_grad_F": [ + 0.04820869117975235, + 2.3596087430632906e-06, + 1.7855482425943592e-08, + 1.7340139990551506e-08, + 1.672622929049794e-08 + ], + "gamma_dfa": -0.0013171448226785287, + "gamma_dfa_per_layer": [ + -0.006438364274799824, + 0.0013229507021605968, + 0.00020032597240060568, + -0.00035349169047549367 + ], + "acc_eval": 0.236328125, + "loss_eval": 2.061581611633301, + "epoch": 29 + }, + { + "hidden_norms_cls": [ + 41.04903793334961, + 12235056.0, + 17721728.0, + 19784938.0, + 25024272.0 + ], + "hidden_norms_avg": [ + 969.5825805664062, + 11940616.0, + 19401350.0, + 22468846.0, + 26879212.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00035265026963315904, + 5.423251847602728e-10, + 4.4247547292819434e-10, + 4.358849947649901e-10, + 4.3593659238005955e-10 + ], + "bp_grad_F": [ + 0.0735621377825737, + 1.917086819958058e-06, + 1.9346130031294706e-08, + 1.5936171493535767e-08, + 1.5501758099389917e-08 + ], + "gamma_dfa": -0.001081134716514498, + "gamma_dfa_per_layer": [ + -0.005434883758425713, + 0.0012318368535488844, + 0.00019993717432953417, + -0.00032142913551069796 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0760293006896973, + "epoch": 30 + }, + { + "hidden_norms_cls": [ + 41.723567962646484, + 10562926.0, + 13746881.0, + 15736975.0, + 26354068.0 + ], + "hidden_norms_avg": [ + 984.3485717773438, + 12533570.0, + 19717132.0, + 22961588.0, + 28083302.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0002546848263591528, + 4.777176432213537e-10, + 4.0483683072523036e-10, + 4.0072575813177025e-10, + 4.013349652609577e-10 + ], + "bp_grad_F": [ + 0.06879052519798279, + 1.7057992636182462e-06, + 1.6271217262442406e-08, + 1.4877675091895526e-08, + 1.484982270483215e-08 + ], + "gamma_dfa": -0.0015064112594700418, + "gamma_dfa_per_layer": [ + -0.007336798589676619, + 0.0013772943057119846, + 0.00022022609482519329, + -0.0002863668487407267 + ], + "acc_eval": 0.20703125, + "loss_eval": 2.078207492828369, + "epoch": 31 + }, + { + "hidden_norms_cls": [ + 42.342227935791016, + 13283171.0, + 17422292.0, + 19770980.0, + 28086972.0 + ], + "hidden_norms_avg": [ + 999.26123046875, + 13875387.0, + 21404830.0, + 24833206.0, + 29923332.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0003442879824433476, + 4.4142753341525065e-10, + 3.8908712363117104e-10, + 3.845144203040718e-10, + 3.8369810106964053e-10 + ], + "bp_grad_F": [ + 0.10482411086559296, + 2.8695783385046525e-06, + 1.7273855235089286e-08, + 1.4195452813225984e-08, + 1.3857171410336377e-08 + ], + "gamma_dfa": -0.0009248298447346315, + "gamma_dfa_per_layer": [ + -0.004888010676950216, + 0.0012753453338518739, + 0.00017224671319127083, + -0.0002589007490314543 + ], + "acc_eval": 0.2373046875, + "loss_eval": 2.078000068664551, + "epoch": 32 + }, + { + "hidden_norms_cls": [ + 42.90097427368164, + 16870614.0, + 22116480.0, + 24442270.0, + 29665536.0 + ], + "hidden_norms_avg": [ + 1013.56396484375, + 14764026.0, + 21856036.0, + 25334308.0, + 30474444.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047380090109072626, + 4.22005735911668e-10, + 3.5831293487831317e-10, + 3.5505443030103834e-10, + 3.5614466931122024e-10 + ], + "bp_grad_F": [ + 0.1035437062382698, + 1.2711110457530594e-06, + 1.418432571398398e-08, + 1.2978671470875724e-08, + 1.2937439564097986e-08 + ], + "gamma_dfa": -0.00034118785697501153, + "gamma_dfa_per_layer": [ + -0.002568737603724003, + 0.001293556997552514, + 0.000137164635816589, + -0.00022673545754514635 + ], + "acc_eval": 0.2265625, + "loss_eval": 2.0730109214782715, + "epoch": 33 + }, + { + "hidden_norms_cls": [ + 43.419898986816406, + 18221210.0, + 22675590.0, + 24728546.0, + 30520888.0 + ], + "hidden_norms_avg": [ + 1027.6595458984375, + 16337822.0, + 23378412.0, + 26921720.0, + 31927994.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004629126051440835, + 4.106864293085266e-10, + 3.557905081663648e-10, + 3.536362591649578e-10, + 3.5421768296295397e-10 + ], + "bp_grad_F": [ + 0.08281872421503067, + 1.4263683851822861e-06, + 1.3245164076636229e-08, + 1.2740572152836194e-08, + 1.2752362721357713e-08 + ], + "gamma_dfa": -0.0006677984529233072, + "gamma_dfa_per_layer": [ + -0.0036979843862354755, + 0.0011370242573320866, + 0.00012192466238047928, + -0.00023215834517031908 + ], + "acc_eval": 0.23828125, + "loss_eval": 2.0669164657592773, + "epoch": 34 + }, + { + "hidden_norms_cls": [ + 43.868682861328125, + 18758150.0, + 23109030.0, + 25432404.0, + 31503354.0 + ], + "hidden_norms_avg": [ + 1040.644287109375, + 15512033.0, + 21965288.0, + 25882228.0, + 31813648.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00048007385339587927, + 4.271450415593847e-10, + 3.4119135294830016e-10, + 3.391489034054729e-10, + 3.387232438978316e-10 + ], + "bp_grad_F": [ + 0.36019906401634216, + 1.9220671674702317e-05, + 1.358929768713324e-08, + 1.2455363851415768e-08, + 1.2401786264604198e-08 + ], + "gamma_dfa": -0.00031488661625189707, + "gamma_dfa_per_layer": [ + -0.002551896497607231, + 0.001431336859241128, + 9.301750105805695e-05, + -0.00023200432769954205 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0609660148620605, + "epoch": 35 + }, + { + "hidden_norms_cls": [ + 44.293697357177734, + 21659484.0, + 26491946.0, + 29332332.0, + 32793040.0 + ], + "hidden_norms_avg": [ + 1051.83740234375, + 17567000.0, + 24049368.0, + 28083622.0, + 33467380.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043948061647824943, + 4.0486294872188466e-10, + 3.3493480211532756e-10, + 3.3453453895937457e-10, + 3.3604671823006527e-10 + ], + "bp_grad_F": [ + 0.10878865420818329, + 3.037727083210484e-06, + 1.2592222375928941e-08, + 1.2103843261002112e-08, + 1.2022392859023512e-08 + ], + "gamma_dfa": -0.00015630935013177805, + "gamma_dfa_per_layer": [ + -0.0019119374919682741, + 0.0014281735057011247, + 7.57485831854865e-05, + -0.00021722199744544923 + ], + "acc_eval": 0.2431640625, + "loss_eval": 2.0587897300720215, + "epoch": 36 + }, + { + "hidden_norms_cls": [ + 44.68658447265625, + 21628572.0, + 26077032.0, + 28336790.0, + 33305650.0 + ], + "hidden_norms_avg": [ + 1062.067138671875, + 18163602.0, + 24404446.0, + 28478594.0, + 34156064.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005865619168616831, + 4.0249623078914e-10, + 3.3121710929506776e-10, + 3.310392793220984e-10, + 3.318675056984688e-10 + ], + "bp_grad_F": [ + 0.20061102509498596, + 1.4544431223839638e-06, + 1.3441372459510603e-08, + 1.2418687411752671e-08, + 1.2016870165609816e-08 + ], + "gamma_dfa": -0.00039686575473751873, + "gamma_dfa_per_layer": [ + -0.0029668076895177364, + 0.0015295962803065777, + 6.985102663747966e-05, + -0.00022010263637639582 + ], + "acc_eval": 0.2275390625, + "loss_eval": 2.0569839477539062, + "epoch": 37 + }, + { + "hidden_norms_cls": [ + 45.062259674072266, + 25376026.0, + 30203382.0, + 32772746.0, + 35119040.0 + ], + "hidden_norms_avg": [ + 1071.6630859375, + 18637428.0, + 24671676.0, + 28819074.0, + 34739232.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005594053072854877, + 3.9023292930373543e-10, + 3.2509483993692356e-10, + 3.23913590394298e-10, + 3.250162639023557e-10 + ], + "bp_grad_F": [ + 0.13359014689922333, + 4.247889592079446e-06, + 1.4051211749688264e-08, + 1.2317144637563615e-08, + 1.1531787968976914e-08 + ], + "gamma_dfa": -0.0005283378432068275, + "gamma_dfa_per_layer": [ + -0.0037097278982400894, + 0.0017695487476885319, + 4.308431380195543e-05, + -0.000216256536077708 + ], + "acc_eval": 0.2666015625, + "loss_eval": 2.0476396083831787, + "epoch": 38 + }, + { + "hidden_norms_cls": [ + 45.38731384277344, + 24903830.0, + 30026926.0, + 33563200.0, + 35539932.0 + ], + "hidden_norms_avg": [ + 1080.0860595703125, + 20496828.0, + 26709690.0, + 30932660.0, + 36357072.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005004233680665493, + 3.8017103354270887e-10, + 3.1730867933177365e-10, + 3.167333340048373e-10, + 3.1768215835725755e-10 + ], + "bp_grad_F": [ + 0.24717594683170319, + 2.9436714612529613e-06, + 1.1934382371237007e-08, + 1.1459838411553847e-08, + 1.1365100860416533e-08 + ], + "gamma_dfa": -0.00022031009211787023, + "gamma_dfa_per_layer": [ + -0.0022991469595581293, + 0.0015725505072623491, + 4.821528273168951e-05, + -0.00020285919890739024 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0488319396972656, + "epoch": 39 + }, + { + "hidden_norms_cls": [ + 45.68830490112305, + 27470426.0, + 32688434.0, + 35418348.0, + 37778420.0 + ], + "hidden_norms_avg": [ + 1088.195068359375, + 19636778.0, + 25748976.0, + 30137794.0, + 36341748.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000507087679579854, + 3.7039282752004965e-10, + 3.106248036566228e-10, + 3.096240208666501e-10, + 3.10577202844442e-10 + ], + "bp_grad_F": [ + 0.247142493724823, + 5.3006801863375586e-06, + 1.5794508811950436e-08, + 1.5706817180216603e-08, + 1.0953104201405495e-08 + ], + "gamma_dfa": -0.00026929086834570626, + "gamma_dfa_per_layer": [ + -0.0025479549076408148, + 0.0016400209860876203, + 2.4549921363359317e-05, + -0.00019377947319298983 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0380632877349854, + "epoch": 40 + }, + { + "hidden_norms_cls": [ + 45.95172119140625, + 29219790.0, + 34751968.0, + 37645720.0, + 39363420.0 + ], + "hidden_norms_avg": [ + 1095.55908203125, + 20059094.0, + 26161532.0, + 30539128.0, + 36948852.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004415555449668318, + 3.578430884942918e-10, + 3.05192260352527e-10, + 3.046965735276075e-10, + 3.0560776131949297e-10 + ], + "bp_grad_F": [ + 0.1088763028383255, + 4.900910880678566e-06, + 1.1387745857405207e-08, + 1.0883239198733463e-08, + 1.0722531307294503e-08 + ], + "gamma_dfa": -0.0006201292017067317, + "gamma_dfa_per_layer": [ + -0.004000760614871979, + 0.0016785510815680027, + 3.265401755925268e-05, + -0.0001909612910822034 + ], + "acc_eval": 0.25, + "loss_eval": 2.041342258453369, + "epoch": 41 + }, + { + "hidden_norms_cls": [ + 46.1973876953125, + 29375584.0, + 34745100.0, + 38109944.0, + 40454424.0 + ], + "hidden_norms_avg": [ + 1102.340087890625, + 21066706.0, + 27296236.0, + 31874516.0, + 38108092.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00040148120024241507, + 3.579030682931972e-10, + 3.0047467292071417e-10, + 2.979275159908923e-10, + 2.9703536852387913e-10 + ], + "bp_grad_F": [ + 0.2525903582572937, + 8.925781003199518e-06, + 1.1219404072448924e-08, + 1.084880185686643e-08, + 1.0492501978376367e-08 + ], + "gamma_dfa": -0.00034770679030771134, + "gamma_dfa_per_layer": [ + -0.002933461917564273, + 0.001698363572359085, + 3.748677045223303e-05, + -0.0001932155864778906 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.0345935821533203, + "epoch": 42 + }, + { + "hidden_norms_cls": [ + 46.42340087890625, + 27399134.0, + 31821602.0, + 34474508.0, + 38109560.0 + ], + "hidden_norms_avg": [ + 1108.236328125, + 21543940.0, + 27684760.0, + 32082502.0, + 38718660.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000570801377762109, + 3.5802838471710174e-10, + 2.990230563160168e-10, + 2.9852947891484405e-10, + 2.9978877713610075e-10 + ], + "bp_grad_F": [ + 0.173945352435112, + 2.9223572255432373e-06, + 1.2221713419080515e-08, + 1.1539666999738074e-08, + 1.0805790928714032e-08 + ], + "gamma_dfa": -5.9806044191645924e-05, + "gamma_dfa_per_layer": [ + -0.001857165014371276, + 0.0017762510105967522, + 3.49261645169463e-05, + -0.00019323633750900626 + ], + "acc_eval": 0.2412109375, + "loss_eval": 2.043308734893799, + "epoch": 43 + }, + { + "hidden_norms_cls": [ + 46.619728088378906, + 31052948.0, + 36542220.0, + 39935176.0, + 42316204.0 + ], + "hidden_norms_avg": [ + 1113.68896484375, + 22679808.0, + 29079456.0, + 33751472.0, + 40006012.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046165595995262265, + 3.339039600369631e-10, + 2.9132621315319795e-10, + 2.9080904351275194e-10, + 2.9134980539247124e-10 + ], + "bp_grad_F": [ + 0.08871550858020782, + 1.195927779917838e-05, + 1.2490571243972681e-08, + 1.2371740965022582e-08, + 1.015614703447909e-08 + ], + "gamma_dfa": -0.0003672020420708577, + "gamma_dfa_per_layer": [ + -0.002894133096560836, + 0.0016025153454393148, + 2.5333010853501037e-05, + -0.0002025234280154109 + ], + "acc_eval": 0.244140625, + "loss_eval": 2.029773473739624, + "epoch": 44 + }, + { + "hidden_norms_cls": [ + 46.796348571777344, + 30912490.0, + 36281496.0, + 39245376.0, + 41656108.0 + ], + "hidden_norms_avg": [ + 1118.38134765625, + 23560890.0, + 29646840.0, + 34192144.0, + 40581760.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005251869442872703, + 3.3097524720915317e-10, + 2.891357153700369e-10, + 2.8932781170887267e-10, + 2.8904145743524623e-10 + ], + "bp_grad_F": [ + 0.09888254106044769, + 4.3903874029638246e-06, + 1.0815308648659538e-08, + 1.040402519691952e-08, + 1.0228043301196976e-08 + ], + "gamma_dfa": -0.00037046667421236634, + "gamma_dfa_per_layer": [ + -0.002757731592282653, + 0.0014231146778911352, + 3.9225356886163354e-05, + -0.00018647513934411108 + ], + "acc_eval": 0.234375, + "loss_eval": 2.0383992195129395, + "epoch": 45 + }, + { + "hidden_norms_cls": [ + 46.95427322387695, + 31720426.0, + 37234788.0, + 40129424.0, + 42928428.0 + ], + "hidden_norms_avg": [ + 1122.57470703125, + 22583276.0, + 28617936.0, + 33269996.0, + 40462568.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004295881371945143, + 3.419305394380956e-10, + 2.8222821302215095e-10, + 2.8184321543278656e-10, + 2.8312005517783234e-10 + ], + "bp_grad_F": [ + 0.5366736650466919, + 2.256676998513285e-05, + 1.1914533359913548e-08, + 1.1219233542192342e-08, + 1.004730165732326e-08 + ], + "gamma_dfa": 0.00015619578334735706, + "gamma_dfa_per_layer": [ + -0.0010500183561816812, + 0.001834970898926258, + 3.652184386737645e-05, + -0.00019669125322252512 + ], + "acc_eval": 0.2431640625, + "loss_eval": 2.039337396621704, + "epoch": 46 + }, + { + "hidden_norms_cls": [ + 47.09259796142578, + 32824944.0, + 38341332.0, + 41754692.0, + 44005196.0 + ], + "hidden_norms_avg": [ + 1126.26953125, + 24313264.0, + 30669532.0, + 35293632.0, + 41785680.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0005083036958239973, + 3.2607763711389737e-10, + 2.8033902976787317e-10, + 2.7943025671106625e-10, + 2.7980692762774595e-10 + ], + "bp_grad_F": [ + 0.06971772015094757, + 2.262569068989251e-06, + 1.0069017619684928e-08, + 9.845756210324907e-09, + 9.862499261714675e-09 + ], + "gamma_dfa": 0.0007457349984179018, + "gamma_dfa_per_layer": [ + 0.0015201317146420479, + 0.0016060702037066221, + 3.652479063021019e-05, + -0.00017978671530727297 + ], + "acc_eval": 0.25, + "loss_eval": 2.0368857383728027, + "epoch": 47 + }, + { + "hidden_norms_cls": [ + 47.21082305908203, + 33649040.0, + 39036836.0, + 42500816.0, + 44653764.0 + ], + "hidden_norms_avg": [ + 1129.5389404296875, + 24447482.0, + 30689206.0, + 35330028.0, + 42064012.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046678923536092043, + 3.204189136241098e-10, + 2.755325689829391e-10, + 2.7554050707756517e-10, + 2.7654081802275243e-10 + ], + "bp_grad_F": [ + 0.07496139407157898, + 2.2861270281282486e-06, + 9.997683569906712e-09, + 9.715622084627284e-09, + 9.736355721656764e-09 + ], + "gamma_dfa": 0.0006021281524226652, + "gamma_dfa_per_layer": [ + 0.0007927162805572152, + 0.001763419946655631, + 3.104796996922232e-05, + -0.000178671587491408 + ], + "acc_eval": 0.259765625, + "loss_eval": 2.0324196815490723, + "epoch": 48 + }, + { + "hidden_norms_cls": [ + 47.315826416015625, + 34514608.0, + 40222940.0, + 43606628.0, + 45508540.0 + ], + "hidden_norms_avg": [ + 1132.157958984375, + 24487910.0, + 30821460.0, + 35505456.0, + 42327908.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00041785358916968107, + 3.3263317100740153e-10, + 2.696754763942266e-10, + 2.701733836651954e-10, + 2.71275196750409e-10 + ], + "bp_grad_F": [ + 0.08130628615617752, + 3.3661247016425477e-06, + 1.078094857831502e-08, + 9.643851939244996e-09, + 9.617946439277603e-09 + ], + "gamma_dfa": 0.0005021913366363151, + "gamma_dfa_per_layer": [ + 0.00036606384674087167, + 0.0017899572849273682, + 2.7483671146910638e-05, + -0.00017473945626989007 + ], + "acc_eval": 0.2626953125, + "loss_eval": 2.028841495513916, + "epoch": 49 + }, + { + "hidden_norms_cls": [ + 47.388946533203125, + 35118772.0, + 40722008.0, + 44347232.0, + 46331384.0 + ], + "hidden_norms_avg": [ + 1134.3621826171875, + 24821028.0, + 31074444.0, + 35754528.0, + 42627356.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00043533919961191714, + 3.173189211391758e-10, + 2.687766953446413e-10, + 2.68161992611482e-10, + 2.690903055935223e-10 + ], + "bp_grad_F": [ + 0.09458157420158386, + 1.9965789306297665e-06, + 1.025628915130028e-08, + 9.58252854843522e-09, + 9.523047239667903e-09 + ], + "gamma_dfa": 0.00038969498109509004, + "gamma_dfa_per_layer": [ + -0.00010247333557344973, + 0.0018051008228212595, + 3.0877545214025304e-05, + -0.0001747251080814749 + ], + "acc_eval": 0.2548828125, + "loss_eval": 2.0298049449920654, + "epoch": 50 + }, + { + "hidden_norms_cls": [ + 47.4621696472168, + 34836160.0, + 40469796.0, + 44120564.0, + 46361016.0 + ], + "hidden_norms_avg": [ + 1136.3079833984375, + 24152832.0, + 30436140.0, + 35273740.0, + 42621312.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.000491869286634028, + 3.2774055691575654e-10, + 2.667974174919152e-10, + 2.669577336966711e-10, + 2.680060617876734e-10 + ], + "bp_grad_F": [ + 0.0854402706027031, + 1.6183460047614062e-06, + 9.980491100236577e-09, + 9.461099459429079e-09, + 9.473674289495193e-09 + ], + "gamma_dfa": 0.0005695745421689935, + "gamma_dfa_per_layer": [ + 0.0004214277723804116, + 0.001994946738705039, + 3.653779276646674e-05, + -0.00017461413517594337 + ], + "acc_eval": 0.23828125, + "loss_eval": 2.024928092956543, + "epoch": 51 + }, + { + "hidden_norms_cls": [ + 47.52342224121094, + 36446320.0, + 42468064.0, + 46175108.0, + 47947040.0 + ], + "hidden_norms_avg": [ + 1137.8057861328125, + 25400616.0, + 31703746.0, + 36432956.0, + 43307828.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00034005154157057405, + 3.121023717245208e-10, + 2.6523216956064743e-10, + 2.6489818671926457e-10, + 2.649658548126155e-10 + ], + "bp_grad_F": [ + 0.10125189274549484, + 4.0649438233231194e-06, + 9.830144698241838e-09, + 9.345456852827283e-09, + 9.317212779080819e-09 + ], + "gamma_dfa": 0.0005080709906906122, + "gamma_dfa_per_layer": [ + 0.00023581110872328281, + 0.0019333910895511508, + 3.0449831683654338e-05, + -0.00016736806719563901 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.0343496799468994, + "epoch": 52 + }, + { + "hidden_norms_cls": [ + 47.567466735839844, + 35483484.0, + 41150516.0, + 44742840.0, + 47102380.0 + ], + "hidden_norms_avg": [ + 1139.05029296875, + 25225282.0, + 31585082.0, + 36363108.0, + 43411416.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00046872245729900897, + 3.1678357159670156e-10, + 2.6331647973165673e-10, + 2.64141680750285e-10, + 2.646937946604311e-10 + ], + "bp_grad_F": [ + 0.08037562668323517, + 2.9532295684475685e-06, + 9.44631484145475e-09, + 9.393840372240447e-09, + 9.41009226096412e-09 + ], + "gamma_dfa": 0.0005205844290685491, + "gamma_dfa_per_layer": [ + 0.0003642886003945023, + 0.0018537556752562523, + 3.766161171370186e-05, + -0.00017336817109026015 + ], + "acc_eval": 0.2392578125, + "loss_eval": 2.02734375, + "epoch": 53 + }, + { + "hidden_norms_cls": [ + 47.602928161621094, + 35582280.0, + 41200288.0, + 44686488.0, + 47126900.0 + ], + "hidden_norms_avg": [ + 1139.965087890625, + 25657812.0, + 31984420.0, + 36722060.0, + 43681628.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047245126916095614, + 3.1708738412739024e-10, + 2.6278745846042284e-10, + 2.6274540876336516e-10, + 2.6386243190401615e-10 + ], + "bp_grad_F": [ + 0.08141150325536728, + 1.0596501851978246e-05, + 1.0370135861137442e-08, + 1.0129613592368969e-08, + 9.407171930320146e-09 + ], + "gamma_dfa": 0.00048223476824205136, + "gamma_dfa_per_layer": [ + 0.00032963097328320146, + 0.00173661345615983, + 3.3767075365176424e-05, + -0.00017107243184000254 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.0290825366973877, + "epoch": 54 + }, + { + "hidden_norms_cls": [ + 47.62870788574219, + 36373308.0, + 42049216.0, + 45803868.0, + 47955172.0 + ], + "hidden_norms_avg": [ + 1140.6492919921875, + 25698864.0, + 31990548.0, + 36707920.0, + 43700336.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004157091898377985, + 3.1451533044624114e-10, + 2.6160756894100246e-10, + 2.62937283057596e-10, + 2.633904483406724e-10 + ], + "bp_grad_F": [ + 0.28710466623306274, + 2.876764028769685e-06, + 9.405439982401731e-09, + 9.308096515781017e-09, + 9.319982119393444e-09 + ], + "gamma_dfa": 0.00045457817577698734, + "gamma_dfa_per_layer": [ + 0.00011597995762713253, + 0.0018383568385615945, + 3.561873018043116e-05, + -0.00017164282326120883 + ], + "acc_eval": 0.2509765625, + "loss_eval": 2.0309882164001465, + "epoch": 55 + }, + { + "hidden_norms_cls": [ + 47.646034240722656, + 35748556.0, + 41284136.0, + 44861788.0, + 47367128.0 + ], + "hidden_norms_avg": [ + 1141.1492919921875, + 25812252.0, + 32106642.0, + 36789100.0, + 43809728.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004877470782957971, + 3.1724206595029614e-10, + 2.6251881224403917e-10, + 2.627319750647672e-10, + 2.634734097561875e-10 + ], + "bp_grad_F": [ + 0.08355043828487396, + 2.428784682706464e-06, + 9.579466109244095e-09, + 9.378172016738517e-09, + 9.3862775329967e-09 + ], + "gamma_dfa": 0.0006408758436009521, + "gamma_dfa_per_layer": [ + 0.0009491340606473386, + 0.0017479720991104841, + 4.02485384256579e-05, + -0.00017385132377967238 + ], + "acc_eval": 0.2451171875, + "loss_eval": 2.030231475830078, + "epoch": 56 + }, + { + "hidden_norms_cls": [ + 47.65734100341797, + 35952124.0, + 41526152.0, + 45192104.0, + 47596588.0 + ], + "hidden_norms_avg": [ + 1141.4708251953125, + 25858530.0, + 32145604.0, + 36816776.0, + 43830904.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004684069426730275, + 3.1406693912217065e-10, + 2.6245111639511265e-10, + 2.628100792545496e-10, + 2.632017381820617e-10 + ], + "bp_grad_F": [ + 0.16165603697299957, + 3.1715710520074936e-06, + 1.017021755700398e-08, + 9.52006651289139e-09, + 9.360165087457517e-09 + ], + "gamma_dfa": 0.0005993541035422822, + "gamma_dfa_per_layer": [ + 0.0007396150031127036, + 0.0017993964720517397, + 3.345730510773137e-05, + -0.00017505236610304564 + ], + "acc_eval": 0.2529296875, + "loss_eval": 2.030412197113037, + "epoch": 57 + }, + { + "hidden_norms_cls": [ + 47.6636962890625, + 36249912.0, + 41976852.0, + 45623612.0, + 47785064.0 + ], + "hidden_norms_avg": [ + 1141.6495361328125, + 25785932.0, + 32065610.0, + 36745760.0, + 43805624.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047133295447565615, + 3.155541938859585e-10, + 2.617887573386213e-10, + 2.615481442536094e-10, + 2.6276933406954583e-10 + ], + "bp_grad_F": [ + 0.09146469831466675, + 1.8705788988881977e-06, + 9.432087999527994e-09, + 9.323818161988129e-09, + 9.325629157785897e-09 + ], + "gamma_dfa": 0.0005754136018367717, + "gamma_dfa_per_layer": [ + 0.0005892712506465614, + 0.0018461447907611728, + 3.762807318707928e-05, + -0.00017138970724772662 + ], + "acc_eval": 0.251953125, + "loss_eval": 2.031130790710449, + "epoch": 58 + }, + { + "hidden_norms_cls": [ + 47.66678237915039, + 36057328.0, + 41647260.0, + 45391196.0, + 47626604.0 + ], + "hidden_norms_avg": [ + 1141.7391357421875, + 25717830.0, + 31995718.0, + 36684084.0, + 43781820.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.00047832890413701534, + 3.149952798597866e-10, + 2.614737593109595e-10, + 2.6173804790197153e-10, + 2.6257329643897265e-10 + ], + "bp_grad_F": [ + 0.16335515677928925, + 1.6483251101817586e-06, + 9.493151154060797e-09, + 9.393547273361946e-09, + 9.338456230523207e-09 + ], + "gamma_dfa": 0.0005906115802645218, + "gamma_dfa_per_layer": [ + 0.0007219060207717121, + 0.0017734188586473465, + 3.73886723536998e-05, + -0.00017026723071467131 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.0293946266174316, + "epoch": 59 + }, + { + "hidden_norms_cls": [ + 47.666595458984375, + 36029164.0, + 41621316.0, + 45328004.0, + 47606828.0 + ], + "hidden_norms_avg": [ + 1141.736328125, + 25716872.0, + 31991962.0, + 36680384.0, + 43781988.0 + ], + "bp_grad_per_sample_l2_med": [ + 0.0004811616672668606, + 3.1537170097628575e-10, + 2.6223428983840336e-10, + 2.6155200227861997e-10, + 2.6258059615535956e-10 + ], + "bp_grad_F": [ + 0.0951727032661438, + 1.623439857212361e-06, + 9.415242807619961e-09, + 9.343901652414388e-09, + 9.342033813197759e-09 + ], + "gamma_dfa": 0.000660182828141842, + "gamma_dfa_per_layer": [ + 0.0009655870962888002, + 0.0018112185643985868, + 3.598399052862078e-05, + -0.00017205833864863962 + ], + "acc_eval": 0.255859375, + "loss_eval": 2.029409408569336, + "epoch": 60 + } + ] +}
\ No newline at end of file |
