{ "config": { "output_dir": "results/snapshot_vit_v1", "epochs": 60, "lr": 0.001, "wd": 0.05, "seed": 42, "depth": 4, "d_model": 128, "n_heads": 4 }, "depth": 4, "d_model": 128, "architecture": "ViTMini", "bp_log": [ { "hidden_norms_cls": [ 0.31052109599113464, 3.2536301612854004, 4.7681732177734375, 6.129599571228027, 7.124356746673584 ], "hidden_norms_avg": [ 6.008513927459717, 7.034290313720703, 7.942849636077881, 8.915729522705078, 9.635361671447754 ], "bp_grad_per_sample_l2_med": [ 0.004442029166966677, 0.0012008437188342214, 0.0009976272704079747, 0.0009104337659664452, 0.0008558662957511842 ], "bp_grad_F": [ 0.18535660207271576, 0.03968670591711998, 0.032604776322841644, 0.029427478089928627, 0.02746850810945034 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.1376953125, "loss_eval": 2.35188627243042, "epoch": 0 }, { "hidden_norms_cls": [ 0.511958122253418, 12.453446388244629, 18.366989135742188, 25.54116439819336, 31.80699348449707 ], "hidden_norms_avg": [ 4.10694694519043, 10.166566848754883, 14.66998291015625, 19.93342399597168, 25.32619857788086 ], "bp_grad_per_sample_l2_med": [ 0.0019771556835621595, 0.00022324378369376063, 0.00016308785416185856, 0.00014621105219703168, 0.0001451292191632092 ], "bp_grad_F": [ 0.11066891252994537, 0.01034498494118452, 0.006372526753693819, 0.0052248528227210045, 0.005017552524805069 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.4501953125, "loss_eval": 1.5154438018798828, "epoch": 1 }, { "hidden_norms_cls": [ 0.6518111824989319, 13.549692153930664, 20.607715606689453, 27.90418243408203, 32.70498275756836 ], "hidden_norms_avg": [ 4.0909905433654785, 11.942686080932617, 17.39116096496582, 22.200014114379883, 26.230010986328125 ], "bp_grad_per_sample_l2_med": [ 0.0017800139030441642, 0.00026728332159109414, 0.0001720335567370057, 0.0001423172070644796, 0.00013423117343336344 ], "bp_grad_F": [ 0.08781559765338898, 0.010987765155732632, 0.0064147054217755795, 0.0050079175271093845, 0.004637593869119883 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.494140625, "loss_eval": 1.3824832439422607, "epoch": 2 }, { "hidden_norms_cls": [ 0.755299985408783, 11.224863052368164, 19.053363800048828, 27.303081512451172, 33.078182220458984 ], "hidden_norms_avg": [ 4.027151584625244, 12.449769973754883, 17.769508361816406, 22.97556495666504, 27.065759658813477 ], "bp_grad_per_sample_l2_med": [ 0.0018998769810423255, 0.00030996452551335096, 0.00018013815861195326, 0.0001340982416877523, 0.00012205552775412798 ], "bp_grad_F": [ 0.09037011116743088, 0.013488140888512135, 0.007346263621002436, 0.0051797907799482346, 0.004589984193444252 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.5439453125, "loss_eval": 1.2540550231933594, "epoch": 3 }, { "hidden_norms_cls": [ 0.844818651676178, 13.648336410522461, 20.277976989746094, 28.240915298461914, 33.095726013183594 ], "hidden_norms_avg": [ 4.036877632141113, 12.003630638122559, 17.05451011657715, 22.15869903564453, 25.917491912841797 ], "bp_grad_per_sample_l2_med": [ 0.0016167981084436178, 0.00028610811568796635, 0.0001777650322765112, 0.00012878721463494003, 0.0001112063619075343 ], "bp_grad_F": [ 0.07410340011119843, 0.012637714855372906, 0.007633093744516373, 0.005242784973233938, 0.004431390203535557 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.603515625, "loss_eval": 1.1045944690704346, "epoch": 4 }, { "hidden_norms_cls": [ 0.9051892161369324, 12.476008415222168, 19.24710464477539, 27.6123046875, 32.35737609863281 ], "hidden_norms_avg": [ 4.138596057891846, 12.409324645996094, 17.427003860473633, 22.245147705078125, 25.471385955810547 ], "bp_grad_per_sample_l2_med": [ 0.0016044765943661332, 0.00030248358962126076, 0.00018807635933626443, 0.00013626758300233632, 0.00011398641800042242 ], "bp_grad_F": [ 0.08322811126708984, 0.01390017382800579, 0.008505746722221375, 0.005747759714722633, 0.004776888992637396 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.603515625, "loss_eval": 1.1296963691711426, "epoch": 5 }, { "hidden_norms_cls": [ 0.9687634110450745, 11.625859260559082, 18.38014793395996, 26.869504928588867, 31.455507278442383 ], "hidden_norms_avg": [ 4.263001441955566, 13.1234769821167, 17.853057861328125, 22.476547241210938, 25.29656410217285 ], "bp_grad_per_sample_l2_med": [ 0.0015340449754148722, 0.00033552697277627885, 0.00021536082203965634, 0.00015067037020344287, 0.00012220896314829588 ], "bp_grad_F": [ 0.07571946829557419, 0.015132292173802853, 0.009512492455542088, 0.006373303942382336, 0.005029390100389719 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.603515625, "loss_eval": 1.0963702201843262, "epoch": 6 }, { "hidden_norms_cls": [ 1.0029383897781372, 12.687585830688477, 19.734830856323242, 28.174379348754883, 32.5982780456543 ], "hidden_norms_avg": [ 4.357974052429199, 13.182960510253906, 17.720989227294922, 21.832895278930664, 24.934776306152344 ], "bp_grad_per_sample_l2_med": [ 0.0013370191445574164, 0.00026788320974446833, 0.00018144956266041845, 0.00013219293032307178, 0.00010196284711128101 ], "bp_grad_F": [ 0.06996501982212067, 0.013071151450276375, 0.008477694354951382, 0.0061036222614347935, 0.004761465825140476 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6416015625, "loss_eval": 0.9737913012504578, "epoch": 7 }, { "hidden_norms_cls": [ 1.043707013130188, 12.487404823303223, 18.845643997192383, 26.870864868164062, 31.145292282104492 ], "hidden_norms_avg": [ 4.454991340637207, 13.503378868103027, 18.694488525390625, 23.029804229736328, 25.810880661010742 ], "bp_grad_per_sample_l2_med": [ 0.0013130803126841784, 0.00029930632445029914, 0.0002022052649408579, 0.0001383959170198068, 0.00010439592006150633 ], "bp_grad_F": [ 0.0743240937590599, 0.015402271412312984, 0.009977605193853378, 0.006877230014652014, 0.005202346481382847 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.666015625, "loss_eval": 0.9317076206207275, "epoch": 8 }, { "hidden_norms_cls": [ 1.0887501239776611, 12.662396430969238, 18.622724533081055, 26.599454879760742, 31.788663864135742 ], "hidden_norms_avg": [ 4.529710292816162, 13.683384895324707, 18.47463607788086, 22.395898818969727, 25.244558334350586 ], "bp_grad_per_sample_l2_med": [ 0.0012017677072435617, 0.0002972102665808052, 0.00019775003602262586, 0.00013734954700339586, 9.880279685603455e-05 ], "bp_grad_F": [ 0.0661192312836647, 0.01516024675220251, 0.010001113638281822, 0.006893018260598183, 0.0051134442910552025 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6669921875, "loss_eval": 0.9026263952255249, "epoch": 9 }, { "hidden_norms_cls": [ 1.1163448095321655, 12.711283683776855, 18.790128707885742, 26.846359252929688, 31.663158416748047 ], "hidden_norms_avg": [ 4.502295970916748, 13.801639556884766, 18.488975524902344, 22.378704071044922, 25.22056007385254 ], "bp_grad_per_sample_l2_med": [ 0.0011062510311603546, 0.00029147896566428244, 0.0001970102748600766, 0.00013174059859011322, 0.0001037597976392135 ], "bp_grad_F": [ 0.06217500939965248, 0.014721231535077095, 0.00993143580853939, 0.006723989732563496, 0.005166618153452873 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.6845703125, "loss_eval": 0.8660677671432495, "epoch": 10 }, { "hidden_norms_cls": [ 1.1505078077316284, 12.160571098327637, 18.15353012084961, 25.762012481689453, 31.478300094604492 ], "hidden_norms_avg": [ 4.5605149269104, 13.918573379516602, 18.88881492614746, 22.79344940185547, 25.800094604492188 ], "bp_grad_per_sample_l2_med": [ 0.0009689349099062383, 0.0002486997109372169, 0.0001736732665449381, 0.00011473154881969094, 8.573567902203649e-05 ], "bp_grad_F": [ 0.06455213576555252, 0.01547171175479889, 0.010573537088930607, 0.0071961241774261, 0.005212985444813967 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.71484375, "loss_eval": 0.812907874584198, "epoch": 11 }, { "hidden_norms_cls": [ 1.1844152212142944, 11.332664489746094, 16.57625961303711, 23.82307243347168, 28.492321014404297 ], "hidden_norms_avg": [ 4.602160453796387, 13.876313209533691, 17.891036987304688, 21.410982131958008, 23.97108268737793 ], "bp_grad_per_sample_l2_med": [ 0.0009290817542932928, 0.0002613075776025653, 0.0001877332106232643, 0.0001262558507733047, 9.168039832729846e-05 ], "bp_grad_F": [ 0.06392678618431091, 0.01674485206604004, 0.011727217584848404, 0.007738997228443623, 0.005730107892304659 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7197265625, "loss_eval": 0.7641609907150269, "epoch": 12 }, { "hidden_norms_cls": [ 1.2184560298919678, 12.450925827026367, 18.076860427856445, 25.162586212158203, 30.365047454833984 ], "hidden_norms_avg": [ 4.7080278396606445, 13.851634979248047, 18.517131805419922, 22.074214935302734, 24.72054100036621 ], "bp_grad_per_sample_l2_med": [ 0.0009277731878682971, 0.00024563330225646496, 0.00017736255540512502, 0.00012202116340631619, 8.748921391088516e-05 ], "bp_grad_F": [ 0.06389915198087692, 0.016115156933665276, 0.0110858753323555, 0.0076499818824231625, 0.005541808437556028 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.697265625, "loss_eval": 0.8037601113319397, "epoch": 13 }, { "hidden_norms_cls": [ 1.243064045906067, 11.932015419006348, 17.215856552124023, 24.764291763305664, 29.49314308166504 ], "hidden_norms_avg": [ 4.651937961578369, 13.890728950500488, 18.2476749420166, 21.80103302001953, 24.145692825317383 ], "bp_grad_per_sample_l2_med": [ 0.0009111211402341723, 0.000253814272582531, 0.00018247529806103557, 0.00011639296280918643, 8.364167297258973e-05 ], "bp_grad_F": [ 0.06324896216392517, 0.016394753009080887, 0.01153184287250042, 0.007614497095346451, 0.0056136660277843475 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.728515625, "loss_eval": 0.7384279370307922, "epoch": 14 }, { "hidden_norms_cls": [ 1.2652677297592163, 11.532588005065918, 16.7224178314209, 23.326444625854492, 28.03766441345215 ], "hidden_norms_avg": [ 4.652615547180176, 13.981542587280273, 17.984512329101562, 21.317432403564453, 23.233760833740234 ], "bp_grad_per_sample_l2_med": [ 0.0008032417972572148, 0.00022395161795429885, 0.00016904002404771745, 0.0001078559216693975, 7.841538899810985e-05 ], "bp_grad_F": [ 0.06386830657720566, 0.016731705516576767, 0.012135310098528862, 0.008108492009341717, 0.006046997383236885 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7333984375, "loss_eval": 0.7387630939483643, "epoch": 15 }, { "hidden_norms_cls": [ 1.2944419384002686, 11.34481430053711, 16.45362091064453, 22.63861846923828, 28.011232376098633 ], "hidden_norms_avg": [ 4.738389015197754, 13.769956588745117, 17.63072395324707, 21.14189338684082, 23.455045700073242 ], "bp_grad_per_sample_l2_med": [ 0.0007927753031253815, 0.0002345799293834716, 0.00016934113227762282, 0.00011508075840538368, 7.966109114931896e-05 ], "bp_grad_F": [ 0.0655454769730568, 0.01815187744796276, 0.013005951419472694, 0.008820701390504837, 0.006184164900332689 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7255859375, "loss_eval": 0.7302451133728027, "epoch": 16 }, { "hidden_norms_cls": [ 1.3085625171661377, 11.323317527770996, 15.866230964660645, 21.746976852416992, 27.081127166748047 ], "hidden_norms_avg": [ 4.687533855438232, 13.471115112304688, 17.396968841552734, 20.327377319335938, 22.58539581298828 ], "bp_grad_per_sample_l2_med": [ 0.0006625292589887977, 0.00019486426026560366, 0.00014659677981399, 9.787825547391549e-05, 6.321907130768523e-05 ], "bp_grad_F": [ 0.07393868267536163, 0.020178642123937607, 0.014442694373428822, 0.009784683585166931, 0.00656729843467474 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7412109375, "loss_eval": 0.7063955068588257, "epoch": 17 }, { "hidden_norms_cls": [ 1.3433176279067993, 10.762125968933105, 15.129413604736328, 21.06867790222168, 26.1944522857666 ], "hidden_norms_avg": [ 4.709607124328613, 13.69739055633545, 17.006061553955078, 19.97213363647461, 22.212177276611328 ], "bp_grad_per_sample_l2_med": [ 0.0006978239398449659, 0.00021396303782239556, 0.00016030693950597197, 0.00010856003791559488, 6.917239079484716e-05 ], "bp_grad_F": [ 0.06653428077697754, 0.019508732482790947, 0.014456766657531261, 0.010107609443366528, 0.006681134924292564 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.75, "loss_eval": 0.6990396976470947, "epoch": 18 }, { "hidden_norms_cls": [ 1.3607734441757202, 10.718966484069824, 15.383923530578613, 21.34387969970703, 26.49329376220703 ], "hidden_norms_avg": [ 4.7122907638549805, 13.804581642150879, 17.532636642456055, 20.843929290771484, 23.01592254638672 ], "bp_grad_per_sample_l2_med": [ 0.0007053805165924132, 0.0002122409496223554, 0.00016182110994122922, 0.00011085433652624488, 7.204789289971814e-05 ], "bp_grad_F": [ 0.06105736270546913, 0.017779415473341942, 0.013269647024571896, 0.009227588772773743, 0.006410240661352873 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7763671875, "loss_eval": 0.6498311758041382, "epoch": 19 }, { "hidden_norms_cls": [ 1.3752704858779907, 10.530582427978516, 14.803340911865234, 20.217910766601562, 25.20522689819336 ], "hidden_norms_avg": [ 4.7595720291137695, 13.601245880126953, 17.491943359375, 20.960437774658203, 22.910301208496094 ], "bp_grad_per_sample_l2_med": [ 0.0006476694834418595, 0.00020479912927839905, 0.0001524801627965644, 0.00010630583710735664, 6.906194903422147e-05 ], "bp_grad_F": [ 0.06572327762842178, 0.019566379487514496, 0.01484121847897768, 0.010426007211208344, 0.006943442393094301 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.763671875, "loss_eval": 0.6451045274734497, "epoch": 20 }, { "hidden_norms_cls": [ 1.394100546836853, 9.805717468261719, 14.102628707885742, 19.18745231628418, 24.205224990844727 ], "hidden_norms_avg": [ 4.746951580047607, 13.343804359436035, 16.609134674072266, 19.829851150512695, 21.580671310424805 ], "bp_grad_per_sample_l2_med": [ 0.0006192427244968712, 0.0002108582411892712, 0.0001636892993701622, 0.0001098570428439416, 6.864540046080947e-05 ], "bp_grad_F": [ 0.06809430569410324, 0.02151457779109478, 0.01606965810060501, 0.011247958056628704, 0.007375919260084629 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7705078125, "loss_eval": 0.6522111892700195, "epoch": 21 }, { "hidden_norms_cls": [ 1.4160058498382568, 9.728543281555176, 13.389554977416992, 18.542705535888672, 23.791994094848633 ], "hidden_norms_avg": [ 4.738738536834717, 13.15449333190918, 16.28533172607422, 19.581254959106445, 21.488550186157227 ], "bp_grad_per_sample_l2_med": [ 0.0006278376094996929, 0.00020051853789482266, 0.00015803576388861984, 0.0001043542506522499, 6.271857273532078e-05 ], "bp_grad_F": [ 0.07535671442747116, 0.02472539246082306, 0.01880054548382759, 0.012977317906916142, 0.007879889570176601 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.767578125, "loss_eval": 0.6732022762298584, "epoch": 22 }, { "hidden_norms_cls": [ 1.4301073551177979, 9.656251907348633, 13.501574516296387, 18.518707275390625, 23.49370574951172 ], "hidden_norms_avg": [ 4.7338972091674805, 12.90231704711914, 15.899849891662598, 18.982860565185547, 20.785310745239258 ], "bp_grad_per_sample_l2_med": [ 0.0005697127780877054, 0.00018775691569317132, 0.00014216902491170913, 9.182754729408771e-05, 5.984708695905283e-05 ], "bp_grad_F": [ 0.07130222022533417, 0.023520665243268013, 0.017786188051104546, 0.012143870815634727, 0.007813607342541218 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7763671875, "loss_eval": 0.6380050182342529, "epoch": 23 }, { "hidden_norms_cls": [ 1.4623057842254639, 10.028787612915039, 13.687016487121582, 18.426584243774414, 23.602413177490234 ], "hidden_norms_avg": [ 4.807516574859619, 12.739899635314941, 16.150466918945312, 19.439754486083984, 21.316791534423828 ], "bp_grad_per_sample_l2_med": [ 0.0005416463245637715, 0.00019103426893707365, 0.00014568559709005058, 9.899997530737892e-05, 6.29485584795475e-05 ], "bp_grad_F": [ 0.07191846519708633, 0.023787740617990494, 0.01782786287367344, 0.012350695207715034, 0.007955120876431465 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7841796875, "loss_eval": 0.6439570784568787, "epoch": 24 }, { "hidden_norms_cls": [ 1.4565976858139038, 9.294268608093262, 12.656200408935547, 17.385971069335938, 21.959299087524414 ], "hidden_norms_avg": [ 4.774696350097656, 12.394432067871094, 15.230389595031738, 18.10796356201172, 19.88006591796875 ], "bp_grad_per_sample_l2_med": [ 0.0005462650442495942, 0.00019751323270611465, 0.00015244862879626453, 0.00010562407260295004, 6.40779035165906e-05 ], "bp_grad_F": [ 0.07698184996843338, 0.026412304490804672, 0.02022000029683113, 0.013991317711770535, 0.008763212710618973 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7568359375, "loss_eval": 0.6531677842140198, "epoch": 25 }, { "hidden_norms_cls": [ 1.4813296794891357, 9.043482780456543, 12.308734893798828, 16.513948440551758, 21.061283111572266 ], "hidden_norms_avg": [ 4.7356462478637695, 12.33294677734375, 15.104657173156738, 17.771398544311523, 19.526002883911133 ], "bp_grad_per_sample_l2_med": [ 0.000557436200324446, 0.0002021614054683596, 0.0001567570143379271, 0.00010984922846546397, 6.634221062995493e-05 ], "bp_grad_F": [ 0.07777652144432068, 0.027695877477526665, 0.021396547555923462, 0.015052770264446735, 0.009372876025736332 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7744140625, "loss_eval": 0.6539995074272156, "epoch": 26 }, { "hidden_norms_cls": [ 1.4828969240188599, 8.677760124206543, 12.009501457214355, 16.262908935546875, 20.79404067993164 ], "hidden_norms_avg": [ 4.744379043579102, 12.125540733337402, 14.89413833618164, 17.47431182861328, 18.953710556030273 ], "bp_grad_per_sample_l2_med": [ 0.0005026232684031129, 0.00019721532589755952, 0.00014348917466122657, 0.00010225686855847016, 5.8645866374718025e-05 ], "bp_grad_F": [ 0.0830698236823082, 0.03011341392993927, 0.023107260465621948, 0.016188694164156914, 0.00968033168464899 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7744140625, "loss_eval": 0.6444424390792847, "epoch": 27 }, { "hidden_norms_cls": [ 1.5019822120666504, 9.1107816696167, 12.172623634338379, 16.5975341796875, 20.453947067260742 ], "hidden_norms_avg": [ 4.741573333740234, 12.045503616333008, 14.836026191711426, 17.666833877563477, 19.175966262817383 ], "bp_grad_per_sample_l2_med": [ 0.0005040269461460412, 0.00019225970027036965, 0.0001496450131526217, 0.00010478955664439127, 6.137428135843948e-05 ], "bp_grad_F": [ 0.07822537422180176, 0.02863621897995472, 0.022284477949142456, 0.01552330981940031, 0.009474868886172771 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.6074927449226379, "epoch": 28 }, { "hidden_norms_cls": [ 1.5009087324142456, 8.223862648010254, 11.225082397460938, 15.531359672546387, 19.848068237304688 ], "hidden_norms_avg": [ 4.69788122177124, 11.848491668701172, 14.342337608337402, 16.882020950317383, 18.197385787963867 ], "bp_grad_per_sample_l2_med": [ 0.0004685261519625783, 0.00017912790644913912, 0.00013862684136256576, 9.223359666066244e-05, 5.140554640092887e-05 ], "bp_grad_F": [ 0.09127916395664215, 0.03443564847111702, 0.026544470340013504, 0.01809101179242134, 0.010493002831935883 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7783203125, "loss_eval": 0.6329880952835083, "epoch": 29 }, { "hidden_norms_cls": [ 1.509100079536438, 8.238924980163574, 10.995248794555664, 14.927000045776367, 19.032428741455078 ], "hidden_norms_avg": [ 4.678654193878174, 11.513160705566406, 14.12202262878418, 16.704364776611328, 18.131078720092773 ], "bp_grad_per_sample_l2_med": [ 0.0004594121128320694, 0.00018182865460403264, 0.000145129015436396, 0.00010142508108401671, 5.208289803704247e-05 ], "bp_grad_F": [ 0.09080124646425247, 0.03489048779010773, 0.027099598199129105, 0.018760183826088905, 0.010796112939715385 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7822265625, "loss_eval": 0.625268816947937, "epoch": 30 }, { "hidden_norms_cls": [ 1.503785252571106, 7.896090030670166, 10.495330810546875, 14.530640602111816, 18.728647232055664 ], "hidden_norms_avg": [ 4.70166540145874, 11.420204162597656, 13.774767875671387, 16.2652530670166, 17.631481170654297 ], "bp_grad_per_sample_l2_med": [ 0.00043488750816322863, 0.00017315168224740773, 0.0001335645210929215, 8.99006481631659e-05, 5.126056930748746e-05 ], "bp_grad_F": [ 0.10076858103275299, 0.039271026849746704, 0.0300181582570076, 0.020545953884720802, 0.011564387008547783 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.771484375, "loss_eval": 0.6479744911193848, "epoch": 31 }, { "hidden_norms_cls": [ 1.505173921585083, 7.728392124176025, 10.420252799987793, 14.133453369140625, 18.110719680786133 ], "hidden_norms_avg": [ 4.7109880447387695, 11.242951393127441, 13.997397422790527, 16.60598373413086, 17.915313720703125 ], "bp_grad_per_sample_l2_med": [ 0.00040974540752358735, 0.0001792571711121127, 0.00014464404375758022, 9.883226448437199e-05, 5.038536983192898e-05 ], "bp_grad_F": [ 0.09923475980758667, 0.039516862481832504, 0.03056514263153076, 0.021311543881893158, 0.011838918551802635 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7880859375, "loss_eval": 0.6011433601379395, "epoch": 32 }, { "hidden_norms_cls": [ 1.5013800859451294, 7.8755106925964355, 10.452071189880371, 14.013816833496094, 17.622900009155273 ], "hidden_norms_avg": [ 4.662457466125488, 11.018245697021484, 13.179399490356445, 15.56103515625, 16.739452362060547 ], "bp_grad_per_sample_l2_med": [ 0.00033098450512625277, 0.0001421417691744864, 0.00011021740647265688, 7.645406731171533e-05, 4.017115134047344e-05 ], "bp_grad_F": [ 0.09463275969028473, 0.03948793560266495, 0.03067062795162201, 0.021538278087973595, 0.012101472355425358 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8076171875, "loss_eval": 0.5846524238586426, "epoch": 33 }, { "hidden_norms_cls": [ 1.5032685995101929, 7.549060344696045, 10.04562759399414, 13.609556198120117, 17.36180877685547 ], "hidden_norms_avg": [ 4.688360214233398, 11.03510856628418, 13.660865783691406, 16.024188995361328, 17.242145538330078 ], "bp_grad_per_sample_l2_med": [ 0.0003352685598656535, 0.0001500560319982469, 0.000116633229481522, 8.394405449507758e-05, 4.0652244933880866e-05 ], "bp_grad_F": [ 0.10540100187063217, 0.044482193887233734, 0.03421863541007042, 0.023781608790159225, 0.012753129936754704 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7861328125, "loss_eval": 0.5960580110549927, "epoch": 34 }, { "hidden_norms_cls": [ 1.5032752752304077, 7.387601375579834, 9.652260780334473, 13.042936325073242, 16.688335418701172 ], "hidden_norms_avg": [ 4.644099235534668, 10.739524841308594, 13.165095329284668, 15.435381889343262, 16.59172248840332 ], "bp_grad_per_sample_l2_med": [ 0.0003447248600423336, 0.0001518868375569582, 0.00012246235564816743, 8.41514120111242e-05, 4.193704080535099e-05 ], "bp_grad_F": [ 0.11063266545534134, 0.04730832949280739, 0.03743334487080574, 0.02577192150056362, 0.01377912238240242 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.78515625, "loss_eval": 0.652167797088623, "epoch": 35 }, { "hidden_norms_cls": [ 1.4935848712921143, 7.262828826904297, 9.431328773498535, 12.742668151855469, 16.348758697509766 ], "hidden_norms_avg": [ 4.6145453453063965, 10.670759201049805, 12.641580581665039, 14.64714241027832, 15.685794830322266 ], "bp_grad_per_sample_l2_med": [ 0.0003325030847918242, 0.00014367286348715425, 0.00011324919614708051, 7.871988782426342e-05, 4.058879494550638e-05 ], "bp_grad_F": [ 0.11436768621206284, 0.04893247410655022, 0.03840672969818115, 0.02707456797361374, 0.014087510295212269 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7978515625, "loss_eval": 0.6156834363937378, "epoch": 36 }, { "hidden_norms_cls": [ 1.4897189140319824, 7.156031608581543, 9.365946769714355, 12.499292373657227, 15.942588806152344 ], "hidden_norms_avg": [ 4.635710716247559, 10.602685928344727, 12.637743949890137, 14.74621868133545, 15.834792137145996 ], "bp_grad_per_sample_l2_med": [ 0.000299928622553125, 0.00013245265290606767, 0.00010241761629004031, 7.247657049447298e-05, 3.780105180339888e-05 ], "bp_grad_F": [ 0.11267601698637009, 0.0501401461660862, 0.03941003605723381, 0.0279407799243927, 0.014723201282322407 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.80078125, "loss_eval": 0.5903886556625366, "epoch": 37 }, { "hidden_norms_cls": [ 1.4791479110717773, 7.027911186218262, 9.0321044921875, 12.123476028442383, 15.987238883972168 ], "hidden_norms_avg": [ 4.5436177253723145, 10.157598495483398, 12.115620613098145, 14.023022651672363, 15.130277633666992 ], "bp_grad_per_sample_l2_med": [ 0.0002464659046381712, 0.00011603213351918384, 9.401622082805261e-05, 6.44488463876769e-05, 2.8129303245805204e-05 ], "bp_grad_F": [ 0.1319781094789505, 0.05854209512472153, 0.04639327526092529, 0.03260229155421257, 0.01578359492123127 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7841796875, "loss_eval": 0.6532921195030212, "epoch": 38 }, { "hidden_norms_cls": [ 1.4722236394882202, 6.847982406616211, 9.039284706115723, 11.94421672821045, 15.479789733886719 ], "hidden_norms_avg": [ 4.536457538604736, 10.0848388671875, 11.944480895996094, 13.931117057800293, 15.018562316894531 ], "bp_grad_per_sample_l2_med": [ 0.00023636725381948054, 0.00011084756260970607, 8.837366476655006e-05, 6.370043411152437e-05, 3.0101380616542883e-05 ], "bp_grad_F": [ 0.1352969855070114, 0.06069062277674675, 0.04737559333443642, 0.03317096084356308, 0.016367904841899872 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7783203125, "loss_eval": 0.6675163507461548, "epoch": 39 }, { "hidden_norms_cls": [ 1.4741134643554688, 6.7887864112854, 8.833945274353027, 11.777705192565918, 15.091635704040527 ], "hidden_norms_avg": [ 4.546427249908447, 10.082904815673828, 11.992964744567871, 14.035684585571289, 15.085047721862793 ], "bp_grad_per_sample_l2_med": [ 0.0002497230307199061, 0.00011889061715919524, 9.627552208257839e-05, 6.80557859595865e-05, 3.187589391018264e-05 ], "bp_grad_F": [ 0.13283543288707733, 0.06097453087568283, 0.047521013766527176, 0.033583469688892365, 0.016502397134900093 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7998046875, "loss_eval": 0.6332878470420837, "epoch": 40 }, { "hidden_norms_cls": [ 1.4732073545455933, 6.690948009490967, 8.623305320739746, 11.383458137512207, 14.868409156799316 ], "hidden_norms_avg": [ 4.510478973388672, 9.772372245788574, 11.55829906463623, 13.379657745361328, 14.343344688415527 ], "bp_grad_per_sample_l2_med": [ 0.00019870084361173213, 0.00010116927296621725, 8.329773845616728e-05, 6.15280878264457e-05, 2.8435944841476157e-05 ], "bp_grad_F": [ 0.13917136192321777, 0.06636927276849747, 0.05231080949306488, 0.0366261750459671, 0.017451239749789238 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8017578125, "loss_eval": 0.6271109580993652, "epoch": 41 }, { "hidden_norms_cls": [ 1.4620546102523804, 6.489831924438477, 8.487679481506348, 11.202116966247559, 14.761962890625 ], "hidden_norms_avg": [ 4.5009870529174805, 9.717012405395508, 11.480990409851074, 13.235471725463867, 14.178875923156738 ], "bp_grad_per_sample_l2_med": [ 0.00015383858408313245, 8.131976937875152e-05, 6.472255336120725e-05, 4.378501034807414e-05, 1.9541592337191105e-05 ], "bp_grad_F": [ 0.1546960175037384, 0.07402726262807846, 0.058267489075660706, 0.041084613651037216, 0.018521569669246674 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.794921875, "loss_eval": 0.6767467260360718, "epoch": 42 }, { "hidden_norms_cls": [ 1.4651520252227783, 6.564362525939941, 8.296653747558594, 11.014183044433594, 14.418519973754883 ], "hidden_norms_avg": [ 4.483984470367432, 9.593335151672363, 11.23758316040039, 13.036303520202637, 14.015531539916992 ], "bp_grad_per_sample_l2_med": [ 0.0002037636877503246, 0.00010235400259261951, 8.395169425057247e-05, 5.674947897205129e-05, 2.5295201339758933e-05 ], "bp_grad_F": [ 0.15471766889095306, 0.07422170042991638, 0.05941145122051239, 0.04111991077661514, 0.018912144005298615 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8037109375, "loss_eval": 0.6682149171829224, "epoch": 43 }, { "hidden_norms_cls": [ 1.457137107849121, 6.368557929992676, 8.152215957641602, 10.783031463623047, 14.167640686035156 ], "hidden_norms_avg": [ 4.462830066680908, 9.585762977600098, 11.208064079284668, 13.065739631652832, 13.993027687072754 ], "bp_grad_per_sample_l2_med": [ 0.00016671593766659498, 8.65811962285079e-05, 7.217681559268385e-05, 5.042032353230752e-05, 2.1260022549540736e-05 ], "bp_grad_F": [ 0.15730538964271545, 0.07605564594268799, 0.06052647903561592, 0.04247846081852913, 0.01923321560025215 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8134765625, "loss_eval": 0.6757298111915588, "epoch": 44 }, { "hidden_norms_cls": [ 1.4529122114181519, 6.260828018188477, 8.032843589782715, 10.586301803588867, 13.950445175170898 ], "hidden_norms_avg": [ 4.4613800048828125, 9.4591646194458, 11.012088775634766, 12.760184288024902, 13.692852973937988 ], "bp_grad_per_sample_l2_med": [ 0.0001344321499345824, 6.65406696498394e-05, 5.5920852901181206e-05, 3.9107719203457236e-05, 1.5611329217790626e-05 ], "bp_grad_F": [ 0.1660272479057312, 0.08182978630065918, 0.06507853418588638, 0.046549297869205475, 0.020592277869582176 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.806640625, "loss_eval": 0.685518205165863, "epoch": 45 }, { "hidden_norms_cls": [ 1.4509673118591309, 6.163156032562256, 7.82518196105957, 10.378498077392578, 13.96407699584961 ], "hidden_norms_avg": [ 4.434635162353516, 9.335474967956543, 10.857998847961426, 12.551763534545898, 13.511585235595703 ], "bp_grad_per_sample_l2_med": [ 0.00011230952804908156, 5.540825441130437e-05, 4.5063996367389336e-05, 2.9814285881002434e-05, 1.1903831364179496e-05 ], "bp_grad_F": [ 0.1772848516702652, 0.08942516893148422, 0.07126298546791077, 0.04956020042300224, 0.021146513521671295 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7958984375, "loss_eval": 0.69295334815979, "epoch": 46 }, { "hidden_norms_cls": [ 1.4527415037155151, 6.165233612060547, 7.756027698516846, 10.242467880249023, 13.45471477508545 ], "hidden_norms_avg": [ 4.438976287841797, 9.343517303466797, 10.836493492126465, 12.435514450073242, 13.287426948547363 ], "bp_grad_per_sample_l2_med": [ 0.0001074640967999585, 5.268112363410182e-05, 4.352951145847328e-05, 3.164535519317724e-05, 1.2792614143108949e-05 ], "bp_grad_F": [ 0.17606250941753387, 0.08888891339302063, 0.07090400159358978, 0.05056491121649742, 0.021766021847724915 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.806640625, "loss_eval": 0.6969807147979736, "epoch": 47 }, { "hidden_norms_cls": [ 1.4455187320709229, 6.104230880737305, 7.606966972351074, 10.056215286254883, 13.531522750854492 ], "hidden_norms_avg": [ 4.394144535064697, 9.197455406188965, 10.598797798156738, 12.198134422302246, 13.1181001663208 ], "bp_grad_per_sample_l2_med": [ 9.084033081308007e-05, 4.605063077178784e-05, 3.957438457291573e-05, 2.727917853917461e-05, 1.0920393833657727e-05 ], "bp_grad_F": [ 0.1919114887714386, 0.09742862731218338, 0.07786751538515091, 0.05414625629782677, 0.022070109844207764 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.810546875, "loss_eval": 0.713995635509491, "epoch": 48 }, { "hidden_norms_cls": [ 1.4383388757705688, 6.067695617675781, 7.595578670501709, 9.960418701171875, 13.367838859558105 ], "hidden_norms_avg": [ 4.4121479988098145, 9.207226753234863, 10.62590217590332, 12.186077117919922, 13.054762840270996 ], "bp_grad_per_sample_l2_med": [ 0.00010577002831269056, 5.2172203140798956e-05, 4.119141885894351e-05, 2.997498268086929e-05, 1.1721556802513078e-05 ], "bp_grad_F": [ 0.19711492955684662, 0.09961695969104767, 0.07941404730081558, 0.05621125549077988, 0.02285071834921837 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7998046875, "loss_eval": 0.7457866668701172, "epoch": 49 }, { "hidden_norms_cls": [ 1.438454270362854, 6.097946643829346, 7.5858659744262695, 9.956851959228516, 13.270756721496582 ], "hidden_norms_avg": [ 4.392654895782471, 9.144302368164062, 10.536030769348145, 12.092294692993164, 12.985077857971191 ], "bp_grad_per_sample_l2_med": [ 0.00010758326970972121, 5.274294744594954e-05, 4.421125413500704e-05, 3.0753104510949925e-05, 1.1889996130776126e-05 ], "bp_grad_F": [ 0.19883227348327637, 0.1017213836312294, 0.0807848572731018, 0.056292060762643814, 0.022987989708781242 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7998046875, "loss_eval": 0.7402137517929077, "epoch": 50 }, { "hidden_norms_cls": [ 1.4367005825042725, 6.004332542419434, 7.504194259643555, 9.782310485839844, 13.125389099121094 ], "hidden_norms_avg": [ 4.3845720291137695, 9.06988525390625, 10.41169548034668, 11.905806541442871, 12.784433364868164 ], "bp_grad_per_sample_l2_med": [ 9.236831829184666e-05, 4.803440242540091e-05, 3.901722448063083e-05, 2.752364525804296e-05, 1.1449340490798932e-05 ], "bp_grad_F": [ 0.19664740562438965, 0.10213448107242584, 0.08124449104070663, 0.05709528177976608, 0.023260990157723427 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8017578125, "loss_eval": 0.732274055480957, "epoch": 51 }, { "hidden_norms_cls": [ 1.4371269941329956, 5.965888500213623, 7.401495933532715, 9.748833656311035, 13.274619102478027 ], "hidden_norms_avg": [ 4.380629539489746, 9.019668579101562, 10.396828651428223, 11.923394203186035, 12.77461051940918 ], "bp_grad_per_sample_l2_med": [ 7.760760490782559e-05, 4.048245318699628e-05, 3.216555342078209e-05, 2.2310470740194432e-05, 8.838631401886232e-06 ], "bp_grad_F": [ 0.20731569826602936, 0.10790340602397919, 0.08557390421628952, 0.059937626123428345, 0.023827020078897476 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8046875, "loss_eval": 0.7751725316047668, "epoch": 52 }, { "hidden_norms_cls": [ 1.4341260194778442, 5.9393768310546875, 7.411903381347656, 9.739734649658203, 13.19786548614502 ], "hidden_norms_avg": [ 4.378067493438721, 8.986294746398926, 10.316237449645996, 11.792922019958496, 12.673585891723633 ], "bp_grad_per_sample_l2_med": [ 6.968516390770674e-05, 3.471451054792851e-05, 2.8814916731789708e-05, 1.9318980776006356e-05, 7.639268915227149e-06 ], "bp_grad_F": [ 0.2137812376022339, 0.11110929399728775, 0.08847261965274811, 0.06186935305595398, 0.024307044222950935 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8056640625, "loss_eval": 0.764312744140625, "epoch": 53 }, { "hidden_norms_cls": [ 1.4324616193771362, 5.883492469787598, 7.319663047790527, 9.547243118286133, 13.008822441101074 ], "hidden_norms_avg": [ 4.376597881317139, 8.99113941192627, 10.321625709533691, 11.771256446838379, 12.628817558288574 ], "bp_grad_per_sample_l2_med": [ 7.972177991177887e-05, 3.871036460623145e-05, 3.142197601846419e-05, 2.2371379600372165e-05, 8.571933904022444e-06 ], "bp_grad_F": [ 0.21534259617328644, 0.11241323500871658, 0.08915204554796219, 0.06287811696529388, 0.024627922102808952 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7958984375, "loss_eval": 0.7731261253356934, "epoch": 54 }, { "hidden_norms_cls": [ 1.4321078062057495, 5.858248710632324, 7.306819915771484, 9.56387996673584, 13.071084022521973 ], "hidden_norms_avg": [ 4.371452808380127, 8.94082260131836, 10.26811695098877, 11.765360832214355, 12.617104530334473 ], "bp_grad_per_sample_l2_med": [ 7.236401870613918e-05, 3.8528516597580165e-05, 3.0984694603830576e-05, 2.1565809220192023e-05, 7.989257937879302e-06 ], "bp_grad_F": [ 0.2197490781545639, 0.1155213937163353, 0.09188564866781235, 0.06453806161880493, 0.024861471727490425 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.7958984375, "loss_eval": 0.7778797149658203, "epoch": 55 }, { "hidden_norms_cls": [ 1.4319349527359009, 5.846956253051758, 7.283481121063232, 9.520010948181152, 13.023626327514648 ], "hidden_norms_avg": [ 4.372097969055176, 8.950923919677734, 10.25277328491211, 11.715353012084961, 12.572748184204102 ], "bp_grad_per_sample_l2_med": [ 6.399707490345463e-05, 3.384953743079677e-05, 2.7512824090081267e-05, 1.8538266886025667e-05, 7.2009356699709315e-06 ], "bp_grad_F": [ 0.21942120790481567, 0.11553706228733063, 0.09221186488866806, 0.06456339359283447, 0.024819573387503624 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.798828125, "loss_eval": 0.7808230519294739, "epoch": 56 }, { "hidden_norms_cls": [ 1.4311723709106445, 5.84969425201416, 7.275974273681641, 9.513206481933594, 12.99256420135498 ], "hidden_norms_avg": [ 4.37282133102417, 8.946002006530762, 10.248116493225098, 11.702008247375488, 12.54873275756836 ], "bp_grad_per_sample_l2_med": [ 6.404191663023084e-05, 3.509471571305767e-05, 2.9476050258381292e-05, 1.9310447896714322e-05, 7.2306984293391e-06 ], "bp_grad_F": [ 0.22379544377326965, 0.11763197183609009, 0.09364764392375946, 0.06539658457040787, 0.02503892220556736 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.80078125, "loss_eval": 0.7862963080406189, "epoch": 57 }, { "hidden_norms_cls": [ 1.4306355714797974, 5.837501049041748, 7.250905990600586, 9.502866744995117, 13.022948265075684 ], "hidden_norms_avg": [ 4.368107795715332, 8.927281379699707, 10.20923900604248, 11.650206565856934, 12.504077911376953 ], "bp_grad_per_sample_l2_med": [ 7.216054655145854e-05, 3.7455520214280114e-05, 3.0207094823708758e-05, 2.1436455426737666e-05, 7.401154562103329e-06 ], "bp_grad_F": [ 0.22603340446949005, 0.11918352544307709, 0.0947541669011116, 0.06624340265989304, 0.02514214999973774 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.8017578125, "loss_eval": 0.7883187532424927, "epoch": 58 }, { "hidden_norms_cls": [ 1.4303507804870605, 5.833686351776123, 7.24592399597168, 9.48628044128418, 12.962425231933594 ], "hidden_norms_avg": [ 4.368690013885498, 8.926249504089355, 10.21507453918457, 11.65561294555664, 12.507142066955566 ], "bp_grad_per_sample_l2_med": [ 6.914411642355844e-05, 3.7666370189981535e-05, 3.0613842682214454e-05, 2.0578616386046633e-05, 7.153785645641619e-06 ], "bp_grad_F": [ 0.22665317356586456, 0.1197197362780571, 0.09526386857032776, 0.06651060283184052, 0.02521701157093048 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.798828125, "loss_eval": 0.7879265546798706, "epoch": 59 }, { "hidden_norms_cls": [ 1.430293083190918, 5.832674026489258, 7.243373394012451, 9.484408378601074, 12.968917846679688 ], "hidden_norms_avg": [ 4.368374347686768, 8.92542552947998, 10.214056015014648, 11.65438175201416, 12.507084846496582 ], "bp_grad_per_sample_l2_med": [ 6.862521695438772e-05, 3.740868851309642e-05, 3.050716986763291e-05, 2.0533103452180512e-05, 7.137502961995779e-06 ], "bp_grad_F": [ 0.22697713971138, 0.11988355964422226, 0.09540446847677231, 0.06659507006406784, 0.025233659893274307 ], "gamma_dfa": NaN, "gamma_dfa_per_layer": [], "acc_eval": 0.798828125, "loss_eval": 0.7890625, "epoch": 60 } ], "dfa_log": [ { "hidden_norms_cls": [ 0.31052109599113464, 3.2536301612854004, 4.7681732177734375, 6.129599571228027, 7.124356746673584 ], "hidden_norms_avg": [ 6.008513927459717, 7.034290313720703, 7.942849636077881, 8.915729522705078, 9.635361671447754 ], "bp_grad_per_sample_l2_med": [ 0.004442029166966677, 0.0012008437188342214, 0.0009976272704079747, 0.0009104337659664452, 0.0008558662957511842 ], "bp_grad_F": [ 0.18535660207271576, 0.03968670591711998, 0.032604776322841644, 0.029427478089928627, 0.02746850810945034 ], "gamma_dfa": 0.003905070887412876, "gamma_dfa_per_layer": [ 0.004920602310448885, 0.005249542184174061, 0.0038580193649977446, 0.0015921196900308132 ], "acc_eval": 0.1376953125, "loss_eval": 2.35188627243042, "epoch": 0 }, { "hidden_norms_cls": [ 1.969543218612671, 2409.528564453125, 2965.8515625, 5388.57568359375, 10078.4892578125 ], "hidden_norms_avg": [ 45.02196502685547, 4042.294189453125, 10780.892578125, 14336.607421875, 18185.720703125 ], "bp_grad_per_sample_l2_med": [ 0.00021220046619419008, 6.587009124814358e-07, 6.152115474833408e-07, 6.009134381201875e-07, 6.002246095704322e-07 ], "bp_grad_F": [ 0.327708899974823, 5.584151222137734e-05, 3.1912604754325e-05, 2.0850193322985433e-05, 2.061383202089928e-05 ], "gamma_dfa": 0.0062168055737856776, "gamma_dfa_per_layer": [ 0.0034891567192971706, 0.014096655882894993, 0.008750341832637787, -0.0014689321396872401 ], "acc_eval": 0.240234375, "loss_eval": 2.0569005012512207, "epoch": 1 }, { "hidden_norms_cls": [ 4.063174247741699, 6453.43212890625, 10849.3359375, 13374.7021484375, 36052.8046875 ], "hidden_norms_avg": [ 93.43009185791016, 12578.36328125, 48372.984375, 57469.9609375, 73801.421875 ], "bp_grad_per_sample_l2_med": [ 0.00015539559535682201, 2.588524239399703e-07, 1.9553621655177267e-07, 1.8433813409046707e-07, 1.781664309419284e-07 ], "bp_grad_F": [ 0.09239349514245987, 5.2396142564248294e-05, 9.398144356964622e-06, 6.586112704098923e-06, 6.009819117025472e-06 ], "gamma_dfa": 0.009027999331010506, "gamma_dfa_per_layer": [ 0.010615326464176178, 0.014681536704301834, 0.012467417865991592, -0.0016522837104275823 ], "acc_eval": 0.2236328125, "loss_eval": 2.0732030868530273, "epoch": 2 }, { "hidden_norms_cls": [ 6.139724254608154, 13514.7626953125, 22634.615234375, 30011.625, 105646.9140625 ], "hidden_norms_avg": [ 140.93157958984375, 27337.47265625, 105659.2734375, 131533.03125, 178079.78125 ], "bp_grad_per_sample_l2_med": [ 0.00013191952893976122, 1.5711624712366756e-07, 6.783211148331247e-08, 6.273136676782087e-08, 6.216072989673194e-08 ], "bp_grad_F": [ 0.15658611059188843, 2.8997201297897846e-05, 2.6110699309356278e-06, 2.0865154510829598e-06, 2.029548568316386e-06 ], "gamma_dfa": 0.0068359210272319615, "gamma_dfa_per_layer": [ 0.01239929161965847, 0.008297638036310673, 0.009697571396827698, -0.0030508169438689947 ], "acc_eval": 0.2255859375, "loss_eval": 2.0859451293945312, "epoch": 3 }, { "hidden_norms_cls": [ 8.060498237609863, 26771.85546875, 47700.99609375, 65194.9375, 243467.953125 ], "hidden_norms_avg": [ 189.60569763183594, 53537.2734375, 224677.375, 271932.0625, 380665.78125 ], "bp_grad_per_sample_l2_med": [ 6.88996515236795e-05, 7.635610188572173e-08, 3.178359264666142e-08, 2.8310823907418126e-08, 2.8113991135114702e-08 ], "bp_grad_F": [ 0.18565885722637177, 2.3117625460145064e-05, 1.2200183618915617e-06, 1.0046638863059343e-06, 9.67514324656804e-07 ], "gamma_dfa": 0.00588334770873189, "gamma_dfa_per_layer": [ 0.012929551303386688, 0.005936518311500549, 0.009927853010594845, -0.0052605317905545235 ], "acc_eval": 0.216796875, "loss_eval": 2.1008124351501465, "epoch": 4 }, { "hidden_norms_cls": [ 9.924980163574219, 45836.29296875, 86015.5546875, 115240.734375, 396649.5625 ], "hidden_norms_avg": [ 236.08885192871094, 94806.203125, 447709.03125, 539570.125, 680795.4375 ], "bp_grad_per_sample_l2_med": [ 0.00014524323341902345, 3.066869780354864e-08, 1.9569522891060842e-08, 1.7725259482404e-08, 1.7704602228718613e-08 ], "bp_grad_F": [ 0.21425659954547882, 1.3653657333634328e-05, 6.662682494606997e-07, 5.818570798510336e-07, 5.813048460368009e-07 ], "gamma_dfa": 0.006635856116190553, "gamma_dfa_per_layer": [ 0.010879420675337315, 0.013957185670733452, 0.00779206957668066, -0.006085251457989216 ], "acc_eval": 0.2265625, "loss_eval": 2.1039814949035645, "epoch": 5 }, { "hidden_norms_cls": [ 11.746355056762695, 70552.8046875, 256103.15625, 694951.625, 808366.5625 ], "hidden_norms_avg": [ 279.4807434082031, 128343.046875, 645095.375, 810123.8125, 959871.0 ], "bp_grad_per_sample_l2_med": [ 6.159865733934566e-05, 2.1975946395969004e-08, 1.1060357074654803e-08, 9.967390468546e-09, 1.011228256686536e-08 ], "bp_grad_F": [ 0.09021499752998352, 5.0024723350361455e-06, 4.539916176327097e-07, 3.891582309734076e-07, 3.9641980720261927e-07 ], "gamma_dfa": 0.003665695490781218, "gamma_dfa_per_layer": [ 0.009222292341291904, 0.0031545532401651144, 0.00775552075356245, -0.005469584371894598 ], "acc_eval": 0.220703125, "loss_eval": 2.1214356422424316, "epoch": 6 }, { "hidden_norms_cls": [ 13.500020980834961, 102720.734375, 194937.703125, 291956.1875, 801362.9375 ], "hidden_norms_avg": [ 321.6004943847656, 208601.421875, 1002364.1875, 1189027.25, 1448220.5 ], "bp_grad_per_sample_l2_med": [ 0.00014696457947138697, 1.642234792598174e-08, 8.907985460382406e-09, 8.127726935924784e-09, 8.014287011803845e-09 ], "bp_grad_F": [ 0.06841801106929779, 4.044012712256517e-06, 3.4213746857858496e-07, 2.990170742123155e-07, 2.988945198012516e-07 ], "gamma_dfa": 0.004651258233934641, "gamma_dfa_per_layer": [ 0.007132797501981258, 0.010231958702206612, 0.006907162256538868, -0.0056668855249881744 ], "acc_eval": 0.2099609375, "loss_eval": 2.0963404178619385, "epoch": 7 }, { "hidden_norms_cls": [ 15.302024841308594, 160872.96875, 604043.4375, 1296474.125, 1546227.0 ], "hidden_norms_avg": [ 359.47259521484375, 298263.5, 1317573.75, 1553171.25, 1878602.0 ], "bp_grad_per_sample_l2_med": [ 0.000136460512294434, 1.0422226637274434e-08, 5.898865396147812e-09, 5.4856741371622775e-09, 5.4926698744850455e-09 ], "bp_grad_F": [ 0.07932842522859573, 2.1081664272060152e-06, 2.560300345066935e-07, 2.2075181504987995e-07, 2.2043255398784822e-07 ], "gamma_dfa": 0.004627774120308459, "gamma_dfa_per_layer": [ 0.006024104077368975, 0.01116865873336792, 0.005747191607952118, -0.004428857937455177 ], "acc_eval": 0.220703125, "loss_eval": 2.0744481086730957, "epoch": 8 }, { "hidden_norms_cls": [ 17.009462356567383, 204948.671875, 405065.21875, 549855.3125, 1400973.875 ], "hidden_norms_avg": [ 396.66558837890625, 480022.3125, 2019487.75, 2350966.75, 2708745.25 ], "bp_grad_per_sample_l2_med": [ 0.00026586122112348676, 1.0135083883255902e-08, 6.120911777429683e-09, 5.8359819199438334e-09, 5.662275093243352e-09 ], "bp_grad_F": [ 0.37594228982925415, 1.2430107744876295e-05, 2.3164905371686473e-07, 2.0265188993562333e-07, 2.001279000296563e-07 ], "gamma_dfa": 0.004862090456299484, "gamma_dfa_per_layer": [ 0.006278482731431723, 0.012495312839746475, 0.005351733416318893, -0.004677167162299156 ], "acc_eval": 0.2265625, "loss_eval": 2.0641043186187744, "epoch": 9 }, { "hidden_norms_cls": [ 18.669273376464844, 316404.0625, 619048.375, 804163.5, 1798441.0 ], "hidden_norms_avg": [ 434.9389343261719, 650998.25, 2437815.25, 2802479.0, 3269810.75 ], "bp_grad_per_sample_l2_med": [ 0.0003605277743190527, 6.009571951182124e-09, 4.676837139783174e-09, 4.657723096102018e-09, 4.49635484400801e-09 ], "bp_grad_F": [ 0.14846132695674896, 4.3979816837236285e-06, 1.7215310776919068e-07, 1.581869213396203e-07, 1.561998885790672e-07 ], "gamma_dfa": 0.004480502451770008, "gamma_dfa_per_layer": [ 0.006086423061788082, 0.010957473888993263, 0.004586817231029272, -0.003708704374730587 ], "acc_eval": 0.2265625, "loss_eval": 2.0591208934783936, "epoch": 10 }, { "hidden_norms_cls": [ 20.326766967773438, 443508.46875, 899668.0625, 1131299.375, 2182177.5 ], "hidden_norms_avg": [ 473.4957275390625, 854388.9375, 2926402.0, 3295286.75, 3825241.0 ], "bp_grad_per_sample_l2_med": [ 0.0005711699486710131, 4.8561932253221585e-09, 3.871160725310574e-09, 3.833432238309342e-09, 3.74674646863582e-09 ], "bp_grad_F": [ 1.0882306098937988, 3.257442813264788e-06, 1.6311048511852277e-07, 1.3397652764979284e-07, 1.326638283671855e-07 ], "gamma_dfa": 0.00462920154677704, "gamma_dfa_per_layer": [ 0.008616073988378048, 0.009468363597989082, 0.003528183326125145, -0.003095814725384116 ], "acc_eval": 0.234375, "loss_eval": 2.0471031665802, "epoch": 11 }, { "hidden_norms_cls": [ 21.944751739501953, 581616.1875, 1205317.625, 1456984.375, 2587496.75 ], "hidden_norms_avg": [ 511.203125, 1119566.25, 3562080.25, 3992681.5, 4538977.5 ], "bp_grad_per_sample_l2_med": [ 0.0009346234728582203, 4.117307383921798e-09, 3.257990321969828e-09, 3.2349201095627222e-09, 3.1638915931608835e-09 ], "bp_grad_F": [ 0.42184242606163025, 2.2249487301451154e-06, 1.2586481545895367e-07, 1.1919513553948491e-07, 1.181974553787768e-07 ], "gamma_dfa": 0.0034259117674082518, "gamma_dfa_per_layer": [ 0.00526365265250206, 0.008116653189063072, 0.0030386103317141533, -0.0027152691036462784 ], "acc_eval": 0.2255859375, "loss_eval": 2.0867815017700195, "epoch": 12 }, { "hidden_norms_cls": [ 23.46192741394043, 733909.875, 1508464.125, 1841074.875, 3055228.75 ], "hidden_norms_avg": [ 546.8953247070312, 1235037.0, 3742642.75, 4200378.0, 4892382.5 ], "bp_grad_per_sample_l2_med": [ 0.0009773626225069165, 3.5754739169391314e-09, 2.9525657474493983e-09, 2.9297144710227485e-09, 2.8955173814182444e-09 ], "bp_grad_F": [ 0.15538839995861053, 2.0067516288690967e-06, 1.1871279781416888e-07, 1.046255491132797e-07, 1.0416235340926505e-07 ], "gamma_dfa": 0.002340688748518005, "gamma_dfa_per_layer": [ 0.0019294173689559102, 0.007100729271769524, 0.0026949853636324406, -0.0023623770102858543 ], "acc_eval": 0.232421875, "loss_eval": 2.088564872741699, "epoch": 13 }, { "hidden_norms_cls": [ 24.94734764099121, 1151802.75, 3671404.25, 4625593.5, 5052590.0 ], "hidden_norms_avg": [ 582.0977172851562, 1475600.75, 4403784.0, 5008330.0, 5801902.5 ], "bp_grad_per_sample_l2_med": [ 0.0007562927203252912, 2.676908916754428e-09, 2.2055020032496486e-09, 2.179777247590664e-09, 2.173634161550808e-09 ], "bp_grad_F": [ 0.36642539501190186, 3.967601060139714e-06, 8.444904864290947e-08, 7.993684647544796e-08, 7.900475651467787e-08 ], "gamma_dfa": 0.0017957038653548807, "gamma_dfa_per_layer": [ 0.0019046596717089415, 0.005139546003192663, 0.001759346341714263, -0.0016207365551963449 ], "acc_eval": 0.2109375, "loss_eval": 2.08038330078125, "epoch": 14 }, { "hidden_norms_cls": [ 26.36701011657715, 2210167.25, 6804633.5, 7592304.0, 7772230.0 ], "hidden_norms_avg": [ 615.4749145507812, 1852637.875, 5297662.0, 6054509.0, 6940769.5 ], "bp_grad_per_sample_l2_med": [ 0.0009053644607774913, 2.014937106054049e-09, 1.6813730407960747e-09, 1.63718916201816e-09, 1.6135126568173064e-09 ], "bp_grad_F": [ 0.15154746174812317, 3.760401341423858e-06, 6.479213254806382e-08, 6.350511227992683e-08, 6.00040195308793e-08 ], "gamma_dfa": 0.00026495405472815037, "gamma_dfa_per_layer": [ -0.0023696955759078264, 0.0033954931423068047, 0.0012687842827290297, -0.0012347656302154064 ], "acc_eval": 0.2333984375, "loss_eval": 2.0685791969299316, "epoch": 15 }, { "hidden_norms_cls": [ 27.747814178466797, 2020373.25, 6352088.0, 7372759.0, 7751557.0 ], "hidden_norms_avg": [ 647.8715209960938, 2166255.0, 5964871.0, 6820316.0, 7888183.5 ], "bp_grad_per_sample_l2_med": [ 0.000535959261469543, 1.8833379300531305e-09, 1.6251041623505103e-09, 1.5936774122593533e-09, 1.5920619267362213e-09 ], "bp_grad_F": [ 0.06977186352014542, 4.2289293560315855e-06, 5.94431135425566e-08, 5.634814925770115e-08, 5.626874255426628e-08 ], "gamma_dfa": 0.0009004889943753369, "gamma_dfa_per_layer": [ 1.3074517482891679e-05, 0.003544538514688611, 0.0012792267370969057, -0.0012348837917670608 ], "acc_eval": 0.234375, "loss_eval": 2.0676896572113037, "epoch": 16 }, { "hidden_norms_cls": [ 29.053590774536133, 3083884.0, 8692576.0, 10024582.0, 10278143.0 ], "hidden_norms_avg": [ 679.1322021484375, 2750560.0, 7205648.0, 8204248.5, 9336888.0 ], "bp_grad_per_sample_l2_med": [ 0.0006835769745521247, 1.5781399520520267e-09, 1.3378861352109084e-09, 1.2995797771253592e-09, 1.2820219330578198e-09 ], "bp_grad_F": [ 0.25767308473587036, 1.6246455061263987e-06, 6.349461756371966e-08, 6.242527206268278e-08, 4.5665522918625356e-08 ], "gamma_dfa": 0.0003357882087584585, "gamma_dfa_per_layer": [ -0.001319598057307303, 0.002733789850026369, 0.0008947808528319001, -0.0009658198105171323 ], "acc_eval": 0.23046875, "loss_eval": 2.0777204036712646, "epoch": 17 }, { "hidden_norms_cls": [ 30.246440887451172, 3200014.0, 8626485.0, 9743865.0, 10146681.0 ], "hidden_norms_avg": [ 708.5135498046875, 2989787.0, 7458187.5, 8607358.0, 10070516.0 ], "bp_grad_per_sample_l2_med": [ 0.0005841738311573863, 1.4247033552905464e-09, 1.2406603522308046e-09, 1.21434362565509e-09, 1.217411615961339e-09 ], "bp_grad_F": [ 0.08999939262866974, 1.7538721976961824e-06, 4.803559150445835e-08, 4.36282370230856e-08, 4.3068951072200434e-08 ], "gamma_dfa": -2.2506676032207906e-05, "gamma_dfa_per_layer": [ -0.002581980312243104, 0.002518225461244583, 0.0009317069780081511, -0.0009579788311384618 ], "acc_eval": 0.2392578125, "loss_eval": 2.0627658367156982, "epoch": 18 }, { "hidden_norms_cls": [ 31.42615509033203, 4556513.5, 10711725.0, 11956874.0, 12318100.0 ], "hidden_norms_avg": [ 737.157958984375, 3520006.5, 8303534.5, 9571905.0, 11293369.0 ], "bp_grad_per_sample_l2_med": [ 0.0007374613196589053, 1.2111865954622658e-09, 1.0633514069269268e-09, 1.0194807220642588e-09, 1.0034837405470398e-09 ], "bp_grad_F": [ 0.12247106432914734, 2.740941681622644e-06, 4.6019909660799385e-08, 4.372383344275477e-08, 3.6865596797497346e-08 ], "gamma_dfa": 0.0005736843086197041, "gamma_dfa_per_layer": [ 0.0002251334663014859, 0.0021776340436190367, 0.0006795942317694426, -0.0007876245072111487 ], "acc_eval": 0.22265625, "loss_eval": 2.062939167022705, "epoch": 19 }, { "hidden_norms_cls": [ 32.559165954589844, 4224958.5, 10227904.0, 11507743.0, 12041642.0 ], "hidden_norms_avg": [ 765.5013427734375, 3988012.5, 8953060.0, 10431809.0, 12380471.0 ], "bp_grad_per_sample_l2_med": [ 0.0006474430556409061, 1.179957687114097e-09, 1.0031043773395254e-09, 9.744786089171953e-10, 9.782840093564005e-10 ], "bp_grad_F": [ 0.12209221720695496, 1.616509621271689e-06, 3.8821241332698264e-08, 3.6648025059093925e-08, 3.527756931021031e-08 ], "gamma_dfa": -0.00019280995184089988, "gamma_dfa_per_layer": [ -0.002911232877522707, 0.0022857212461531162, 0.0006594176520593464, -0.0008051458280533552 ], "acc_eval": 0.240234375, "loss_eval": 2.0555338859558105, "epoch": 20 }, { "hidden_norms_cls": [ 33.59370040893555, 5323277.5, 11855673.0, 13697022.0, 14246667.0 ], "hidden_norms_avg": [ 789.9629516601562, 4634178.0, 10205192.0, 11930021.0, 13993152.0 ], "bp_grad_per_sample_l2_med": [ 0.0006352875498123467, 1.0036302899862903e-09, 8.794808215029093e-10, 8.579849608558732e-10, 8.574586596310496e-10 ], "bp_grad_F": [ 0.09745635837316513, 5.127232043378172e-07, 3.342180221466151e-08, 3.173540363832217e-08, 3.091372491326183e-08 ], "gamma_dfa": -0.0006959605379961431, "gamma_dfa_per_layer": [ -0.004454955458641052, 0.0018251645378768444, 0.0005447655566968024, -0.000698816787917167 ], "acc_eval": 0.2265625, "loss_eval": 2.056840181350708, "epoch": 21 }, { "hidden_norms_cls": [ 34.583858489990234, 6778143.0, 13401385.0, 15847366.0, 16344266.0 ], "hidden_norms_avg": [ 814.3038330078125, 5395352.5, 11137891.0, 13094203.0, 15406614.0 ], "bp_grad_per_sample_l2_med": [ 0.0006492820102721453, 8.925201688825268e-10, 7.777718469270667e-10, 7.627384279729199e-10, 7.601627105557895e-10 ], "bp_grad_F": [ 0.08801906555891037, 1.8660392697711359e-06, 3.472371190582635e-08, 2.7845679539950652e-08, 2.7135749647300145e-08 ], "gamma_dfa": -0.0012016263353871182, "gamma_dfa_per_layer": [ -0.006280785892158747, 0.001651690574362874, 0.0004266214673407376, -0.0006040314910933375 ], "acc_eval": 0.2255859375, "loss_eval": 2.0746021270751953, "epoch": 22 }, { "hidden_norms_cls": [ 35.516666412353516, 6985935.5, 14020116.0, 16575473.0, 17109272.0 ], "hidden_norms_avg": [ 838.5614013671875, 6365095.0, 12448551.0, 14566203.0, 16943832.0 ], "bp_grad_per_sample_l2_med": [ 0.0007437304593622684, 8.387662786546457e-10, 7.299132409599451e-10, 7.170505300635455e-10, 7.115786293532267e-10 ], "bp_grad_F": [ 0.1540054827928543, 1.4262270724429982e-06, 2.9031822279534936e-08, 2.776059560005706e-08, 2.5270722403547552e-08 ], "gamma_dfa": -0.00010950746218441054, "gamma_dfa_per_layer": [ -0.0017721566837280989, 0.0015054477844387293, 0.0003872170636896044, -0.000558538013137877 ], "acc_eval": 0.2392578125, "loss_eval": 2.065904140472412, "epoch": 23 }, { "hidden_norms_cls": [ 36.39850997924805, 7861434.0, 14415042.0, 16660478.0, 17496562.0 ], "hidden_norms_avg": [ 862.4805297851562, 6600421.5, 12694272.0, 15043836.0, 17968980.0 ], "bp_grad_per_sample_l2_med": [ 0.0005834798794239759, 7.558619286029966e-10, 6.530426754913776e-10, 6.420492471015393e-10, 6.389526685524061e-10 ], "bp_grad_F": [ 0.09943251311779022, 1.4788431599299656e-06, 2.582997993272329e-08, 2.3754548550414256e-08, 2.322415859623561e-08 ], "gamma_dfa": -0.0009345750440843403, "gamma_dfa_per_layer": [ -0.005123761482536793, 0.0015550897223874927, 0.0003447675844654441, -0.0005143960006535053 ], "acc_eval": 0.2529296875, "loss_eval": 2.041043758392334, "epoch": 24 }, { "hidden_norms_cls": [ 37.283199310302734, 8933519.0, 15359962.0, 17441364.0, 18346258.0 ], "hidden_norms_avg": [ 883.0538330078125, 7354756.0, 13721222.0, 16105006.0, 19368310.0 ], "bp_grad_per_sample_l2_med": [ 0.00026283934130333364, 6.873029922971341e-10, 6.058342161274766e-10, 6.000055452481945e-10, 5.98545990548871e-10 ], "bp_grad_F": [ 0.11474847048521042, 2.4628958271932788e-05, 1.3788282160476228e-07, 2.199209525599599e-08, 2.15279509774291e-08 ], "gamma_dfa": -0.0014451614988502115, "gamma_dfa_per_layer": [ -0.006978219375014305, 0.0013526652473956347, 0.0002992081572301686, -0.0004543000250123441 ], "acc_eval": 0.2451171875, "loss_eval": 2.0492172241210938, "epoch": 25 }, { "hidden_norms_cls": [ 38.11500930786133, 10836846.0, 17507178.0, 19929002.0, 20726542.0 ], "hidden_norms_avg": [ 901.960205078125, 8138403.5, 14552406.0, 17157852.0, 20773122.0 ], "bp_grad_per_sample_l2_med": [ 0.0005291851703077555, 6.35470620569123e-10, 5.6208532273061e-10, 5.496996191567405e-10, 5.433966054901873e-10 ], "bp_grad_F": [ 0.07972504198551178, 1.2489309710872476e-06, 2.2593511062041216e-08, 2.1460177634935462e-08, 1.941634231172884e-08 ], "gamma_dfa": -0.000788729106716346, "gamma_dfa_per_layer": [ -0.00451657734811306, 0.0015372345224022865, 0.00024382121046073735, -0.00041939481161534786 ], "acc_eval": 0.2265625, "loss_eval": 2.0669429302215576, "epoch": 26 }, { "hidden_norms_cls": [ 38.87166213989258, 11480826.0, 18077316.0, 20884150.0, 22098916.0 ], "hidden_norms_avg": [ 920.577880859375, 8893063.0, 15579717.0, 18401958.0, 22225722.0 ], "bp_grad_per_sample_l2_med": [ 0.0005104477168060839, 5.858571405781277e-10, 5.198571018105724e-10, 5.114682011253535e-10, 5.120092128052534e-10 ], "bp_grad_F": [ 0.13577552139759064, 2.0482397303567268e-05, 2.1394010119024642e-08, 2.0649670418038113e-08, 1.8286096192809964e-08 ], "gamma_dfa": -0.0004262418224243447, "gamma_dfa_per_layer": [ -0.0029134145006537437, 0.0013950758147984743, 0.00018188939429819584, -0.0003685179981403053 ], "acc_eval": 0.2490234375, "loss_eval": 2.053382396697998, "epoch": 27 }, { "hidden_norms_cls": [ 39.6179313659668, 10591964.0, 16346992.0, 18847678.0, 21847726.0 ], "hidden_norms_avg": [ 937.9719848632812, 9576851.0, 16784906.0, 19828342.0, 23673520.0 ], "bp_grad_per_sample_l2_med": [ 0.00023470228188671172, 5.629120503058971e-10, 5.04818964408571e-10, 4.974847200855947e-10, 4.968530586957343e-10 ], "bp_grad_F": [ 0.03459252789616585, 8.028884622035548e-06, 1.9716548393944322e-08, 1.807922522800709e-08, 1.7913645677936074e-08 ], "gamma_dfa": -0.0018089709192281589, "gamma_dfa_per_layer": [ -0.008484212681651115, 0.0014374498277902603, 0.00020184949971735477, -0.00039097032276913524 ], "acc_eval": 0.224609375, "loss_eval": 2.0604443550109863, "epoch": 28 }, { "hidden_norms_cls": [ 40.344242095947266, 10467030.0, 15235544.0, 17027748.0, 23281082.0 ], "hidden_norms_avg": [ 954.3844604492188, 10038487.0, 16584430.0, 19613710.0, 24505476.0 ], "bp_grad_per_sample_l2_med": [ 0.00015729073493275791, 5.36418076624301e-10, 4.5378717450361705e-10, 4.4796202858243817e-10, 4.477457571372412e-10 ], "bp_grad_F": [ 0.04820869117975235, 2.3596087430632906e-06, 1.7855482425943592e-08, 1.7340139990551506e-08, 1.672622929049794e-08 ], "gamma_dfa": -0.0013171448226785287, "gamma_dfa_per_layer": [ -0.006438364274799824, 0.0013229507021605968, 0.00020032597240060568, -0.00035349169047549367 ], "acc_eval": 0.236328125, "loss_eval": 2.061581611633301, "epoch": 29 }, { "hidden_norms_cls": [ 41.04903793334961, 12235056.0, 17721728.0, 19784938.0, 25024272.0 ], "hidden_norms_avg": [ 969.5825805664062, 11940616.0, 19401350.0, 22468846.0, 26879212.0 ], "bp_grad_per_sample_l2_med": [ 0.00035265026963315904, 5.423251847602728e-10, 4.4247547292819434e-10, 4.358849947649901e-10, 4.3593659238005955e-10 ], "bp_grad_F": [ 0.0735621377825737, 1.917086819958058e-06, 1.9346130031294706e-08, 1.5936171493535767e-08, 1.5501758099389917e-08 ], "gamma_dfa": -0.001081134716514498, "gamma_dfa_per_layer": [ -0.005434883758425713, 0.0012318368535488844, 0.00019993717432953417, -0.00032142913551069796 ], "acc_eval": 0.2265625, "loss_eval": 2.0760293006896973, "epoch": 30 }, { "hidden_norms_cls": [ 41.723567962646484, 10562926.0, 13746881.0, 15736975.0, 26354068.0 ], "hidden_norms_avg": [ 984.3485717773438, 12533570.0, 19717132.0, 22961588.0, 28083302.0 ], "bp_grad_per_sample_l2_med": [ 0.0002546848263591528, 4.777176432213537e-10, 4.0483683072523036e-10, 4.0072575813177025e-10, 4.013349652609577e-10 ], "bp_grad_F": [ 0.06879052519798279, 1.7057992636182462e-06, 1.6271217262442406e-08, 1.4877675091895526e-08, 1.484982270483215e-08 ], "gamma_dfa": -0.0015064112594700418, "gamma_dfa_per_layer": [ -0.007336798589676619, 0.0013772943057119846, 0.00022022609482519329, -0.0002863668487407267 ], "acc_eval": 0.20703125, "loss_eval": 2.078207492828369, "epoch": 31 }, { "hidden_norms_cls": [ 42.342227935791016, 13283171.0, 17422292.0, 19770980.0, 28086972.0 ], "hidden_norms_avg": [ 999.26123046875, 13875387.0, 21404830.0, 24833206.0, 29923332.0 ], "bp_grad_per_sample_l2_med": [ 0.0003442879824433476, 4.4142753341525065e-10, 3.8908712363117104e-10, 3.845144203040718e-10, 3.8369810106964053e-10 ], "bp_grad_F": [ 0.10482411086559296, 2.8695783385046525e-06, 1.7273855235089286e-08, 1.4195452813225984e-08, 1.3857171410336377e-08 ], "gamma_dfa": -0.0009248298447346315, "gamma_dfa_per_layer": [ -0.004888010676950216, 0.0012753453338518739, 0.00017224671319127083, -0.0002589007490314543 ], "acc_eval": 0.2373046875, "loss_eval": 2.078000068664551, "epoch": 32 }, { "hidden_norms_cls": [ 42.90097427368164, 16870614.0, 22116480.0, 24442270.0, 29665536.0 ], "hidden_norms_avg": [ 1013.56396484375, 14764026.0, 21856036.0, 25334308.0, 30474444.0 ], "bp_grad_per_sample_l2_med": [ 0.00047380090109072626, 4.22005735911668e-10, 3.5831293487831317e-10, 3.5505443030103834e-10, 3.5614466931122024e-10 ], "bp_grad_F": [ 0.1035437062382698, 1.2711110457530594e-06, 1.418432571398398e-08, 1.2978671470875724e-08, 1.2937439564097986e-08 ], "gamma_dfa": -0.00034118785697501153, "gamma_dfa_per_layer": [ -0.002568737603724003, 0.001293556997552514, 0.000137164635816589, -0.00022673545754514635 ], "acc_eval": 0.2265625, "loss_eval": 2.0730109214782715, "epoch": 33 }, { "hidden_norms_cls": [ 43.419898986816406, 18221210.0, 22675590.0, 24728546.0, 30520888.0 ], "hidden_norms_avg": [ 1027.6595458984375, 16337822.0, 23378412.0, 26921720.0, 31927994.0 ], "bp_grad_per_sample_l2_med": [ 0.0004629126051440835, 4.106864293085266e-10, 3.557905081663648e-10, 3.536362591649578e-10, 3.5421768296295397e-10 ], "bp_grad_F": [ 0.08281872421503067, 1.4263683851822861e-06, 1.3245164076636229e-08, 1.2740572152836194e-08, 1.2752362721357713e-08 ], "gamma_dfa": -0.0006677984529233072, "gamma_dfa_per_layer": [ -0.0036979843862354755, 0.0011370242573320866, 0.00012192466238047928, -0.00023215834517031908 ], "acc_eval": 0.23828125, "loss_eval": 2.0669164657592773, "epoch": 34 }, { "hidden_norms_cls": [ 43.868682861328125, 18758150.0, 23109030.0, 25432404.0, 31503354.0 ], "hidden_norms_avg": [ 1040.644287109375, 15512033.0, 21965288.0, 25882228.0, 31813648.0 ], "bp_grad_per_sample_l2_med": [ 0.00048007385339587927, 4.271450415593847e-10, 3.4119135294830016e-10, 3.391489034054729e-10, 3.387232438978316e-10 ], "bp_grad_F": [ 0.36019906401634216, 1.9220671674702317e-05, 1.358929768713324e-08, 1.2455363851415768e-08, 1.2401786264604198e-08 ], "gamma_dfa": -0.00031488661625189707, "gamma_dfa_per_layer": [ -0.002551896497607231, 0.001431336859241128, 9.301750105805695e-05, -0.00023200432769954205 ], "acc_eval": 0.234375, "loss_eval": 2.0609660148620605, "epoch": 35 }, { "hidden_norms_cls": [ 44.293697357177734, 21659484.0, 26491946.0, 29332332.0, 32793040.0 ], "hidden_norms_avg": [ 1051.83740234375, 17567000.0, 24049368.0, 28083622.0, 33467380.0 ], "bp_grad_per_sample_l2_med": [ 0.00043948061647824943, 4.0486294872188466e-10, 3.3493480211532756e-10, 3.3453453895937457e-10, 3.3604671823006527e-10 ], "bp_grad_F": [ 0.10878865420818329, 3.037727083210484e-06, 1.2592222375928941e-08, 1.2103843261002112e-08, 1.2022392859023512e-08 ], "gamma_dfa": -0.00015630935013177805, "gamma_dfa_per_layer": [ -0.0019119374919682741, 0.0014281735057011247, 7.57485831854865e-05, -0.00021722199744544923 ], "acc_eval": 0.2431640625, "loss_eval": 2.0587897300720215, "epoch": 36 }, { "hidden_norms_cls": [ 44.68658447265625, 21628572.0, 26077032.0, 28336790.0, 33305650.0 ], "hidden_norms_avg": [ 1062.067138671875, 18163602.0, 24404446.0, 28478594.0, 34156064.0 ], "bp_grad_per_sample_l2_med": [ 0.0005865619168616831, 4.0249623078914e-10, 3.3121710929506776e-10, 3.310392793220984e-10, 3.318675056984688e-10 ], "bp_grad_F": [ 0.20061102509498596, 1.4544431223839638e-06, 1.3441372459510603e-08, 1.2418687411752671e-08, 1.2016870165609816e-08 ], "gamma_dfa": -0.00039686575473751873, "gamma_dfa_per_layer": [ -0.0029668076895177364, 0.0015295962803065777, 6.985102663747966e-05, -0.00022010263637639582 ], "acc_eval": 0.2275390625, "loss_eval": 2.0569839477539062, "epoch": 37 }, { "hidden_norms_cls": [ 45.062259674072266, 25376026.0, 30203382.0, 32772746.0, 35119040.0 ], "hidden_norms_avg": [ 1071.6630859375, 18637428.0, 24671676.0, 28819074.0, 34739232.0 ], "bp_grad_per_sample_l2_med": [ 0.0005594053072854877, 3.9023292930373543e-10, 3.2509483993692356e-10, 3.23913590394298e-10, 3.250162639023557e-10 ], "bp_grad_F": [ 0.13359014689922333, 4.247889592079446e-06, 1.4051211749688264e-08, 1.2317144637563615e-08, 1.1531787968976914e-08 ], "gamma_dfa": -0.0005283378432068275, "gamma_dfa_per_layer": [ -0.0037097278982400894, 0.0017695487476885319, 4.308431380195543e-05, -0.000216256536077708 ], "acc_eval": 0.2666015625, "loss_eval": 2.0476396083831787, "epoch": 38 }, { "hidden_norms_cls": [ 45.38731384277344, 24903830.0, 30026926.0, 33563200.0, 35539932.0 ], "hidden_norms_avg": [ 1080.0860595703125, 20496828.0, 26709690.0, 30932660.0, 36357072.0 ], "bp_grad_per_sample_l2_med": [ 0.0005004233680665493, 3.8017103354270887e-10, 3.1730867933177365e-10, 3.167333340048373e-10, 3.1768215835725755e-10 ], "bp_grad_F": [ 0.24717594683170319, 2.9436714612529613e-06, 1.1934382371237007e-08, 1.1459838411553847e-08, 1.1365100860416533e-08 ], "gamma_dfa": -0.00022031009211787023, "gamma_dfa_per_layer": [ -0.0022991469595581293, 0.0015725505072623491, 4.821528273168951e-05, -0.00020285919890739024 ], "acc_eval": 0.244140625, "loss_eval": 2.0488319396972656, "epoch": 39 }, { "hidden_norms_cls": [ 45.68830490112305, 27470426.0, 32688434.0, 35418348.0, 37778420.0 ], "hidden_norms_avg": [ 1088.195068359375, 19636778.0, 25748976.0, 30137794.0, 36341748.0 ], "bp_grad_per_sample_l2_med": [ 0.000507087679579854, 3.7039282752004965e-10, 3.106248036566228e-10, 3.096240208666501e-10, 3.10577202844442e-10 ], "bp_grad_F": [ 0.247142493724823, 5.3006801863375586e-06, 1.5794508811950436e-08, 1.5706817180216603e-08, 1.0953104201405495e-08 ], "gamma_dfa": -0.00026929086834570626, "gamma_dfa_per_layer": [ -0.0025479549076408148, 0.0016400209860876203, 2.4549921363359317e-05, -0.00019377947319298983 ], "acc_eval": 0.2548828125, "loss_eval": 2.0380632877349854, "epoch": 40 }, { "hidden_norms_cls": [ 45.95172119140625, 29219790.0, 34751968.0, 37645720.0, 39363420.0 ], "hidden_norms_avg": [ 1095.55908203125, 20059094.0, 26161532.0, 30539128.0, 36948852.0 ], "bp_grad_per_sample_l2_med": [ 0.0004415555449668318, 3.578430884942918e-10, 3.05192260352527e-10, 3.046965735276075e-10, 3.0560776131949297e-10 ], "bp_grad_F": [ 0.1088763028383255, 4.900910880678566e-06, 1.1387745857405207e-08, 1.0883239198733463e-08, 1.0722531307294503e-08 ], "gamma_dfa": -0.0006201292017067317, "gamma_dfa_per_layer": [ -0.004000760614871979, 0.0016785510815680027, 3.265401755925268e-05, -0.0001909612910822034 ], "acc_eval": 0.25, "loss_eval": 2.041342258453369, "epoch": 41 }, { "hidden_norms_cls": [ 46.1973876953125, 29375584.0, 34745100.0, 38109944.0, 40454424.0 ], "hidden_norms_avg": [ 1102.340087890625, 21066706.0, 27296236.0, 31874516.0, 38108092.0 ], "bp_grad_per_sample_l2_med": [ 0.00040148120024241507, 3.579030682931972e-10, 3.0047467292071417e-10, 2.979275159908923e-10, 2.9703536852387913e-10 ], "bp_grad_F": [ 0.2525903582572937, 8.925781003199518e-06, 1.1219404072448924e-08, 1.084880185686643e-08, 1.0492501978376367e-08 ], "gamma_dfa": -0.00034770679030771134, "gamma_dfa_per_layer": [ -0.002933461917564273, 0.001698363572359085, 3.748677045223303e-05, -0.0001932155864778906 ], "acc_eval": 0.244140625, "loss_eval": 2.0345935821533203, "epoch": 42 }, { "hidden_norms_cls": [ 46.42340087890625, 27399134.0, 31821602.0, 34474508.0, 38109560.0 ], "hidden_norms_avg": [ 1108.236328125, 21543940.0, 27684760.0, 32082502.0, 38718660.0 ], "bp_grad_per_sample_l2_med": [ 0.000570801377762109, 3.5802838471710174e-10, 2.990230563160168e-10, 2.9852947891484405e-10, 2.9978877713610075e-10 ], "bp_grad_F": [ 0.173945352435112, 2.9223572255432373e-06, 1.2221713419080515e-08, 1.1539666999738074e-08, 1.0805790928714032e-08 ], "gamma_dfa": -5.9806044191645924e-05, "gamma_dfa_per_layer": [ -0.001857165014371276, 0.0017762510105967522, 3.49261645169463e-05, -0.00019323633750900626 ], "acc_eval": 0.2412109375, "loss_eval": 2.043308734893799, "epoch": 43 }, { "hidden_norms_cls": [ 46.619728088378906, 31052948.0, 36542220.0, 39935176.0, 42316204.0 ], "hidden_norms_avg": [ 1113.68896484375, 22679808.0, 29079456.0, 33751472.0, 40006012.0 ], "bp_grad_per_sample_l2_med": [ 0.00046165595995262265, 3.339039600369631e-10, 2.9132621315319795e-10, 2.9080904351275194e-10, 2.9134980539247124e-10 ], "bp_grad_F": [ 0.08871550858020782, 1.195927779917838e-05, 1.2490571243972681e-08, 1.2371740965022582e-08, 1.015614703447909e-08 ], "gamma_dfa": -0.0003672020420708577, "gamma_dfa_per_layer": [ -0.002894133096560836, 0.0016025153454393148, 2.5333010853501037e-05, -0.0002025234280154109 ], "acc_eval": 0.244140625, "loss_eval": 2.029773473739624, "epoch": 44 }, { "hidden_norms_cls": [ 46.796348571777344, 30912490.0, 36281496.0, 39245376.0, 41656108.0 ], "hidden_norms_avg": [ 1118.38134765625, 23560890.0, 29646840.0, 34192144.0, 40581760.0 ], "bp_grad_per_sample_l2_med": [ 0.0005251869442872703, 3.3097524720915317e-10, 2.891357153700369e-10, 2.8932781170887267e-10, 2.8904145743524623e-10 ], "bp_grad_F": [ 0.09888254106044769, 4.3903874029638246e-06, 1.0815308648659538e-08, 1.040402519691952e-08, 1.0228043301196976e-08 ], "gamma_dfa": -0.00037046667421236634, "gamma_dfa_per_layer": [ -0.002757731592282653, 0.0014231146778911352, 3.9225356886163354e-05, -0.00018647513934411108 ], "acc_eval": 0.234375, "loss_eval": 2.0383992195129395, "epoch": 45 }, { "hidden_norms_cls": [ 46.95427322387695, 31720426.0, 37234788.0, 40129424.0, 42928428.0 ], "hidden_norms_avg": [ 1122.57470703125, 22583276.0, 28617936.0, 33269996.0, 40462568.0 ], "bp_grad_per_sample_l2_med": [ 0.0004295881371945143, 3.419305394380956e-10, 2.8222821302215095e-10, 2.8184321543278656e-10, 2.8312005517783234e-10 ], "bp_grad_F": [ 0.5366736650466919, 2.256676998513285e-05, 1.1914533359913548e-08, 1.1219233542192342e-08, 1.004730165732326e-08 ], "gamma_dfa": 0.00015619578334735706, "gamma_dfa_per_layer": [ -0.0010500183561816812, 0.001834970898926258, 3.652184386737645e-05, -0.00019669125322252512 ], "acc_eval": 0.2431640625, "loss_eval": 2.039337396621704, "epoch": 46 }, { "hidden_norms_cls": [ 47.09259796142578, 32824944.0, 38341332.0, 41754692.0, 44005196.0 ], "hidden_norms_avg": [ 1126.26953125, 24313264.0, 30669532.0, 35293632.0, 41785680.0 ], "bp_grad_per_sample_l2_med": [ 0.0005083036958239973, 3.2607763711389737e-10, 2.8033902976787317e-10, 2.7943025671106625e-10, 2.7980692762774595e-10 ], "bp_grad_F": [ 0.06971772015094757, 2.262569068989251e-06, 1.0069017619684928e-08, 9.845756210324907e-09, 9.862499261714675e-09 ], "gamma_dfa": 0.0007457349984179018, "gamma_dfa_per_layer": [ 0.0015201317146420479, 0.0016060702037066221, 3.652479063021019e-05, -0.00017978671530727297 ], "acc_eval": 0.25, "loss_eval": 2.0368857383728027, "epoch": 47 }, { "hidden_norms_cls": [ 47.21082305908203, 33649040.0, 39036836.0, 42500816.0, 44653764.0 ], "hidden_norms_avg": [ 1129.5389404296875, 24447482.0, 30689206.0, 35330028.0, 42064012.0 ], "bp_grad_per_sample_l2_med": [ 0.00046678923536092043, 3.204189136241098e-10, 2.755325689829391e-10, 2.7554050707756517e-10, 2.7654081802275243e-10 ], "bp_grad_F": [ 0.07496139407157898, 2.2861270281282486e-06, 9.997683569906712e-09, 9.715622084627284e-09, 9.736355721656764e-09 ], "gamma_dfa": 0.0006021281524226652, "gamma_dfa_per_layer": [ 0.0007927162805572152, 0.001763419946655631, 3.104796996922232e-05, -0.000178671587491408 ], "acc_eval": 0.259765625, "loss_eval": 2.0324196815490723, "epoch": 48 }, { "hidden_norms_cls": [ 47.315826416015625, 34514608.0, 40222940.0, 43606628.0, 45508540.0 ], "hidden_norms_avg": [ 1132.157958984375, 24487910.0, 30821460.0, 35505456.0, 42327908.0 ], "bp_grad_per_sample_l2_med": [ 0.00041785358916968107, 3.3263317100740153e-10, 2.696754763942266e-10, 2.701733836651954e-10, 2.71275196750409e-10 ], "bp_grad_F": [ 0.08130628615617752, 3.3661247016425477e-06, 1.078094857831502e-08, 9.643851939244996e-09, 9.617946439277603e-09 ], "gamma_dfa": 0.0005021913366363151, "gamma_dfa_per_layer": [ 0.00036606384674087167, 0.0017899572849273682, 2.7483671146910638e-05, -0.00017473945626989007 ], "acc_eval": 0.2626953125, "loss_eval": 2.028841495513916, "epoch": 49 }, { "hidden_norms_cls": [ 47.388946533203125, 35118772.0, 40722008.0, 44347232.0, 46331384.0 ], "hidden_norms_avg": [ 1134.3621826171875, 24821028.0, 31074444.0, 35754528.0, 42627356.0 ], "bp_grad_per_sample_l2_med": [ 0.00043533919961191714, 3.173189211391758e-10, 2.687766953446413e-10, 2.68161992611482e-10, 2.690903055935223e-10 ], "bp_grad_F": [ 0.09458157420158386, 1.9965789306297665e-06, 1.025628915130028e-08, 9.58252854843522e-09, 9.523047239667903e-09 ], "gamma_dfa": 0.00038969498109509004, "gamma_dfa_per_layer": [ -0.00010247333557344973, 0.0018051008228212595, 3.0877545214025304e-05, -0.0001747251080814749 ], "acc_eval": 0.2548828125, "loss_eval": 2.0298049449920654, "epoch": 50 }, { "hidden_norms_cls": [ 47.4621696472168, 34836160.0, 40469796.0, 44120564.0, 46361016.0 ], "hidden_norms_avg": [ 1136.3079833984375, 24152832.0, 30436140.0, 35273740.0, 42621312.0 ], "bp_grad_per_sample_l2_med": [ 0.000491869286634028, 3.2774055691575654e-10, 2.667974174919152e-10, 2.669577336966711e-10, 2.680060617876734e-10 ], "bp_grad_F": [ 0.0854402706027031, 1.6183460047614062e-06, 9.980491100236577e-09, 9.461099459429079e-09, 9.473674289495193e-09 ], "gamma_dfa": 0.0005695745421689935, "gamma_dfa_per_layer": [ 0.0004214277723804116, 0.001994946738705039, 3.653779276646674e-05, -0.00017461413517594337 ], "acc_eval": 0.23828125, "loss_eval": 2.024928092956543, "epoch": 51 }, { "hidden_norms_cls": [ 47.52342224121094, 36446320.0, 42468064.0, 46175108.0, 47947040.0 ], "hidden_norms_avg": [ 1137.8057861328125, 25400616.0, 31703746.0, 36432956.0, 43307828.0 ], "bp_grad_per_sample_l2_med": [ 0.00034005154157057405, 3.121023717245208e-10, 2.6523216956064743e-10, 2.6489818671926457e-10, 2.649658548126155e-10 ], "bp_grad_F": [ 0.10125189274549484, 4.0649438233231194e-06, 9.830144698241838e-09, 9.345456852827283e-09, 9.317212779080819e-09 ], "gamma_dfa": 0.0005080709906906122, "gamma_dfa_per_layer": [ 0.00023581110872328281, 0.0019333910895511508, 3.0449831683654338e-05, -0.00016736806719563901 ], "acc_eval": 0.251953125, "loss_eval": 2.0343496799468994, "epoch": 52 }, { "hidden_norms_cls": [ 47.567466735839844, 35483484.0, 41150516.0, 44742840.0, 47102380.0 ], "hidden_norms_avg": [ 1139.05029296875, 25225282.0, 31585082.0, 36363108.0, 43411416.0 ], "bp_grad_per_sample_l2_med": [ 0.00046872245729900897, 3.1678357159670156e-10, 2.6331647973165673e-10, 2.64141680750285e-10, 2.646937946604311e-10 ], "bp_grad_F": [ 0.08037562668323517, 2.9532295684475685e-06, 9.44631484145475e-09, 9.393840372240447e-09, 9.41009226096412e-09 ], "gamma_dfa": 0.0005205844290685491, "gamma_dfa_per_layer": [ 0.0003642886003945023, 0.0018537556752562523, 3.766161171370186e-05, -0.00017336817109026015 ], "acc_eval": 0.2392578125, "loss_eval": 2.02734375, "epoch": 53 }, { "hidden_norms_cls": [ 47.602928161621094, 35582280.0, 41200288.0, 44686488.0, 47126900.0 ], "hidden_norms_avg": [ 1139.965087890625, 25657812.0, 31984420.0, 36722060.0, 43681628.0 ], "bp_grad_per_sample_l2_med": [ 0.00047245126916095614, 3.1708738412739024e-10, 2.6278745846042284e-10, 2.6274540876336516e-10, 2.6386243190401615e-10 ], "bp_grad_F": [ 0.08141150325536728, 1.0596501851978246e-05, 1.0370135861137442e-08, 1.0129613592368969e-08, 9.407171930320146e-09 ], "gamma_dfa": 0.00048223476824205136, "gamma_dfa_per_layer": [ 0.00032963097328320146, 0.00173661345615983, 3.3767075365176424e-05, -0.00017107243184000254 ], "acc_eval": 0.251953125, "loss_eval": 2.0290825366973877, "epoch": 54 }, { "hidden_norms_cls": [ 47.62870788574219, 36373308.0, 42049216.0, 45803868.0, 47955172.0 ], "hidden_norms_avg": [ 1140.6492919921875, 25698864.0, 31990548.0, 36707920.0, 43700336.0 ], "bp_grad_per_sample_l2_med": [ 0.0004157091898377985, 3.1451533044624114e-10, 2.6160756894100246e-10, 2.62937283057596e-10, 2.633904483406724e-10 ], "bp_grad_F": [ 0.28710466623306274, 2.876764028769685e-06, 9.405439982401731e-09, 9.308096515781017e-09, 9.319982119393444e-09 ], "gamma_dfa": 0.00045457817577698734, "gamma_dfa_per_layer": [ 0.00011597995762713253, 0.0018383568385615945, 3.561873018043116e-05, -0.00017164282326120883 ], "acc_eval": 0.2509765625, "loss_eval": 2.0309882164001465, "epoch": 55 }, { "hidden_norms_cls": [ 47.646034240722656, 35748556.0, 41284136.0, 44861788.0, 47367128.0 ], "hidden_norms_avg": [ 1141.1492919921875, 25812252.0, 32106642.0, 36789100.0, 43809728.0 ], "bp_grad_per_sample_l2_med": [ 0.0004877470782957971, 3.1724206595029614e-10, 2.6251881224403917e-10, 2.627319750647672e-10, 2.634734097561875e-10 ], "bp_grad_F": [ 0.08355043828487396, 2.428784682706464e-06, 9.579466109244095e-09, 9.378172016738517e-09, 9.3862775329967e-09 ], "gamma_dfa": 0.0006408758436009521, "gamma_dfa_per_layer": [ 0.0009491340606473386, 0.0017479720991104841, 4.02485384256579e-05, -0.00017385132377967238 ], "acc_eval": 0.2451171875, "loss_eval": 2.030231475830078, "epoch": 56 }, { "hidden_norms_cls": [ 47.65734100341797, 35952124.0, 41526152.0, 45192104.0, 47596588.0 ], "hidden_norms_avg": [ 1141.4708251953125, 25858530.0, 32145604.0, 36816776.0, 43830904.0 ], "bp_grad_per_sample_l2_med": [ 0.0004684069426730275, 3.1406693912217065e-10, 2.6245111639511265e-10, 2.628100792545496e-10, 2.632017381820617e-10 ], "bp_grad_F": [ 0.16165603697299957, 3.1715710520074936e-06, 1.017021755700398e-08, 9.52006651289139e-09, 9.360165087457517e-09 ], "gamma_dfa": 0.0005993541035422822, "gamma_dfa_per_layer": [ 0.0007396150031127036, 0.0017993964720517397, 3.345730510773137e-05, -0.00017505236610304564 ], "acc_eval": 0.2529296875, "loss_eval": 2.030412197113037, "epoch": 57 }, { "hidden_norms_cls": [ 47.6636962890625, 36249912.0, 41976852.0, 45623612.0, 47785064.0 ], "hidden_norms_avg": [ 1141.6495361328125, 25785932.0, 32065610.0, 36745760.0, 43805624.0 ], "bp_grad_per_sample_l2_med": [ 0.00047133295447565615, 3.155541938859585e-10, 2.617887573386213e-10, 2.615481442536094e-10, 2.6276933406954583e-10 ], "bp_grad_F": [ 0.09146469831466675, 1.8705788988881977e-06, 9.432087999527994e-09, 9.323818161988129e-09, 9.325629157785897e-09 ], "gamma_dfa": 0.0005754136018367717, "gamma_dfa_per_layer": [ 0.0005892712506465614, 0.0018461447907611728, 3.762807318707928e-05, -0.00017138970724772662 ], "acc_eval": 0.251953125, "loss_eval": 2.031130790710449, "epoch": 58 }, { "hidden_norms_cls": [ 47.66678237915039, 36057328.0, 41647260.0, 45391196.0, 47626604.0 ], "hidden_norms_avg": [ 1141.7391357421875, 25717830.0, 31995718.0, 36684084.0, 43781820.0 ], "bp_grad_per_sample_l2_med": [ 0.00047832890413701534, 3.149952798597866e-10, 2.614737593109595e-10, 2.6173804790197153e-10, 2.6257329643897265e-10 ], "bp_grad_F": [ 0.16335515677928925, 1.6483251101817586e-06, 9.493151154060797e-09, 9.393547273361946e-09, 9.338456230523207e-09 ], "gamma_dfa": 0.0005906115802645218, "gamma_dfa_per_layer": [ 0.0007219060207717121, 0.0017734188586473465, 3.73886723536998e-05, -0.00017026723071467131 ], "acc_eval": 0.255859375, "loss_eval": 2.0293946266174316, "epoch": 59 }, { "hidden_norms_cls": [ 47.666595458984375, 36029164.0, 41621316.0, 45328004.0, 47606828.0 ], "hidden_norms_avg": [ 1141.736328125, 25716872.0, 31991962.0, 36680384.0, 43781988.0 ], "bp_grad_per_sample_l2_med": [ 0.0004811616672668606, 3.1537170097628575e-10, 2.6223428983840336e-10, 2.6155200227861997e-10, 2.6258059615535956e-10 ], "bp_grad_F": [ 0.0951727032661438, 1.623439857212361e-06, 9.415242807619961e-09, 9.343901652414388e-09, 9.342033813197759e-09 ], "gamma_dfa": 0.000660182828141842, "gamma_dfa_per_layer": [ 0.0009655870962888002, 0.0018112185643985868, 3.598399052862078e-05, -0.00017205833864863962 ], "acc_eval": 0.255859375, "loss_eval": 2.029409408569336, "epoch": 60 } ] }