diff options
Diffstat (limited to 'results/optionA_random_targets_s42/snapshot_evolution_s42.json')
| -rw-r--r-- | results/optionA_random_targets_s42/snapshot_evolution_s42.json | 2749 |
1 files changed, 2749 insertions, 0 deletions
diff --git a/results/optionA_random_targets_s42/snapshot_evolution_s42.json b/results/optionA_random_targets_s42/snapshot_evolution_s42.json new file mode 100644 index 0000000..9a24e69 --- /dev/null +++ b/results/optionA_random_targets_s42/snapshot_evolution_s42.json @@ -0,0 +1,2749 @@ +{ + "config": { + "output_dir": "results/optionA_random_targets_s42", + "epochs": 100, + "lr": 0.001, + "wd": 0.01, + "seed": 42, + "depth": 4, + "d_hidden": 256, + "log_every": 1, + "no_residual_add": false, + "w2_std": 0.01, + "random_targets": true, + "skip_bp": true + }, + "depth": 4, + "d_hidden": 256, + "num_classes": 10, + "bp_log": null, + "dfa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010068593546748161, + 0.000997236929833889, + 0.0009934091940522194, + 0.0009870644425973296, + 0.0009829498594626784 + ], + "bp_grad_norms_F": [ + 0.03544403985142708, + 0.03507080301642418, + 0.03477022796869278, + 0.03443896397948265, + 0.03407429903745651 + ], + "gamma_dfa": 0.007406219025142491, + "acc_eval": 0.115234375, + "loss_eval": 2.383650302886963, + "epoch": 0 + }, + { + "hidden_norms": [ + 290.9817199707031, + 627.6629028320312, + 1287.7171630859375, + 1459.1513671875, + 1616.4718017578125 + ], + "bp_grad_norms_per_sample_med": [ + 5.262210834189318e-06, + 5.14477824253845e-06, + 5.1224119488324504e-06, + 5.1222677939222194e-06, + 5.123215942148818e-06 + ], + "bp_grad_norms_F": [ + 0.0008317740284837782, + 0.0008041572291404009, + 0.0007967103738337755, + 0.0007942747906781733, + 0.0007939037750475109 + ], + "gamma_dfa": -0.01952565903775394, + "acc_eval": 0.078125, + "loss_eval": 2.3129711151123047, + "epoch": 1 + }, + { + "hidden_norms": [ + 530.2883911132812, + 4770.83984375, + 10422.763671875, + 12636.15234375, + 13907.7587890625 + ], + "bp_grad_norms_per_sample_med": [ + 7.561958454971318e-07, + 5.883355242985999e-07, + 5.877673743270861e-07, + 5.877889748262533e-07, + 5.877806756870996e-07 + ], + "bp_grad_norms_F": [ + 0.00048568230704404414, + 0.0004738113493658602, + 0.0004746047197841108, + 0.00046957648009993136, + 0.00046837228001095355 + ], + "gamma_dfa": -0.02824715618044138, + "acc_eval": 0.0751953125, + "loss_eval": 2.327746868133545, + "epoch": 2 + }, + { + "hidden_norms": [ + 776.7593994140625, + 14701.5390625, + 31384.16015625, + 38395.3359375, + 42461.37890625 + ], + "bp_grad_norms_per_sample_med": [ + 3.0913437853996584e-07, + 1.869875916327146e-07, + 1.8700784210068377e-07, + 1.870558179462023e-07, + 1.870270267545493e-07 + ], + "bp_grad_norms_F": [ + 0.0003413700615055859, + 0.0003374870866537094, + 0.0003392821818124503, + 0.00030567243811674416, + 0.0003016987757291645 + ], + "gamma_dfa": -0.038137396797537804, + "acc_eval": 0.1044921875, + "loss_eval": 2.3107361793518066, + "epoch": 3 + }, + { + "hidden_norms": [ + 968.3828125, + 37952.72265625, + 72785.1328125, + 87599.4140625, + 96238.84375 + ], + "bp_grad_norms_per_sample_med": [ + 2.4106981300064945e-07, + 8.08614899483473e-08, + 8.070540502558288e-08, + 8.066034951070833e-08, + 8.066343326618153e-08 + ], + "bp_grad_norms_F": [ + 0.0002630708331707865, + 0.00023605814203619957, + 0.00023638480342924595, + 0.00023389894340652972, + 0.00021539803128689528 + ], + "gamma_dfa": -0.037757945246994495, + "acc_eval": 0.103515625, + "loss_eval": 2.312647819519043, + "epoch": 4 + }, + { + "hidden_norms": [ + 1094.08642578125, + 78769.9453125, + 140437.5625, + 168767.5625, + 184955.890625 + ], + "bp_grad_norms_per_sample_med": [ + 1.8580334426587797e-07, + 4.146673404648027e-08, + 4.152716215344299e-08, + 4.1506435621840865e-08, + 4.150659904667009e-08 + ], + "bp_grad_norms_F": [ + 0.00017344040679745376, + 0.0001734093384584412, + 0.00017384161765221506, + 0.00017216427659150213, + 0.0001493075687903911 + ], + "gamma_dfa": -0.04355482757091522, + "acc_eval": 0.07421875, + "loss_eval": 2.3431315422058105, + "epoch": 5 + }, + { + "hidden_norms": [ + 1341.3931884765625, + 139090.921875, + 231652.84375, + 281000.15625, + 307253.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.95400020795023e-08, + 2.393203679673661e-08, + 2.393579912052246e-08, + 2.3937987592148602e-08, + 2.3940138760281116e-08 + ], + "bp_grad_norms_F": [ + 8.837149653118104e-05, + 8.386950503336266e-05, + 8.389632421312854e-05, + 8.345059177372605e-05, + 7.231948256958276e-05 + ], + "gamma_dfa": -0.044815219938755035, + "acc_eval": 0.0947265625, + "loss_eval": 2.3063740730285645, + "epoch": 6 + }, + { + "hidden_norms": [ + 1541.082763671875, + 221682.3125, + 361269.78125, + 435912.5, + 477745.59375 + ], + "bp_grad_norms_per_sample_med": [ + 8.871538881294327e-08, + 1.5129883124131993e-08, + 1.5129455022133698e-08, + 1.513093117466724e-08, + 1.5129749897369038e-08 + ], + "bp_grad_norms_F": [ + 6.570185360033065e-05, + 1.65565506904386e-05, + 1.6456760931760073e-05, + 1.2925677765451837e-05, + 1.2370261174510233e-05 + ], + "gamma_dfa": -0.0455410098657012, + "acc_eval": 0.1083984375, + "loss_eval": 2.322909355163574, + "epoch": 7 + }, + { + "hidden_norms": [ + 1785.2386474609375, + 320922.03125, + 530986.4375, + 634164.875, + 698474.0625 + ], + "bp_grad_norms_per_sample_med": [ + 4.730902603000686e-08, + 1.0146245621456274e-08, + 1.0146251838705211e-08, + 1.0143652140470749e-08, + 1.014903983076465e-08 + ], + "bp_grad_norms_F": [ + 1.1641483069979586e-05, + 5.675432475982234e-06, + 5.721857633034233e-06, + 7.849063763387676e-07, + 7.832054507161956e-07 + ], + "gamma_dfa": -0.039457285893149674, + "acc_eval": 0.1279296875, + "loss_eval": 2.3133440017700195, + "epoch": 8 + }, + { + "hidden_norms": [ + 2014.4766845703125, + 439754.375, + 730323.4375, + 876362.4375, + 967547.375 + ], + "bp_grad_norms_per_sample_med": [ + 3.3528117171499616e-08, + 7.06648384252162e-09, + 7.059930862141073e-09, + 7.054891337787694e-09, + 7.054930861727371e-09 + ], + "bp_grad_norms_F": [ + 8.620314474683255e-06, + 5.386140401242301e-06, + 5.411964593804441e-06, + 4.715600994131819e-07, + 4.707477785359515e-07 + ], + "gamma_dfa": -0.018979715649038553, + "acc_eval": 0.0869140625, + "loss_eval": 2.3219242095947266, + "epoch": 9 + }, + { + "hidden_norms": [ + 2227.54052734375, + 609797.1875, + 983513.8125, + 1188663.0, + 1307053.25 + ], + "bp_grad_norms_per_sample_med": [ + 2.0001076350695257e-08, + 5.128104607621253e-09, + 5.1290607316900605e-09, + 5.126524982301817e-09, + 5.12929876350654e-09 + ], + "bp_grad_norms_F": [ + 6.190822659846162e-06, + 3.060452399950009e-06, + 3.074174401263008e-06, + 3.294025248123944e-07, + 3.29135190213492e-07 + ], + "gamma_dfa": -0.01813346426934004, + "acc_eval": 0.1044921875, + "loss_eval": 2.331584930419922, + "epoch": 10 + }, + { + "hidden_norms": [ + 2457.193115234375, + 803897.3125, + 1286980.25, + 1553564.875, + 1716479.25 + ], + "bp_grad_norms_per_sample_med": [ + 1.729943654993349e-08, + 3.841335249887834e-09, + 3.838269257983029e-09, + 3.838585449500442e-09, + 3.837864692712856e-09 + ], + "bp_grad_norms_F": [ + 3.917093636118807e-06, + 2.7961248179053655e-06, + 2.805686108331429e-06, + 2.3621770139925502e-07, + 2.3617232614014938e-07 + ], + "gamma_dfa": -0.02396334079094231, + "acc_eval": 0.111328125, + "loss_eval": 2.3206071853637695, + "epoch": 11 + }, + { + "hidden_norms": [ + 2634.52099609375, + 1040589.8125, + 1656069.25, + 1991088.125, + 2196123.75 + ], + "bp_grad_norms_per_sample_med": [ + 2.1142980699551117e-08, + 2.8919602268473454e-09, + 2.8948958785690593e-09, + 2.8949218577878355e-09, + 2.8939526330873377e-09 + ], + "bp_grad_norms_F": [ + 2.204534575867001e-05, + 2.299454763488029e-06, + 2.206897988799028e-06, + 1.7700770627016027e-07, + 1.7689913534013613e-07 + ], + "gamma_dfa": -0.020109509699977934, + "acc_eval": 0.087890625, + "loss_eval": 2.315797805786133, + "epoch": 12 + }, + { + "hidden_norms": [ + 2877.5615234375, + 1376012.25, + 2111297.75, + 2523565.25, + 2781256.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.216429978967426e-08, + 2.2570649793607345e-09, + 2.2583199754677707e-09, + 2.258467191040836e-09, + 2.2585668890684474e-09 + ], + "bp_grad_norms_F": [ + 3.714726335601881e-05, + 2.6385948785900837e-06, + 2.600723519208259e-06, + 1.345374585071113e-07, + 1.344694169347349e-07 + ], + "gamma_dfa": -0.013240656815469265, + "acc_eval": 0.0703125, + "loss_eval": 2.3100953102111816, + "epoch": 13 + }, + { + "hidden_norms": [ + 3088.69287109375, + 1698364.75, + 2601432.25, + 3103900.5, + 3421196.25 + ], + "bp_grad_norms_per_sample_med": [ + 1.9957044017360204e-08, + 1.783974634683716e-09, + 1.783756697903982e-09, + 1.7829976384220458e-09, + 1.7823481579526401e-09 + ], + "bp_grad_norms_F": [ + 3.862057383230422e-06, + 2.0336331090220483e-06, + 2.036696969298646e-06, + 1.0464794542031086e-07, + 1.0456345478360163e-07 + ], + "gamma_dfa": -0.005813862895593047, + "acc_eval": 0.1005859375, + "loss_eval": 2.3175578117370605, + "epoch": 14 + }, + { + "hidden_norms": [ + 3303.89599609375, + 2057797.625, + 3208369.75, + 3840521.25, + 4226141.5 + ], + "bp_grad_norms_per_sample_med": [ + 1.0653308457619914e-08, + 1.3972134560447103e-09, + 1.3960789191358458e-09, + 1.3953704858238325e-09, + 1.395240034618439e-09 + ], + "bp_grad_norms_F": [ + 3.350825500092469e-05, + 1.8437043536323472e-06, + 1.7324912278127158e-06, + 8.088576919362822e-08, + 8.08555569165037e-08 + ], + "gamma_dfa": -0.009977308567613363, + "acc_eval": 0.0888671875, + "loss_eval": 2.313873052597046, + "epoch": 15 + }, + { + "hidden_norms": [ + 3511.251708984375, + 2498907.0, + 3838076.75, + 4584989.5, + 5056157.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2424533402111138e-08, + 1.1319180037716592e-09, + 1.1314524872574339e-09, + 1.1313682213298648e-09, + 1.1311728220775308e-09 + ], + "bp_grad_norms_F": [ + 3.6209145036991686e-05, + 1.2319624147494324e-06, + 1.1622746569628362e-06, + 6.361955939837571e-08, + 6.359429960411944e-08 + ], + "gamma_dfa": -0.003661318449303508, + "acc_eval": 0.0888671875, + "loss_eval": 2.3163557052612305, + "epoch": 16 + }, + { + "hidden_norms": [ + 3775.89697265625, + 2830713.5, + 4406309.0, + 5287962.5, + 5866003.5 + ], + "bp_grad_norms_per_sample_med": [ + 9.175260551330666e-09, + 9.454962368593556e-10, + 9.453093863243112e-10, + 9.453505755985248e-10, + 9.453685612115237e-10 + ], + "bp_grad_norms_F": [ + 7.906389510026202e-05, + 1.4282334177551093e-06, + 1.2143628964622621e-06, + 4.9730939366554594e-08, + 4.970008760096789e-08 + ], + "gamma_dfa": -0.00987274688668549, + "acc_eval": 0.0986328125, + "loss_eval": 2.310572624206543, + "epoch": 17 + }, + { + "hidden_norms": [ + 3992.62939453125, + 3305205.5, + 5135523.0, + 6172568.0, + 6858123.5 + ], + "bp_grad_norms_per_sample_med": [ + 7.447438221674929e-09, + 7.795076806260681e-10, + 7.787387401592127e-10, + 7.785659339454298e-10, + 7.786636335715968e-10 + ], + "bp_grad_norms_F": [ + 6.625035166507587e-05, + 1.4839708910585614e-06, + 5.721043407902471e-07, + 3.443057750018852e-08, + 3.4421322681055244e-08 + ], + "gamma_dfa": -0.006256722612306476, + "acc_eval": 0.099609375, + "loss_eval": 2.3168537616729736, + "epoch": 18 + }, + { + "hidden_norms": [ + 4142.52978515625, + 3917073.0, + 6029541.5, + 7244691.5, + 8040561.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.708185980499934e-09, + 6.548476760848132e-10, + 6.543839359274273e-10, + 6.541163166673414e-10, + 6.541419628192102e-10 + ], + "bp_grad_norms_F": [ + 8.116958838400024e-07, + 2.7829198501194696e-08, + 2.171442403664514e-08, + 2.171425173003172e-08, + 2.1709443132067463e-08 + ], + "gamma_dfa": -0.008716321433894336, + "acc_eval": 0.1103515625, + "loss_eval": 2.307344675064087, + "epoch": 19 + }, + { + "hidden_norms": [ + 4319.63134765625, + 4541538.0, + 7015912.0, + 8395939.0, + 9318214.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.706714212294628e-09, + 5.475734865534321e-10, + 5.474371511660081e-10, + 5.474699027452345e-10, + 5.470845443333872e-10 + ], + "bp_grad_norms_F": [ + 9.98826635623118e-07, + 1.9267284656621086e-08, + 1.8231443021932137e-08, + 1.8230153386866732e-08, + 1.822698791897892e-08 + ], + "gamma_dfa": -0.009770376258529723, + "acc_eval": 0.1044921875, + "loss_eval": 2.3123068809509277, + "epoch": 20 + }, + { + "hidden_norms": [ + 4493.5576171875, + 5295852.0, + 8144737.5, + 9706496.0, + 10771585.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.5074546883274706e-09, + 4.5678333338017296e-10, + 4.567042022340928e-10, + 4.5673645421295817e-10, + 4.5639386714313446e-10 + ], + "bp_grad_norms_F": [ + 7.984108947312052e-07, + 1.5798146790757528e-08, + 1.5310378742583453e-08, + 1.531174653734979e-08, + 1.5307973555422905e-08 + ], + "gamma_dfa": 0.001372043276205659, + "acc_eval": 0.08984375, + "loss_eval": 2.304574728012085, + "epoch": 21 + }, + { + "hidden_norms": [ + 4713.58544921875, + 6076811.0, + 9296267.0, + 11104688.0, + 12313681.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7650869089134176e-09, + 3.880850918402956e-10, + 3.8772021704325255e-10, + 3.877534959784157e-10, + 3.877534959784157e-10 + ], + "bp_grad_norms_F": [ + 8.055810098994698e-07, + 1.3297294820802108e-08, + 1.2999676002323213e-08, + 1.2997061205055616e-08, + 1.2994151532552678e-08 + ], + "gamma_dfa": -0.001540843746624887, + "acc_eval": 0.0927734375, + "loss_eval": 2.3001956939697266, + "epoch": 22 + }, + { + "hidden_norms": [ + 4932.0283203125, + 6808919.0, + 10515250.0, + 12614906.0, + 13952134.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.722823604945802e-09, + 3.3205604932362576e-10, + 3.3200522886467354e-10, + 3.319224339826121e-10, + 3.319316765892921e-10 + ], + "bp_grad_norms_F": [ + 8.157737738656579e-07, + 1.1298772584211747e-08, + 1.1099826835447857e-08, + 1.1101125352297458e-08, + 1.1098639340900718e-08 + ], + "gamma_dfa": -0.0038606239249929786, + "acc_eval": 0.1005859375, + "loss_eval": 2.3065578937530518, + "epoch": 23 + }, + { + "hidden_norms": [ + 5160.6142578125, + 7539331.0, + 11751434.0, + 14133378.0, + 15619303.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.541834742686433e-09, + 2.862569903339107e-10, + 2.861809678122995e-10, + 2.8618746261699357e-10, + 2.8600946611057054e-10 + ], + "bp_grad_norms_F": [ + 5.115749672768288e-07, + 9.68886215702014e-09, + 9.564988801002983e-09, + 9.563906999687788e-09, + 9.562156400022559e-09 + ], + "gamma_dfa": -0.005291882203891873, + "acc_eval": 0.0888671875, + "loss_eval": 2.306269645690918, + "epoch": 24 + }, + { + "hidden_norms": [ + 5342.28369140625, + 8587680.0, + 13221096.0, + 15854032.0, + 17531438.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.404613562769555e-09, + 2.500546436579043e-10, + 2.498238005355091e-10, + 2.5007032555812714e-10, + 2.5000959635868014e-10 + ], + "bp_grad_norms_F": [ + 8.579532959629432e-07, + 8.395090844715014e-09, + 8.30485546998716e-09, + 8.305622856141781e-09, + 8.304008147774766e-09 + ], + "gamma_dfa": -0.0010773324174806476, + "acc_eval": 0.0810546875, + "loss_eval": 2.3139305114746094, + "epoch": 25 + }, + { + "hidden_norms": [ + 5483.166015625, + 9723498.0, + 14831751.0, + 17743800.0, + 19587500.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.163097422349438e-09, + 2.162879736422596e-10, + 2.1617001244589318e-10, + 2.1610728484500186e-10, + 2.1611390454978618e-10 + ], + "bp_grad_norms_F": [ + 8.197772558560246e-07, + 7.273167845767148e-09, + 7.203821983381431e-09, + 7.205678720367814e-09, + 7.204227880919234e-09 + ], + "gamma_dfa": 1.8637801986187696e-05, + "acc_eval": 0.0751953125, + "loss_eval": 2.313469648361206, + "epoch": 26 + }, + { + "hidden_norms": [ + 5764.373046875, + 10784341.0, + 16432148.0, + 19679324.0, + 21736526.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.4971423534813084e-09, + 1.883019018489307e-10, + 1.8820056624235804e-10, + 1.881857447649793e-10, + 1.8821781633260315e-10 + ], + "bp_grad_norms_F": [ + 7.796735417286982e-07, + 6.3456924159766e-09, + 6.269113672630056e-09, + 6.2696292602026915e-09, + 6.268407570786394e-09 + ], + "gamma_dfa": -0.009387154830619693, + "acc_eval": 0.1240234375, + "loss_eval": 2.306946277618408, + "epoch": 27 + }, + { + "hidden_norms": [ + 5953.8154296875, + 12087036.0, + 18197724.0, + 21766380.0, + 23964956.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.9581326277394737e-09, + 1.6603075858601102e-10, + 1.6546233827519075e-10, + 1.654698739139704e-10, + 1.654279768725786e-10 + ], + "bp_grad_norms_F": [ + 7.887553010732518e-07, + 5.60325252862981e-09, + 5.523563828546685e-09, + 5.524424029346164e-09, + 5.523790314043708e-09 + ], + "gamma_dfa": 0.004911014751996845, + "acc_eval": 0.099609375, + "loss_eval": 2.3079466819763184, + "epoch": 28 + }, + { + "hidden_norms": [ + 6103.1767578125, + 13586370.0, + 20138950.0, + 24031604.0, + 26432166.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.675929033912894e-09, + 1.4642610735027262e-10, + 1.4630179012709021e-10, + 1.4625449462624118e-10, + 1.4625445299287776e-10 + ], + "bp_grad_norms_F": [ + 5.090974468657805e-07, + 4.923043306348518e-09, + 4.85900208957446e-09, + 4.858577984379053e-09, + 4.8580677258769356e-09 + ], + "gamma_dfa": -0.001665741903707385, + "acc_eval": 0.119140625, + "loss_eval": 2.3058736324310303, + "epoch": 29 + }, + { + "hidden_norms": [ + 6289.6884765625, + 14985982.0, + 22021216.0, + 26264438.0, + 28881832.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.36727260016778e-09, + 1.3193185433024723e-10, + 1.3139930810091016e-10, + 1.313865682917026e-10, + 1.313865821694904e-10 + ], + "bp_grad_norms_F": [ + 5.067869324193452e-07, + 4.352318949685241e-09, + 4.3002512661871606e-09, + 4.300079403662949e-09, + 4.299330669255141e-09 + ], + "gamma_dfa": -0.0004749984946101904, + "acc_eval": 0.134765625, + "loss_eval": 2.2982680797576904, + "epoch": 30 + }, + { + "hidden_norms": [ + 6523.13232421875, + 16536787.0, + 24215278.0, + 28796266.0, + 31602218.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.811848170443e-09, + 1.1650350129066567e-10, + 1.168874996793079e-10, + 1.1678497058298376e-10, + 1.1676350164524507e-10 + ], + "bp_grad_norms_F": [ + 1.0699311587814009e-06, + 3.859509600800948e-09, + 3.8213117115049045e-09, + 3.820499028250879e-09, + 3.8199492458090845e-09 + ], + "gamma_dfa": -0.0009061050368472934, + "acc_eval": 0.1181640625, + "loss_eval": 2.3070034980773926, + "epoch": 31 + }, + { + "hidden_norms": [ + 6718.77001953125, + 18189110.0, + 26350528.0, + 31306452.0, + 34333380.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.6170128286651106e-09, + 1.026562307382406e-10, + 1.0235094716204429e-10, + 1.0229352781498946e-10, + 1.0229320168697598e-10 + ], + "bp_grad_norms_F": [ + 7.658765639462217e-07, + 3.4193439191199104e-09, + 3.3851728087341826e-09, + 3.3853084779877918e-09, + 3.3853269076900006e-09 + ], + "gamma_dfa": -0.003424330148845911, + "acc_eval": 0.1025390625, + "loss_eval": 2.307239532470703, + "epoch": 32 + }, + { + "hidden_norms": [ + 6883.12548828125, + 19488106.0, + 28346706.0, + 33685484.0, + 36926260.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.087009980973221e-09, + 9.127182343249274e-11, + 9.115138505100262e-11, + 9.112680748879498e-11, + 9.108464676943484e-11 + ], + "bp_grad_norms_F": [ + 6.505949841084657e-07, + 3.0607936185589324e-09, + 3.031910944528704e-09, + 3.0311655407899707e-09, + 3.030735440390231e-09 + ], + "gamma_dfa": 0.0007484849775210023, + "acc_eval": 0.126953125, + "loss_eval": 2.299861431121826, + "epoch": 33 + }, + { + "hidden_norms": [ + 7075.13671875, + 20968554.0, + 30458362.0, + 36184532.0, + 39704584.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7312005990154375e-09, + 8.229845277485381e-11, + 8.220574915229761e-11, + 8.216692604090525e-11, + 8.216703706320772e-11 + ], + "bp_grad_norms_F": [ + 5.460973966364691e-07, + 2.7569984073494425e-09, + 2.731066262029458e-09, + 2.7299451588191914e-09, + 2.7297459848085737e-09 + ], + "gamma_dfa": 0.0019178662332706153, + "acc_eval": 0.10546875, + "loss_eval": 2.304497241973877, + "epoch": 34 + }, + { + "hidden_norms": [ + 7259.11181640625, + 23033338.0, + 32925422.0, + 39030248.0, + 42756800.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.3574480973186382e-09, + 7.317867145584245e-11, + 7.298522203269542e-11, + 7.29523316755909e-11, + 7.295326148737402e-11 + ], + "bp_grad_norms_F": [ + 9.340447491013038e-07, + 2.4876549709063056e-09, + 2.468606430383602e-09, + 2.468798498966862e-09, + 2.4683108890144467e-09 + ], + "gamma_dfa": 0.0004995002527721226, + "acc_eval": 0.0927734375, + "loss_eval": 2.316316604614258, + "epoch": 35 + }, + { + "hidden_norms": [ + 7421.775390625, + 24686730.0, + 35197740.0, + 41724168.0, + 45731128.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6613123099418203e-09, + 6.675621860852132e-11, + 6.666651952702551e-11, + 6.660563073301873e-11, + 6.660502011035518e-11 + ], + "bp_grad_norms_F": [ + 5.461850491883524e-07, + 2.235697182939589e-09, + 2.218524031150082e-09, + 2.2181974035362373e-09, + 2.217934280679401e-09 + ], + "gamma_dfa": -0.0007714751118328422, + "acc_eval": 0.115234375, + "loss_eval": 2.299975872039795, + "epoch": 36 + }, + { + "hidden_norms": [ + 7595.57861328125, + 26510854.0, + 37595356.0, + 44555964.0, + 48780100.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.225840178837757e-09, + 6.114001666057689e-11, + 6.093330007228559e-11, + 6.092592402806574e-11, + 6.092682608427324e-11 + ], + "bp_grad_norms_F": [ + 5.346724947230541e-07, + 2.03656935759966e-09, + 2.023372358550546e-09, + 2.0227952646223457e-09, + 2.022433331916318e-09 + ], + "gamma_dfa": -0.002239674242446199, + "acc_eval": 0.125, + "loss_eval": 2.301793336868286, + "epoch": 37 + }, + { + "hidden_norms": [ + 7750.2373046875, + 28535444.0, + 40272040.0, + 47577320.0, + 52073104.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8177556126985905e-09, + 5.451538873102457e-11, + 5.443305875485471e-11, + 5.4429814821954636e-11, + 5.4436097990384624e-11 + ], + "bp_grad_norms_F": [ + 4.054070359416073e-07, + 1.8392830591906772e-09, + 1.8223703657227475e-09, + 1.8226138376320478e-09, + 1.8224435294200703e-09 + ], + "gamma_dfa": -7.494278543163091e-05, + "acc_eval": 0.0859375, + "loss_eval": 2.3060522079467773, + "epoch": 38 + }, + { + "hidden_norms": [ + 7842.494140625, + 30102162.0, + 42567964.0, + 50335104.0, + 55107076.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.4601239106681874e-09, + 4.961669269887281e-11, + 4.958486399253559e-11, + 4.9537509511088373e-11, + 4.9538078500388494e-11 + ], + "bp_grad_norms_F": [ + 3.688643346322351e-07, + 1.6754320153467006e-09, + 1.6663495028268471e-09, + 1.6659863488754922e-09, + 1.6657608625791909e-09 + ], + "gamma_dfa": -0.0012932312965858728, + "acc_eval": 0.123046875, + "loss_eval": 2.305074691772461, + "epoch": 39 + }, + { + "hidden_norms": [ + 7978.84033203125, + 31648130.0, + 44751680.0, + 52999412.0, + 58060848.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.122314324282115e-09, + 4.579963838735601e-11, + 4.578180889946992e-11, + 4.577443632469702e-11, + 4.57794635533304e-11 + ], + "bp_grad_norms_F": [ + 5.346829539121245e-07, + 1.5462353619710711e-09, + 1.5314658430298778e-09, + 1.5317623835997551e-09, + 1.531660798193002e-09 + ], + "gamma_dfa": -0.0015878456179052591, + "acc_eval": 0.078125, + "loss_eval": 2.311302661895752, + "epoch": 40 + }, + { + "hidden_norms": [ + 8110.69677734375, + 33538538.0, + 47405844.0, + 56144432.0, + 61445208.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.846236801801183e-09, + 4.287940835734361e-11, + 4.277651843853647e-11, + 4.270922504545638e-11, + 4.270716419396692e-11 + ], + "bp_grad_norms_F": [ + 6.336174465104705e-07, + 1.4277677928831167e-09, + 1.411427863473591e-09, + 1.4113960000727843e-09, + 1.4115042468176853e-09 + ], + "gamma_dfa": 0.0003075850836466998, + "acc_eval": 0.06640625, + "loss_eval": 2.3155269622802734, + "epoch": 41 + }, + { + "hidden_norms": [ + 8218.2890625, + 35439168.0, + 50034100.0, + 59178108.0, + 64727180.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5490064786405355e-09, + 3.9022073766714627e-11, + 3.8900438426026085e-11, + 3.885531826841593e-11, + 3.885488111809998e-11 + ], + "bp_grad_norms_F": [ + 4.209731514492887e-07, + 1.29418675776094e-09, + 1.2822323203209862e-09, + 1.282524864087975e-09, + 1.282538297786573e-09 + ], + "gamma_dfa": 0.004402266175020486, + "acc_eval": 0.0888671875, + "loss_eval": 2.3072235584259033, + "epoch": 42 + }, + { + "hidden_norms": [ + 8356.0576171875, + 37748524.0, + 52921432.0, + 62358388.0, + 68150840.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.2101902530380357e-09, + 3.5293011568793276e-11, + 3.5220604210906004e-11, + 3.520495353570574e-11, + 3.5206077636518174e-11 + ], + "bp_grad_norms_F": [ + 4.58017922255749e-07, + 1.1915447517552025e-09, + 1.1833590773946412e-09, + 1.1830882939989351e-09, + 1.183062092735554e-09 + ], + "gamma_dfa": -0.0026363012730143964, + "acc_eval": 0.1064453125, + "loss_eval": 2.301530361175537, + "epoch": 43 + }, + { + "hidden_norms": [ + 8468.8984375, + 39503084.0, + 55376920.0, + 65278316.0, + 71385032.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8453949479635412e-09, + 3.246405921863982e-11, + 3.238384560511065e-11, + 3.2375737507583935e-11, + 3.2377513864423335e-11 + ], + "bp_grad_norms_F": [ + 4.802472517440037e-07, + 1.1004476219156345e-09, + 1.0926821669698938e-09, + 1.092572032845851e-09, + 1.0924769977549431e-09 + ], + "gamma_dfa": 0.0010803540208144113, + "acc_eval": 0.1396484375, + "loss_eval": 2.3026890754699707, + "epoch": 44 + }, + { + "hidden_norms": [ + 8563.8193359375, + 41138400.0, + 57739148.0, + 68164040.0, + 74560624.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7058150447724074e-09, + 3.018212416106003e-11, + 3.0175469761806184e-11, + 3.0169026998816406e-11, + 3.017583058428919e-11 + ], + "bp_grad_norms_F": [ + 4.471017973628477e-07, + 1.0233066616294195e-09, + 1.0133889283281405e-09, + 1.0129664884672707e-09, + 1.0129456162744077e-09 + ], + "gamma_dfa": 0.001452172189601697, + "acc_eval": 0.119140625, + "loss_eval": 2.3021607398986816, + "epoch": 45 + }, + { + "hidden_norms": [ + 8657.7607421875, + 43261356.0, + 60519764.0, + 71481504.0, + 78138984.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.013100575126714e-09, + 2.8044349828504345e-11, + 2.8007120927986406e-11, + 2.800258289137325e-11, + 2.7994129583874816e-11 + ], + "bp_grad_norms_F": [ + 4.194439213733858e-07, + 9.434407699515646e-10, + 9.384462096306834e-10, + 9.380274335057948e-10, + 9.378612331190084e-10 + ], + "gamma_dfa": 0.0007094524626154453, + "acc_eval": 0.1376953125, + "loss_eval": 2.2962775230407715, + "epoch": 46 + }, + { + "hidden_norms": [ + 8790.2177734375, + 45091320.0, + 63046644.0, + 74457320.0, + 81331192.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.4347481808462135e-09, + 2.630745274401214e-11, + 2.622063850765688e-11, + 2.6189189705760896e-11, + 2.618921746133651e-11 + ], + "bp_grad_norms_F": [ + 7.371211836471048e-07, + 8.928198735880244e-10, + 8.842627741145748e-10, + 8.843225596244508e-10, + 8.844897037008081e-10 + ], + "gamma_dfa": 0.0035163145803380758, + "acc_eval": 0.0869140625, + "loss_eval": 2.308018207550049, + "epoch": 47 + }, + { + "hidden_norms": [ + 8908.1201171875, + 47254860.0, + 65723668.0, + 77611024.0, + 84728680.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.7307127670184173e-09, + 2.504270402159392e-11, + 2.5052317859097784e-11, + 2.5023790331535345e-11, + 2.5014615379070904e-11 + ], + "bp_grad_norms_F": [ + 6.292835905696847e-07, + 8.318437605403517e-10, + 8.267081463841919e-10, + 8.263784656570294e-10, + 8.262315831508715e-10 + ], + "gamma_dfa": 0.0013402553158812225, + "acc_eval": 0.0751953125, + "loss_eval": 2.3012595176696777, + "epoch": 48 + }, + { + "hidden_norms": [ + 9040.81640625, + 49197456.0, + 68364032.0, + 80749512.0, + 88194248.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2460811271708394e-09, + 2.3192125303550526e-11, + 2.3115362055015076e-11, + 2.3076223223950088e-11, + 2.3076362001828166e-11 + ], + "bp_grad_norms_F": [ + 4.4760727746506745e-07, + 7.767143594961112e-10, + 7.696474568774647e-10, + 7.699579307463011e-10, + 7.697840698206448e-10 + ], + "gamma_dfa": 0.0011345145248924382, + "acc_eval": 0.109375, + "loss_eval": 2.3025381565093994, + "epoch": 49 + }, + { + "hidden_norms": [ + 9096.951171875, + 51418580.0, + 71253736.0, + 84008288.0, + 91700160.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.652081027536667e-09, + 2.1794503701766388e-11, + 2.1752362064364483e-11, + 2.1721518680961616e-11, + 2.1714638767655892e-11 + ], + "bp_grad_norms_F": [ + 4.2562598423501186e-07, + 7.30644378332812e-10, + 7.245531952193573e-10, + 7.24433568688454e-10, + 7.243706190429577e-10 + ], + "gamma_dfa": -0.0012115467980038375, + "acc_eval": 0.0986328125, + "loss_eval": 2.3028664588928223, + "epoch": 50 + }, + { + "hidden_norms": [ + 9195.421875, + 53477960.0, + 73949888.0, + 87218208.0, + 95104784.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.0763821773073232e-09, + 2.0283105056639883e-11, + 2.0292134292332342e-11, + 2.0280107454473395e-11, + 2.0280043269704784e-11 + ], + "bp_grad_norms_F": [ + 4.4348283267936495e-07, + 6.856579193303958e-10, + 6.817193476393868e-10, + 6.813303254915581e-10, + 6.81267153801457e-10 + ], + "gamma_dfa": 0.00014059534441912547, + "acc_eval": 0.12109375, + "loss_eval": 2.300283432006836, + "epoch": 51 + }, + { + "hidden_norms": [ + 9354.1484375, + 54696328.0, + 76135840.0, + 89854944.0, + 98086680.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.338345073127357e-09, + 1.9446970075942538e-11, + 1.951434153157905e-11, + 1.9502762252376904e-11, + 1.950522555971279e-11 + ], + "bp_grad_norms_F": [ + 7.923298426248948e-07, + 6.581531986071809e-10, + 6.558240617238198e-10, + 6.55002219129841e-10, + 6.549716324855126e-10 + ], + "gamma_dfa": 0.0009868293709587306, + "acc_eval": 0.08203125, + "loss_eval": 2.308971405029297, + "epoch": 52 + }, + { + "hidden_norms": [ + 9396.91796875, + 56824088.0, + 78830128.0, + 92998112.0, + 101473056.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5743603087869928e-09, + 1.830174033157217e-11, + 1.83033917883213e-11, + 1.828929195590856e-11, + 1.8287725500609753e-11 + ], + "bp_grad_norms_F": [ + 5.051292646385264e-07, + 6.139382335845767e-10, + 6.081654624345845e-10, + 6.082383485761511e-10, + 6.080949632725208e-10 + ], + "gamma_dfa": -0.0033112295641331, + "acc_eval": 0.0869140625, + "loss_eval": 2.3057596683502197, + "epoch": 53 + }, + { + "hidden_norms": [ + 9468.728515625, + 58575712.0, + 81144072.0, + 95889464.0, + 104606984.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.8610024632437216e-09, + 1.757114766187673e-11, + 1.7507960359264274e-11, + 1.7509681204952443e-11, + 1.751184267040351e-11 + ], + "bp_grad_norms_F": [ + 4.554808015200251e-07, + 5.796045865480437e-10, + 5.748747033962331e-10, + 5.745580122784588e-10, + 5.745347531060929e-10 + ], + "gamma_dfa": -0.0003432991070440039, + "acc_eval": 0.08984375, + "loss_eval": 2.298818588256836, + "epoch": 54 + }, + { + "hidden_norms": [ + 9555.708984375, + 60407900.0, + 83458520.0, + 98574208.0, + 107551688.0 + ], + "bp_grad_norms_per_sample_med": [ + 2.279448629849412e-09, + 1.684081346597921e-11, + 1.677817607070864e-11, + 1.677138462830019e-11, + 1.677173851188929e-11 + ], + "bp_grad_norms_F": [ + 4.388069214655843e-07, + 5.62806412585104e-10, + 5.561613392046638e-10, + 5.564256833068271e-10, + 5.564126381862877e-10 + ], + "gamma_dfa": -0.0005112638318678364, + "acc_eval": 0.0869140625, + "loss_eval": 2.3081560134887695, + "epoch": 55 + }, + { + "hidden_norms": [ + 9638.900390625, + 62801376.0, + 86421992.0, + 101967032.0, + 111112024.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.658361892253879e-09, + 1.6043997727588355e-11, + 1.598270821245862e-11, + 1.5972815084475123e-11, + 1.5974208067426332e-11 + ], + "bp_grad_norms_F": [ + 3.7533030194936146e-07, + 5.26626853236678e-10, + 5.223827481692922e-10, + 5.223168009216295e-10, + 5.222874355226281e-10 + ], + "gamma_dfa": 0.0029356127051869407, + "acc_eval": 0.1162109375, + "loss_eval": 2.2985568046569824, + "epoch": 56 + }, + { + "hidden_norms": [ + 9718.0244140625, + 64624960.0, + 89000072.0, + 104851280.0, + 114205744.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.292640661176847e-09, + 1.499218110767586e-11, + 1.4987202451299808e-11, + 1.4976865234106462e-11, + 1.497728503718765e-11 + ], + "bp_grad_norms_F": [ + 2.8470327606555657e-07, + 5.047448570216773e-10, + 4.990237667534814e-10, + 4.992751767574077e-10, + 4.992522506519492e-10 + ], + "gamma_dfa": -5.288697866490111e-05, + "acc_eval": 0.083984375, + "loss_eval": 2.308565139770508, + "epoch": 57 + }, + { + "hidden_norms": [ + 9801.466796875, + 66401824.0, + 91302272.0, + 107465608.0, + 117121048.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.6839835081938759e-09, + 1.4242066727343516e-11, + 1.4184016808305167e-11, + 1.417683158366767e-11, + 1.41777934878351e-11 + ], + "bp_grad_norms_F": [ + 4.110351881081442e-07, + 4.848813572877475e-10, + 4.80424644511146e-10, + 4.804525666202153e-10, + 4.804344699849139e-10 + ], + "gamma_dfa": 0.005033881159761222, + "acc_eval": 0.0810546875, + "loss_eval": 2.3111414909362793, + "epoch": 58 + }, + { + "hidden_norms": [ + 9890.490234375, + 68205280.0, + 93614360.0, + 110285296.0, + 120199864.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.280599737363275e-09, + 1.3558537972913065e-11, + 1.3508410535989501e-11, + 1.350657866799887e-11, + 1.3504152657217716e-11 + ], + "bp_grad_norms_F": [ + 2.917624613019143e-07, + 4.580297252587684e-10, + 4.5511858171032316e-10, + 4.5487102973140736e-10, + 4.548312837471258e-10 + ], + "gamma_dfa": -0.0010600784517009743, + "acc_eval": 0.1337890625, + "loss_eval": 2.3005125522613525, + "epoch": 59 + }, + { + "hidden_norms": [ + 9970.1796875, + 70070560.0, + 95841760.0, + 112873624.0, + 122957488.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5372191297657878e-09, + 1.2977110705469919e-11, + 1.3014193021854137e-11, + 1.301157879357584e-11, + 1.301332045594572e-11 + ], + "bp_grad_norms_F": [ + 3.609145835525851e-07, + 4.4097417384314497e-10, + 4.391887409305184e-10, + 4.386717655791017e-10, + 4.3868858545792477e-10 + ], + "gamma_dfa": -0.0019604496665124316, + "acc_eval": 0.150390625, + "loss_eval": 2.2972958087921143, + "epoch": 60 + }, + { + "hidden_norms": [ + 10013.4111328125, + 71841280.0, + 98034728.0, + 115420424.0, + 125712432.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.980667851952944e-09, + 1.2545815081255185e-11, + 1.2525404324836842e-11, + 1.2530108027541953e-11, + 1.2529619702883465e-11 + ], + "bp_grad_norms_F": [ + 4.7472269670834066e-07, + 4.2379699749517385e-10, + 4.224821603671103e-10, + 4.2210435147183034e-10, + 4.2200473671094585e-10 + ], + "gamma_dfa": 0.001835448889323743, + "acc_eval": 0.1123046875, + "loss_eval": 2.301358222961426, + "epoch": 61 + }, + { + "hidden_norms": [ + 10096.0283203125, + 73830392.0, + 100452376.0, + 118091624.0, + 128521440.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0877483358484596e-09, + 1.2145178092393127e-11, + 1.2089194229014666e-11, + 1.2089107492840867e-11, + 1.2089683421034891e-11 + ], + "bp_grad_norms_F": [ + 3.47462531635756e-07, + 4.1091860469855135e-10, + 4.074744708315592e-10, + 4.072828740930845e-10, + 4.072460701998182e-10 + ], + "gamma_dfa": 0.001284073296119459, + "acc_eval": 0.0986328125, + "loss_eval": 2.306840419769287, + "epoch": 62 + }, + { + "hidden_norms": [ + 10180.875, + 75552776.0, + 102509640.0, + 120544920.0, + 131168024.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.552231787549374e-09, + 1.1890774823108963e-11, + 1.1859568882499616e-11, + 1.1871844653177366e-11, + 1.187336080149537e-11 + ], + "bp_grad_norms_F": [ + 3.4558294714770454e-07, + 3.966963146861957e-10, + 3.9473879720475225e-10, + 3.9452693889607815e-10, + 3.9439784771388986e-10 + ], + "gamma_dfa": 0.0016765635373303667, + "acc_eval": 0.115234375, + "loss_eval": 2.298762798309326, + "epoch": 63 + }, + { + "hidden_norms": [ + 10240.1455078125, + 77067560.0, + 104630624.0, + 122945856.0, + 133711672.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.7201819968448717e-09, + 1.1546708901521985e-11, + 1.1524695260611839e-11, + 1.1516852575776948e-11, + 1.1515758832625345e-11 + ], + "bp_grad_norms_F": [ + 4.471509669201623e-07, + 3.9150541142340956e-10, + 3.873180665081577e-10, + 3.8728689699674135e-10, + 3.8727610007782687e-10 + ], + "gamma_dfa": 0.00234126152281533, + "acc_eval": 0.099609375, + "loss_eval": 2.3141303062438965, + "epoch": 64 + }, + { + "hidden_norms": [ + 10319.01171875, + 78272792.0, + 106212480.0, + 124890544.0, + 135898992.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.082502087967896e-09, + 1.1041124611810282e-11, + 1.099913302798905e-11, + 1.099662808728974e-11, + 1.0998860676403321e-11 + ], + "bp_grad_norms_F": [ + 2.724834757827921e-07, + 3.732617270824079e-10, + 3.7087055648754585e-10, + 3.705740991843953e-10, + 3.7055333801383483e-10 + ], + "gamma_dfa": -0.0016588781545578968, + "acc_eval": 0.076171875, + "loss_eval": 2.301309585571289, + "epoch": 65 + }, + { + "hidden_norms": [ + 10393.1220703125, + 79820272.0, + 108085488.0, + 127064000.0, + 138196272.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.1938173782866102e-09, + 1.0600672249727605e-11, + 1.0572632179461916e-11, + 1.0572812590703418e-11, + 1.0572290438937149e-11 + ], + "bp_grad_norms_F": [ + 2.4229757400462404e-07, + 3.608289500522943e-10, + 3.590567010380852e-10, + 3.5867539494027767e-10, + 3.5869879289052164e-10 + ], + "gamma_dfa": -0.0006768384373572189, + "acc_eval": 0.1162109375, + "loss_eval": 2.300891876220703, + "epoch": 66 + }, + { + "hidden_norms": [ + 10441.87109375, + 81050488.0, + 109770584.0, + 129123352.0, + 140471120.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.23911914062802e-09, + 1.040783778605281e-11, + 1.0406573172638822e-11, + 1.0404551352427571e-11, + 1.0400711542013497e-11 + ], + "bp_grad_norms_F": [ + 3.1678638379162294e-07, + 3.529202208252258e-10, + 3.508623114267806e-10, + 3.5074002036061813e-10, + 3.507301671312746e-10 + ], + "gamma_dfa": 0.002077823784929933, + "acc_eval": 0.078125, + "loss_eval": 2.302239179611206, + "epoch": 67 + }, + { + "hidden_norms": [ + 10470.16796875, + 82310688.0, + 111439184.0, + 131022848.0, + 142428160.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.5865209146426196e-09, + 1.0226258208290151e-11, + 1.02605328747285e-11, + 1.0260522466387645e-11, + 1.0260643897030963e-11 + ], + "bp_grad_norms_F": [ + 3.3883526384670404e-07, + 3.5046832103091674e-10, + 3.5014954824497124e-10, + 3.4966474160569305e-10, + 3.496121170343258e-10 + ], + "gamma_dfa": -0.0026201284417766146, + "acc_eval": 0.107421875, + "loss_eval": 2.298029661178589, + "epoch": 68 + }, + { + "hidden_norms": [ + 10513.3203125, + 83437016.0, + 113127648.0, + 132967152.0, + 144543232.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.473118955938276e-10, + 1.0023389236668567e-11, + 9.974353808173131e-12, + 9.973816911257316e-12, + 9.97038302613662e-12 + ], + "bp_grad_norms_F": [ + 2.5441801199121983e-07, + 3.393485770164517e-10, + 3.373779589033177e-10, + 3.371187218270677e-10, + 3.370881351827393e-10 + ], + "gamma_dfa": 0.0005034620153310243, + "acc_eval": 0.0986328125, + "loss_eval": 2.301563262939453, + "epoch": 69 + }, + { + "hidden_norms": [ + 10551.1669921875, + 84680168.0, + 114672840.0, + 134819488.0, + 146567616.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0249410209439702e-09, + 9.764996970751394e-12, + 9.731633034137932e-12, + 9.726664786102734e-12, + 9.72637768936746e-12 + ], + "bp_grad_norms_F": [ + 2.863991426238499e-07, + 3.3205654892398684e-10, + 3.300854312104917e-10, + 3.3006170019334036e-10, + 3.300271445016989e-10 + ], + "gamma_dfa": -0.00030547842834494077, + "acc_eval": 0.0888671875, + "loss_eval": 2.3098697662353516, + "epoch": 70 + }, + { + "hidden_norms": [ + 10571.28515625, + 85669488.0, + 115961600.0, + 136359216.0, + 148233216.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.3427733369653083e-09, + 9.57579241595008e-12, + 9.569240365381315e-12, + 9.571362799554173e-12, + 9.572694199821985e-12 + ], + "bp_grad_norms_F": [ + 3.248615314532799e-07, + 3.252469404912972e-10, + 3.2484867573678855e-10, + 3.24500371018388e-10, + 3.244539636959587e-10 + ], + "gamma_dfa": -0.0020247000393283088, + "acc_eval": 0.1142578125, + "loss_eval": 2.2976913452148438, + "epoch": 71 + }, + { + "hidden_norms": [ + 10612.2607421875, + 86644544.0, + 117219120.0, + 137880144.0, + 149864576.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.2906055113504067e-09, + 9.509206790048186e-12, + 9.47129093903376e-12, + 9.464854247576149e-12, + 9.465737221825421e-12 + ], + "bp_grad_norms_F": [ + 2.801213554448623e-07, + 3.198223630374031e-10, + 3.183240893100958e-10, + 3.1834490599180754e-10, + 3.1827357416247537e-10 + ], + "gamma_dfa": -0.001203124011226464, + "acc_eval": 0.10546875, + "loss_eval": 2.3055059909820557, + "epoch": 72 + }, + { + "hidden_norms": [ + 10637.9248046875, + 87766232.0, + 118693968.0, + 139534048.0, + 151658064.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.839014827202504e-10, + 9.328608198411192e-12, + 9.353431223990682e-12, + 9.345346545230893e-12, + 9.345603284305337e-12 + ], + "bp_grad_norms_F": [ + 2.646772543357656e-07, + 3.13234327364853e-10, + 3.120789182631256e-10, + 3.1186964122298377e-10, + 3.118231783894032e-10 + ], + "gamma_dfa": -0.0021326720525394194, + "acc_eval": 0.1201171875, + "loss_eval": 2.3003604412078857, + "epoch": 73 + }, + { + "hidden_norms": [ + 10656.4482421875, + 88713800.0, + 119968392.0, + 141039184.0, + 153268816.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.779404980785444e-10, + 9.102603219790506e-12, + 9.076880740088722e-12, + 9.072962867118228e-12, + 9.071843970476223e-12 + ], + "bp_grad_norms_F": [ + 2.0230599773185531e-07, + 3.0828151142969773e-10, + 3.0691377217451077e-10, + 3.067752996077644e-10, + 3.0672925310781807e-10 + ], + "gamma_dfa": 0.00048369063733844087, + "acc_eval": 0.0908203125, + "loss_eval": 2.3012309074401855, + "epoch": 74 + }, + { + "hidden_norms": [ + 10672.1494140625, + 89505176.0, + 120986568.0, + 142222336.0, + 154574096.0 + ], + "bp_grad_norms_per_sample_med": [ + 9.261312272634825e-10, + 9.015565204106846e-12, + 8.995597669536615e-12, + 8.994238513693187e-12, + 8.993757127928603e-12 + ], + "bp_grad_norms_F": [ + 2.1154608020879095e-07, + 3.072229692868689e-10, + 3.052531283298521e-10, + 3.0519622939984004e-10, + 3.051366936901445e-10 + ], + "gamma_dfa": -0.0005316346723702736, + "acc_eval": 0.11328125, + "loss_eval": 2.3040223121643066, + "epoch": 75 + }, + { + "hidden_norms": [ + 10723.896484375, + 90374152.0, + 122032824.0, + 143367616.0, + 155819504.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.261785617274086e-10, + 8.993932334999677e-12, + 8.987987437647504e-12, + 8.987462683796021e-12, + 8.98797182513622e-12 + ], + "bp_grad_norms_F": [ + 1.5789649410180573e-07, + 3.019114402924572e-10, + 3.00178187861988e-10, + 2.999948345294712e-10, + 2.9999083772658253e-10 + ], + "gamma_dfa": -0.0012852016006945632, + "acc_eval": 0.0830078125, + "loss_eval": 2.3029680252075195, + "epoch": 76 + }, + { + "hidden_norms": [ + 10752.4677734375, + 91243824.0, + 123139408.0, + 144679744.0, + 157141888.0 + ], + "bp_grad_norms_per_sample_med": [ + 1.0187789500903932e-09, + 8.908308986310676e-12, + 8.877474276525188e-12, + 8.871863313442141e-12, + 8.872454854147449e-12 + ], + "bp_grad_norms_F": [ + 2.2995939730208192e-07, + 2.996720371850614e-10, + 2.9733623896355255e-10, + 2.9736765827514944e-10, + 2.9736227369348e-10 + ], + "gamma_dfa": 0.0009152928978437558, + "acc_eval": 0.078125, + "loss_eval": 2.3087785243988037, + "epoch": 77 + }, + { + "hidden_norms": [ + 10774.716796875, + 91815512.0, + 124004224.0, + 145694656.0, + 158276032.0 + ], + "bp_grad_norms_per_sample_med": [ + 8.046535660000131e-10, + 8.72336057555767e-12, + 8.693952675831174e-12, + 8.687773590809744e-12, + 8.688093647291062e-12 + ], + "bp_grad_norms_F": [ + 1.826059730092311e-07, + 2.946680122128953e-10, + 2.92846163985061e-10, + 2.9275293300656813e-10, + 2.927521280948753e-10 + ], + "gamma_dfa": 0.0014372464029293042, + "acc_eval": 0.064453125, + "loss_eval": 2.3071916103363037, + "epoch": 78 + }, + { + "hidden_norms": [ + 10790.939453125, + 92420488.0, + 124895360.0, + 146715424.0, + 159350832.0 + ], + "bp_grad_norms_per_sample_med": [ + 7.62354623873307e-10, + 8.534323421571788e-12, + 8.523472726229553e-12, + 8.523020830764061e-12, + 8.520370173292768e-12 + ], + "bp_grad_norms_F": [ + 2.139736210438059e-07, + 2.9157729009021693e-10, + 2.8999641576987756e-10, + 2.899117335086743e-10, + 2.898933315620411e-10 + ], + "gamma_dfa": 0.0007644326506124344, + "acc_eval": 0.107421875, + "loss_eval": 2.307311534881592, + "epoch": 79 + }, + { + "hidden_norms": [ + 10804.537109375, + 93059200.0, + 125634128.0, + 147548304.0, + 160277184.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.631766802378536e-10, + 8.465870365848005e-12, + 8.435890007374436e-12, + 8.433719868305989e-12, + 8.432757096776822e-12 + ], + "bp_grad_norms_F": [ + 1.5449778345555387e-07, + 2.894649520079895e-10, + 2.876322513500895e-10, + 2.8752078495841715e-10, + 2.8753605052500575e-10 + ], + "gamma_dfa": -0.0008484880891046487, + "acc_eval": 0.0703125, + "loss_eval": 2.3064723014831543, + "epoch": 80 + }, + { + "hidden_norms": [ + 10826.3466796875, + 93631016.0, + 126376416.0, + 148363712.0, + 161162256.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.068867630659724e-10, + 8.39008376662953e-12, + 8.381075347618783e-12, + 8.379246949075103e-12, + 8.377123647540508e-12 + ], + "bp_grad_norms_F": [ + 1.5745726500426827e-07, + 2.870276794020299e-10, + 2.8557434195164433e-10, + 2.853116076728668e-10, + 2.853256519941283e-10 + ], + "gamma_dfa": -0.0032648725573380943, + "acc_eval": 0.09375, + "loss_eval": 2.301131248474121, + "epoch": 81 + }, + { + "hidden_norms": [ + 10839.0986328125, + 94148792.0, + 127019560.0, + 149143280.0, + 162023376.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.829024042278917e-10, + 8.344799677650894e-12, + 8.329600897916123e-12, + 8.328910477972684e-12, + 8.32927910671133e-12 + ], + "bp_grad_norms_F": [ + 1.0639800507306063e-07, + 2.8474167468317546e-10, + 2.829097234258171e-10, + 2.8278687724814233e-10, + 2.827818257333803e-10 + ], + "gamma_dfa": 0.0004431852612469811, + "acc_eval": 0.1240234375, + "loss_eval": 2.302319049835205, + "epoch": 82 + }, + { + "hidden_norms": [ + 10845.5009765625, + 94622624.0, + 127620392.0, + 149820912.0, + 162751232.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.976296597014596e-10, + 8.380781311989605e-12, + 8.37097405281817e-12, + 8.368299109218214e-12, + 8.368221046661795e-12 + ], + "bp_grad_norms_F": [ + 1.5657094820653583e-07, + 2.842148183468396e-10, + 2.8250898842507866e-10, + 2.8236088467359366e-10, + 2.8235377924623606e-10 + ], + "gamma_dfa": 0.0011154523126606364, + "acc_eval": 0.0859375, + "loss_eval": 2.3030214309692383, + "epoch": 83 + }, + { + "hidden_norms": [ + 10858.826171875, + 95010072.0, + 128124352.0, + 150449040.0, + 163406224.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.707155303902312e-10, + 8.22641173930938e-12, + 8.219256872332714e-12, + 8.215187211058073e-12, + 8.215540227285434e-12 + ], + "bp_grad_norms_F": [ + 1.3043053570527263e-07, + 2.814159738573352e-10, + 2.796477494015903e-10, + 2.795675912992124e-10, + 2.7956112425009394e-10 + ], + "gamma_dfa": 0.00044634643927565776, + "acc_eval": 0.0849609375, + "loss_eval": 2.3043744564056396, + "epoch": 84 + }, + { + "hidden_norms": [ + 10870.2197265625, + 95329544.0, + 128596424.0, + 150994576.0, + 163991392.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.56519053063198e-10, + 8.213814177426837e-12, + 8.202234898224692e-12, + 8.199945063236402e-12, + 8.200029197324987e-12 + ], + "bp_grad_norms_F": [ + 1.2775484492522082e-07, + 2.8084765069102957e-10, + 2.791658848533274e-10, + 2.790815634146071e-10, + 2.7906171817804193e-10 + ], + "gamma_dfa": 0.00020755327568622306, + "acc_eval": 0.083984375, + "loss_eval": 2.3030991554260254, + "epoch": 85 + }, + { + "hidden_norms": [ + 10879.8818359375, + 95701368.0, + 129014928.0, + 151496160.0, + 164549552.0 + ], + "bp_grad_norms_per_sample_med": [ + 6.791080475743172e-10, + 8.169613423258948e-12, + 8.157244844875233e-12, + 8.15449097135712e-12, + 8.153281869094364e-12 + ], + "bp_grad_norms_F": [ + 1.5473247572117543e-07, + 2.7922636425259384e-10, + 2.774635243785184e-10, + 2.7745489239450194e-10, + 2.774172003228159e-10 + ], + "gamma_dfa": 3.1085157388588414e-05, + "acc_eval": 0.1064453125, + "loss_eval": 2.303433418273926, + "epoch": 86 + }, + { + "hidden_norms": [ + 10884.3349609375, + 95902000.0, + 129303088.0, + 151867408.0, + 164970960.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.919178953066705e-10, + 8.147189520246734e-12, + 8.125238329381723e-12, + 8.123910398560863e-12, + 8.123323194664245e-12 + ], + "bp_grad_norms_F": [ + 9.07293014051902e-08, + 2.7798055524108634e-10, + 2.7618457520972584e-10, + 2.761503803405674e-10, + 2.7613575315221794e-10 + ], + "gamma_dfa": -0.0002183817014156375, + "acc_eval": 0.0849609375, + "loss_eval": 2.304762363433838, + "epoch": 87 + }, + { + "hidden_norms": [ + 10897.5751953125, + 96208496.0, + 129661472.0, + 152266096.0, + 165380960.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.258827817655742e-10, + 8.113974769852206e-12, + 8.097599847600723e-12, + 8.095455729384415e-12, + 8.095571955857306e-12 + ], + "bp_grad_norms_F": [ + 1.5276340548098233e-07, + 2.7692478865581904e-10, + 2.752131300631788e-10, + 2.751227301533987e-10, + 2.751290584246391e-10 + ], + "gamma_dfa": 0.0012931385499541648, + "acc_eval": 0.08203125, + "loss_eval": 2.3039329051971436, + "epoch": 88 + }, + { + "hidden_norms": [ + 10904.84375, + 96462512.0, + 129958240.0, + 152599856.0, + 165729872.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.247893786197722e-10, + 8.085110705935428e-12, + 8.072378702983496e-12, + 8.07249319473291e-12, + 8.071344807791814e-12 + ], + "bp_grad_norms_F": [ + 1.0969206698518974e-07, + 2.758918649092834e-10, + 2.7459995388667835e-10, + 2.7444016503785917e-10, + 2.7442872974070553e-10 + ], + "gamma_dfa": -0.00021380887119448744, + "acc_eval": 0.1181640625, + "loss_eval": 2.3010976314544678, + "epoch": 89 + }, + { + "hidden_norms": [ + 10912.2958984375, + 96621360.0, + 130177664.0, + 152860160.0, + 166016640.0 + ], + "bp_grad_norms_per_sample_med": [ + 5.230118005350448e-10, + 8.057754116719273e-12, + 8.04393184006269e-12, + 8.043486016129364e-12, + 8.04203491994171e-12 + ], + "bp_grad_norms_F": [ + 1.1847043168700111e-07, + 2.7523416878949547e-10, + 2.739179438826511e-10, + 2.7376986788674174e-10, + 2.7375315903022113e-10 + ], + "gamma_dfa": -0.00048403643450001255, + "acc_eval": 0.1083984375, + "loss_eval": 2.3003616333007812, + "epoch": 90 + }, + { + "hidden_norms": [ + 10917.05859375, + 96728752.0, + 130332528.0, + 153046592.0, + 166225136.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.476303216982558e-10, + 8.051880343029616e-12, + 8.02496437357636e-12, + 8.026921141657262e-12, + 8.025202898054307e-12 + ], + "bp_grad_norms_F": [ + 9.623265384561819e-08, + 2.746256555496984e-10, + 2.7323307505433547e-10, + 2.730623227531481e-10, + 2.73067457534637e-10 + ], + "gamma_dfa": -0.0015982053701009136, + "acc_eval": 0.125, + "loss_eval": 2.3003616333007812, + "epoch": 91 + }, + { + "hidden_norms": [ + 10923.0517578125, + 96870376.0, + 130487432.0, + 153217872.0, + 166403392.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7786268558548386e-10, + 8.030507682443844e-12, + 8.02036388691807e-12, + 8.021478446751384e-12, + 8.020081126991485e-12 + ], + "bp_grad_norms_F": [ + 8.926052430524578e-08, + 2.743367200075397e-10, + 2.7284480230704844e-10, + 2.726960879328999e-10, + 2.7270555258418483e-10 + ], + "gamma_dfa": -0.0004921842846670188, + "acc_eval": 0.125, + "loss_eval": 2.300823211669922, + "epoch": 92 + }, + { + "hidden_norms": [ + 10922.423828125, + 96967520.0, + 130610968.0, + 153345712.0, + 166543008.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.468065084584083e-10, + 8.020029952648944e-12, + 8.011922722483966e-12, + 8.012338188756463e-12, + 8.013246316496137e-12 + ], + "bp_grad_norms_F": [ + 1.1504861419098233e-07, + 2.742139570965918e-10, + 2.7267893498716944e-10, + 2.725325520813726e-10, + 2.725419612215063e-10 + ], + "gamma_dfa": -0.0009440958092454821, + "acc_eval": 0.1201171875, + "loss_eval": 2.3005006313323975, + "epoch": 93 + }, + { + "hidden_norms": [ + 10924.3486328125, + 97010512.0, + 130686240.0, + 153444928.0, + 166653632.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.0347483687419583e-10, + 8.026363428059735e-12, + 8.013480504165393e-12, + 8.012077980235066e-12, + 8.010573107619656e-12 + ], + "bp_grad_norms_F": [ + 9.41274009846893e-08, + 2.740666027456484e-10, + 2.725613068577104e-10, + 2.7241114919362985e-10, + 2.7241911504383154e-10 + ], + "gamma_dfa": -0.0009883725906547625, + "acc_eval": 0.1240234375, + "loss_eval": 2.3007426261901855, + "epoch": 94 + }, + { + "hidden_norms": [ + 10926.5390625, + 97067000.0, + 130754976.0, + 153525008.0, + 166741232.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.34201924415234e-10, + 8.020669198249841e-12, + 8.007470554682872e-12, + 8.006251911440998e-12, + 8.004616067203152e-12 + ], + "bp_grad_norms_F": [ + 9.773965103931914e-08, + 2.7412291880857254e-10, + 2.725366043954125e-10, + 2.7240124045313507e-10, + 2.724127867725912e-10 + ], + "gamma_dfa": -0.0006572065904038027, + "acc_eval": 0.1240234375, + "loss_eval": 2.3012468814849854, + "epoch": 95 + }, + { + "hidden_norms": [ + 10928.3896484375, + 97092400.0, + 130798760.0, + 153578400.0, + 166798624.0 + ], + "bp_grad_norms_per_sample_med": [ + 4.0636483067402196e-10, + 8.025032895153661e-12, + 8.005560624135821e-12, + 8.006460078258115e-12, + 8.00502199249653e-12 + ], + "bp_grad_norms_F": [ + 9.727948935278619e-08, + 2.740962179448303e-10, + 2.725039638384885e-10, + 2.72373013032734e-10, + 2.723824221728677e-10 + ], + "gamma_dfa": -0.0003809257905231789, + "acc_eval": 0.1240234375, + "loss_eval": 2.3011176586151123, + "epoch": 96 + }, + { + "hidden_norms": [ + 10928.3759765625, + 97099208.0, + 130815104.0, + 153601264.0, + 166826208.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.9727551803814265e-10, + 8.031460045632155e-12, + 8.006649163116997e-12, + 8.006433190044238e-12, + 8.007052486325161e-12 + ], + "bp_grad_norms_F": [ + 8.93527598577748e-08, + 2.7405827607296374e-10, + 2.7247276657149655e-10, + 2.723416214767127e-10, + 2.723492820155826e-10 + ], + "gamma_dfa": -0.00030210223485482857, + "acc_eval": 0.1240234375, + "loss_eval": 2.301220178604126, + "epoch": 97 + }, + { + "hidden_norms": [ + 10928.6552734375, + 97115416.0, + 130835856.0, + 153625952.0, + 166852032.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.794573821824798e-10, + 8.030101757150465e-12, + 8.005353324680442e-12, + 8.005096585605997e-12, + 8.00570807563128e-12 + ], + "bp_grad_norms_F": [ + 8.692392583498076e-08, + 2.739931892481451e-10, + 2.724127867725912e-10, + 2.7228078125496324e-10, + 2.7228858057171124e-10 + ], + "gamma_dfa": -0.00032888483474380337, + "acc_eval": 0.1240234375, + "loss_eval": 2.3012919425964355, + "epoch": 98 + }, + { + "hidden_norms": [ + 10928.8115234375, + 97125048.0, + 130846640.0, + 153637296.0, + 166864480.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7600883517896477e-10, + 8.028339278098873e-12, + 8.003602121331443e-12, + 8.003305483617051e-12, + 8.003913504195381e-12 + ], + "bp_grad_norms_F": [ + 8.798993178515957e-08, + 2.7396546142810507e-10, + 2.7238306055110684e-10, + 2.7225180443402053e-10, + 2.7225932619501236e-10 + ], + "gamma_dfa": -0.0003425047798373271, + "acc_eval": 0.1240234375, + "loss_eval": 2.301285743713379, + "epoch": 99 + }, + { + "hidden_norms": [ + 10928.8310546875, + 97125584.0, + 130847152.0, + 153637792.0, + 166864928.0 + ], + "bp_grad_norms_per_sample_med": [ + 3.7847944223123875e-10, + 8.028382646185772e-12, + 8.003642019971391e-12, + 8.00335752532133e-12, + 8.003966413261399e-12 + ], + "bp_grad_norms_F": [ + 8.822269847996722e-08, + 2.739633520043583e-10, + 2.7238253319517014e-10, + 2.7225077747772275e-10, + 2.7225843801659266e-10 + ], + "gamma_dfa": -0.0003516010765451938, + "acc_eval": 0.1240234375, + "loss_eval": 2.301274299621582, + "epoch": 100 + } + ] +}
\ No newline at end of file |
