diff options
Diffstat (limited to 'results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json')
| -rw-r--r-- | results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json | 1824 |
1 files changed, 1824 insertions, 0 deletions
diff --git a/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json new file mode 100644 index 0000000..7e5cb37 --- /dev/null +++ b/results/snapshot_no_outln_v1/snapshot_fa_canonical_noln_s42.json @@ -0,0 +1,1824 @@ +{ + "fa_log": [ + { + "hidden_norms": [ + 8.718070030212402, + 8.780964851379395, + 8.812002182006836, + 8.828720092773438, + 8.893179893493652 + ], + "bp_grad_norms_per_sample_med": [ + 0.0005561555735766888, + 0.0005519049009308219, + 0.0005482902633957565, + 0.0005436676437966526, + 0.000538847001735121 + ], + "acc_eval": 0.1123046875, + "epoch": 0 + }, + { + "hidden_norms": [ + 736.34716796875, + 1637.1044921875, + 2033.1922607421875, + 2161.380859375, + 2126.18505859375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0006836718530394137, + 0.0006813183426856995, + 0.0006814387743361294, + 0.0006832550279796124, + 0.0006794488872401416 + ], + "acc_eval": 0.1953125, + "epoch": 1 + }, + { + "hidden_norms": [ + 1106.3868408203125, + 2963.552001953125, + 4087.33837890625, + 4421.4921875, + 4265.1083984375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007476353785023093, + 0.0007440777844749391, + 0.0007443943759426475, + 0.0007477496401406825, + 0.0007366884965449572 + ], + "acc_eval": 0.1044921875, + "epoch": 2 + }, + { + "hidden_norms": [ + 1371.9425048828125, + 4214.05078125, + 6238.47265625, + 6697.2333984375, + 6399.22314453125 + ], + "bp_grad_norms_per_sample_med": [ + 0.000730870058760047, + 0.00072717375587672, + 0.0007270713686011732, + 0.0007290731882676482, + 0.0007233614451251924 + ], + "acc_eval": 0.1943359375, + "epoch": 3 + }, + { + "hidden_norms": [ + 1574.7962646484375, + 4805.0556640625, + 7044.64599609375, + 7593.78955078125, + 7215.32763671875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007098641362972558, + 0.0007034889422357082, + 0.0007031699060462415, + 0.0007120345253497362, + 0.000694308546371758 + ], + "acc_eval": 0.2451171875, + "epoch": 4 + }, + { + "hidden_norms": [ + 1726.088623046875, + 6184.34521484375, + 9521.791015625, + 10387.7236328125, + 9721.431640625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007400272879749537, + 0.0007343650795519352, + 0.0007334973197430372, + 0.0007343514007516205, + 0.0007319966680370271 + ], + "acc_eval": 0.212890625, + "epoch": 5 + }, + { + "hidden_norms": [ + 1902.689697265625, + 7697.52197265625, + 12328.0595703125, + 13597.1787109375, + 12504.158203125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007165716378949583, + 0.0007126733544282615, + 0.0007124089752323925, + 0.0007126083364710212, + 0.0007107863784767687 + ], + "acc_eval": 0.15625, + "epoch": 6 + }, + { + "hidden_norms": [ + 2069.750244140625, + 10379.2958984375, + 16444.7421875, + 18267.94921875, + 16595.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007099996437318623, + 0.0007088935235515237, + 0.0007090346189215779, + 0.000710709486156702, + 0.0007023006328381598 + ], + "acc_eval": 0.154296875, + "epoch": 7 + }, + { + "hidden_norms": [ + 2226.40673828125, + 12703.916015625, + 20184.30859375, + 22453.73828125, + 20183.220703125 + ], + "bp_grad_norms_per_sample_med": [ + 0.00072157580871135, + 0.0007210742915049195, + 0.0007212630589492619, + 0.0007244180305860937, + 0.0007163899717852473 + ], + "acc_eval": 0.2236328125, + "epoch": 8 + }, + { + "hidden_norms": [ + 2289.455078125, + 15611.2138671875, + 24559.412109375, + 27336.787109375, + 24451.6796875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007243232685141265, + 0.0007221215637400746, + 0.0007219284889288247, + 0.0007259267731569707, + 0.0007173537742346525 + ], + "acc_eval": 0.169921875, + "epoch": 9 + }, + { + "hidden_norms": [ + 2396.09814453125, + 19678.587890625, + 30417.08203125, + 34140.70703125, + 30261.052734375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007124242256395519, + 0.0007074667955748737, + 0.0007074963650666177, + 0.0007131542661227286, + 0.0007022957433946431 + ], + "acc_eval": 0.1904296875, + "epoch": 10 + }, + { + "hidden_norms": [ + 2467.864013671875, + 24019.642578125, + 41156.921875, + 46706.38671875, + 41256.71484375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007333463290706277, + 0.0007277126424014568, + 0.0007268521003425121, + 0.000731462670955807, + 0.0007225224399007857 + ], + "acc_eval": 0.169921875, + "epoch": 11 + }, + { + "hidden_norms": [ + 2518.561767578125, + 28957.451171875, + 55737.69140625, + 64112.609375, + 56246.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007202349370345473, + 0.0007073598098941147, + 0.0007049349951557815, + 0.0007059182389639318, + 0.0007044971571303904 + ], + "acc_eval": 0.1513671875, + "epoch": 12 + }, + { + "hidden_norms": [ + 2614.843994140625, + 34279.15625, + 74158.109375, + 86073.96875, + 75187.59375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007299556746147573, + 0.0007100331713445485, + 0.0007101728115230799, + 0.0007166104041971266, + 0.0007030466804280877 + ], + "acc_eval": 0.24609375, + "epoch": 13 + }, + { + "hidden_norms": [ + 2697.871337890625, + 41263.5390625, + 96222.8984375, + 112901.9765625, + 98551.3046875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007336065755225718, + 0.0007151410100050271, + 0.0007150733144953847, + 0.0007166287978179753, + 0.0007151660392992198 + ], + "acc_eval": 0.134765625, + "epoch": 14 + }, + { + "hidden_norms": [ + 2815.983154296875, + 53842.3828125, + 126185.5625, + 149526.796875, + 130144.4765625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007365003693848848, + 0.0007177364313974977, + 0.0007168670417740941, + 0.000717108603566885, + 0.0007130720769055188 + ], + "acc_eval": 0.150390625, + "epoch": 15 + }, + { + "hidden_norms": [ + 2928.448974609375, + 65162.98046875, + 153909.296875, + 184005.875, + 159483.03125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007613440393470228, + 0.000720723532140255, + 0.000720796815585345, + 0.0007208258030004799, + 0.0007211563643068075 + ], + "acc_eval": 0.166015625, + "epoch": 16 + }, + { + "hidden_norms": [ + 2970.975341796875, + 76176.9609375, + 179093.75, + 216167.875, + 186723.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007602480472996831, + 0.0007191941258497536, + 0.0007163456757552922, + 0.0007164765265770257, + 0.0007142137037590146 + ], + "acc_eval": 0.1796875, + "epoch": 17 + }, + { + "hidden_norms": [ + 3078.336181640625, + 91839.40625, + 215980.015625, + 263515.15625, + 227071.515625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007584959384985268, + 0.0007150565506890416, + 0.0007151922909542918, + 0.000715585716534406, + 0.0007152389152906835 + ], + "acc_eval": 0.1767578125, + "epoch": 18 + }, + { + "hidden_norms": [ + 3202.803466796875, + 104358.6875, + 248325.390625, + 305395.84375, + 262365.46875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007867171661928296, + 0.0007155268103815615, + 0.0007155817584134638, + 0.0007157608633860946, + 0.0007155768107622862 + ], + "acc_eval": 0.138671875, + "epoch": 19 + }, + { + "hidden_norms": [ + 3282.27490234375, + 117747.359375, + 284217.3125, + 351018.15625, + 300903.65625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007691550417803228, + 0.0007147297146730125, + 0.0007147309370338917, + 0.0007150261080823839, + 0.0007147534633986652 + ], + "acc_eval": 0.1923828125, + "epoch": 20 + }, + { + "hidden_norms": [ + 3394.945556640625, + 129443.9765625, + 317078.65625, + 393509.375, + 336658.40625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008442914695478976, + 0.0007179519161581993, + 0.0007190873729996383, + 0.000723545381333679, + 0.0007175213540904224 + ], + "acc_eval": 0.1376953125, + "epoch": 21 + }, + { + "hidden_norms": [ + 3484.2763671875, + 140426.171875, + 355086.84375, + 443148.09375, + 378501.53125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007702927687205374, + 0.0006826652679592371, + 0.0006794629734940827, + 0.0006826536264270544, + 0.0006794703076593578 + ], + "acc_eval": 0.19140625, + "epoch": 22 + }, + { + "hidden_norms": [ + 3529.414306640625, + 153612.265625, + 393522.9375, + 493183.03125, + 421284.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008731107809580863, + 0.0007047304534353316, + 0.0007038630428723991, + 0.000708943116478622, + 0.000701444165315479 + ], + "acc_eval": 0.16796875, + "epoch": 23 + }, + { + "hidden_norms": [ + 3604.90283203125, + 165405.75, + 423586.46875, + 533219.375, + 454992.90625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008110221242532134, + 0.0006812610663473606, + 0.0006812110659666359, + 0.0006817537359893322, + 0.0006813214858993888 + ], + "acc_eval": 0.20703125, + "epoch": 24 + }, + { + "hidden_norms": [ + 3761.85400390625, + 178944.296875, + 464984.875, + 587869.375, + 501438.21875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008038324886001647, + 0.0006578225293196738, + 0.0006502956384792924, + 0.000664222112391144, + 0.0006502254982478917 + ], + "acc_eval": 0.240234375, + "epoch": 25 + }, + { + "hidden_norms": [ + 3818.5869140625, + 193167.4375, + 505599.375, + 643764.4375, + 550033.3125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007956585614010692, + 0.0007038708426989615, + 0.0007025190279819071, + 0.0007078333292156458, + 0.0006988184759393334 + ], + "acc_eval": 0.185546875, + "epoch": 26 + }, + { + "hidden_norms": [ + 3924.1787109375, + 207801.1875, + 548741.125, + 701043.0625, + 599520.4375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009222823427990079, + 0.000673642847687006, + 0.0006724554114043713, + 0.0006726986612193286, + 0.0006725445855408907 + ], + "acc_eval": 0.216796875, + "epoch": 27 + }, + { + "hidden_norms": [ + 4061.806884765625, + 222595.921875, + 590807.5, + 755718.75, + 646775.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008092334610410035, + 0.0007093537133187056, + 0.0007078479393385351, + 0.0007069098646752536, + 0.0007029378321021795 + ], + "acc_eval": 0.2158203125, + "epoch": 28 + }, + { + "hidden_norms": [ + 4216.11083984375, + 237549.296875, + 636429.5625, + 816954.9375, + 699524.9375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008620031294412911, + 0.0007326522027142346, + 0.00072627910412848, + 0.000725903722923249, + 0.0007269763154909015 + ], + "acc_eval": 0.1533203125, + "epoch": 29 + }, + { + "hidden_norms": [ + 4319.05029296875, + 251667.5, + 681409.75, + 874567.9375, + 748820.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008448463049717247, + 0.0007160686072893441, + 0.000714016379788518, + 0.0007141274982132018, + 0.0007095346227288246 + ], + "acc_eval": 0.1591796875, + "epoch": 30 + }, + { + "hidden_norms": [ + 4387.8330078125, + 268470.375, + 733153.125, + 943456.375, + 808793.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009849616326391697, + 0.0007160623208619654, + 0.0007154300110414624, + 0.0007152247708290815, + 0.0007160453242249787 + ], + "acc_eval": 0.1884765625, + "epoch": 31 + }, + { + "hidden_norms": [ + 4495.54638671875, + 291274.59375, + 806698.75, + 1039374.875, + 892062.1875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008646573405712843, + 0.000731874315533787, + 0.0007177238585427403, + 0.0007205329020507634, + 0.0007192457560449839 + ], + "acc_eval": 0.17578125, + "epoch": 32 + }, + { + "hidden_norms": [ + 4596.96337890625, + 305228.46875, + 848072.5625, + 1092268.625, + 937583.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009474663529545069, + 0.0007221641135402024, + 0.000721680698916316, + 0.0007284134044311941, + 0.0007212713244371116 + ], + "acc_eval": 0.171875, + "epoch": 33 + }, + { + "hidden_norms": [ + 4724.111328125, + 321366.5, + 891238.9375, + 1149886.25, + 987910.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009131877450272441, + 0.0007397676818072796, + 0.0007398735033348203, + 0.0007397927111014724, + 0.0007406016811728477 + ], + "acc_eval": 0.125, + "epoch": 34 + }, + { + "hidden_norms": [ + 4865.970703125, + 344027.15625, + 946722.0625, + 1219714.625, + 1049445.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001010064734145999, + 0.0007341124583035707, + 0.0007336883572861552, + 0.0007345521007664502, + 0.0007338698487728834 + ], + "acc_eval": 0.119140625, + "epoch": 35 + }, + { + "hidden_norms": [ + 5003.3857421875, + 373410.21875, + 1026535.0625, + 1321456.25, + 1139824.625 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010555180488154292, + 0.0007112861494533718, + 0.0007111895247362554, + 0.0007112334715202451, + 0.000711193191818893 + ], + "acc_eval": 0.1591796875, + "epoch": 36 + }, + { + "hidden_norms": [ + 5121.19287109375, + 405646.9375, + 1111111.125, + 1430716.625, + 1237074.375 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010308363707736135, + 0.0007563655963167548, + 0.0007560031372122467, + 0.000755665882024914, + 0.0007561628590337932 + ], + "acc_eval": 0.134765625, + "epoch": 37 + }, + { + "hidden_norms": [ + 5212.7294921875, + 434054.15625, + 1180238.125, + 1518019.875, + 1314350.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001035128254443407, + 0.0007314062095247209, + 0.0007304889149963856, + 0.0007291524088941514, + 0.0007313747191801667 + ], + "acc_eval": 0.140625, + "epoch": 38 + }, + { + "hidden_norms": [ + 5322.74951171875, + 462000.6875, + 1248006.75, + 1606243.125, + 1392563.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009023830061778426, + 0.000720554031431675, + 0.0007195135112851858, + 0.0007197313825599849, + 0.0007196948863565922 + ], + "acc_eval": 0.1708984375, + "epoch": 39 + }, + { + "hidden_norms": [ + 5453.89111328125, + 498941.0625, + 1343521.0, + 1731177.375, + 1504101.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010444134240970016, + 0.0007362678297795355, + 0.0007352089160121977, + 0.0007340405718423426, + 0.0007357052527368069 + ], + "acc_eval": 0.1328125, + "epoch": 40 + }, + { + "hidden_norms": [ + 5515.6982421875, + 529817.75, + 1409505.625, + 1816151.0, + 1580539.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011280628386884928, + 0.0007231750059872866, + 0.0007211649208329618, + 0.000721275107935071, + 0.0007212632917799056 + ], + "acc_eval": 0.1611328125, + "epoch": 41 + }, + { + "hidden_norms": [ + 5617.26513671875, + 567492.4375, + 1498097.5, + 1931607.875, + 1684206.875 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010544253746047616, + 0.0007354306289926171, + 0.0007348860381171107, + 0.0007349851075559855, + 0.0007350810337811708 + ], + "acc_eval": 0.1416015625, + "epoch": 42 + }, + { + "hidden_norms": [ + 5740.7978515625, + 596215.625, + 1561745.25, + 2014107.25, + 1758526.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010764201870188117, + 0.0007244387525133789, + 0.000723967794328928, + 0.000724096957128495, + 0.0007241644198074937 + ], + "acc_eval": 0.19921875, + "epoch": 43 + }, + { + "hidden_norms": [ + 5808.19677734375, + 630780.3125, + 1636034.875, + 2109305.75, + 1845552.125 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010526466649025679, + 0.0007206913433037698, + 0.0007207048474811018, + 0.0007211468764580786, + 0.0007207895396277308 + ], + "acc_eval": 0.173828125, + "epoch": 44 + }, + { + "hidden_norms": [ + 5868.3583984375, + 673578.625, + 1729325.25, + 2227518.0, + 1953361.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009479392319917679, + 0.0007091389270499349, + 0.0007090644794516265, + 0.0007082624360918999, + 0.0007085782708600163 + ], + "acc_eval": 0.1923828125, + "epoch": 45 + }, + { + "hidden_norms": [ + 5953.82421875, + 720273.0, + 1840695.5, + 2372038.0, + 2084658.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0014002618845552206, + 0.0007315247785300016, + 0.0007256051758304238, + 0.0007254919619299471, + 0.000725599646102637 + ], + "acc_eval": 0.17578125, + "epoch": 46 + }, + { + "hidden_norms": [ + 6054.7861328125, + 758000.6875, + 1930354.375, + 2488163.75, + 2190582.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001109408913180232, + 0.0007018125616014004, + 0.0007016566814854741, + 0.000701890152413398, + 0.0007018494652584195 + ], + "acc_eval": 0.203125, + "epoch": 47 + }, + { + "hidden_norms": [ + 6155.0859375, + 790443.0, + 2009565.875, + 2590829.25, + 2285268.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010253023356199265, + 0.0007347314967773855, + 0.0007304528844542801, + 0.0007322027231566608, + 0.0007312395609915257 + ], + "acc_eval": 0.154296875, + "epoch": 48 + }, + { + "hidden_norms": [ + 6216.64453125, + 830678.125, + 2088773.5, + 2691122.0, + 2376731.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010403504129499197, + 0.0006902964669279754, + 0.0006906419876031578, + 0.0006905900663696229, + 0.0006906461785547435 + ], + "acc_eval": 0.1591796875, + "epoch": 49 + }, + { + "hidden_norms": [ + 6252.98486328125, + 867790.1875, + 2159729.75, + 2781409.5, + 2460902.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0011370684951543808, + 0.0007390088285319507, + 0.0007305812323465943, + 0.0007310720975510776, + 0.0007304322207346559 + ], + "acc_eval": 0.15234375, + "epoch": 50 + }, + { + "hidden_norms": [ + 6294.51611328125, + 897267.5625, + 2218282.5, + 2858224.75, + 2530432.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0013790406519547105, + 0.0007320911972783506, + 0.0007304649334400892, + 0.0007293879170902073, + 0.0007303770980797708 + ], + "acc_eval": 0.1591796875, + "epoch": 51 + }, + { + "hidden_norms": [ + 6312.2314453125, + 935570.375, + 2299086.0, + 2963619.0, + 2627515.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000999285257421434, + 0.0007227054447866976, + 0.0007246703025884926, + 0.0007245387532748282, + 0.0007243558065965772 + ], + "acc_eval": 0.20703125, + "epoch": 52 + }, + { + "hidden_norms": [ + 6387.30322265625, + 977101.125, + 2387243.0, + 3077676.25, + 2733147.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.001396833686158061, + 0.0007110408041626215, + 0.0007093287422321737, + 0.000708233390469104, + 0.0007085108081810176 + ], + "acc_eval": 0.1787109375, + "epoch": 53 + }, + { + "hidden_norms": [ + 6406.59033203125, + 1011753.1875, + 2450391.25, + 3158275.0, + 2807055.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0012408416951075196, + 0.0007304692408069968, + 0.000724659999832511, + 0.0007247650064527988, + 0.0007249858463183045 + ], + "acc_eval": 0.130859375, + "epoch": 54 + }, + { + "hidden_norms": [ + 6396.32080078125, + 1051044.375, + 2521085.5, + 3249326.75, + 2890642.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010854896390810609, + 0.0006957638543099165, + 0.0006896257400512695, + 0.0006964386557228863, + 0.0006897017010487616 + ], + "acc_eval": 0.234375, + "epoch": 55 + }, + { + "hidden_norms": [ + 6413.91357421875, + 1083474.5, + 2597945.5, + 3348271.5, + 2981405.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.00098806235473603, + 0.000719150179065764, + 0.0007170068565756083, + 0.0007178731029853225, + 0.0007173708290793002 + ], + "acc_eval": 0.205078125, + "epoch": 56 + }, + { + "hidden_norms": [ + 6406.4228515625, + 1124429.875, + 2675529.5, + 3447474.25, + 3073241.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.001149638439528644, + 0.0007225789595395327, + 0.0007212197524495423, + 0.0007210947806015611, + 0.0007211659685708582 + ], + "acc_eval": 0.1494140625, + "epoch": 57 + }, + { + "hidden_norms": [ + 6443.423828125, + 1166184.375, + 2758561.25, + 3551879.75, + 3171214.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.001115654013119638, + 0.000685695675201714, + 0.0006846366450190544, + 0.0006861463189125061, + 0.0006862673326395452 + ], + "acc_eval": 0.2490234375, + "epoch": 58 + }, + { + "hidden_norms": [ + 6477.5, + 1208826.0, + 2842194.75, + 3654862.0, + 3267617.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.000923235435038805, + 0.0006659153732471168, + 0.0006642267107963562, + 0.0006722065154463053, + 0.000664416525978595 + ], + "acc_eval": 0.2353515625, + "epoch": 59 + }, + { + "hidden_norms": [ + 6486.1689453125, + 1249377.0, + 2928293.75, + 3765881.75, + 3370835.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008846685523167253, + 0.0006866253679618239, + 0.000686973100528121, + 0.0006869880016893148, + 0.0006870955694466829 + ], + "acc_eval": 0.2373046875, + "epoch": 60 + }, + { + "hidden_norms": [ + 6499.3720703125, + 1291233.25, + 3012714.75, + 3873429.75, + 3471234.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009820004925131798, + 0.0007174524944275618, + 0.0007178467349149287, + 0.0007176626822911203, + 0.0007174718775786459 + ], + "acc_eval": 0.216796875, + "epoch": 61 + }, + { + "hidden_norms": [ + 6486.14404296875, + 1327247.75, + 3088322.75, + 3971415.75, + 3562299.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010241338750347495, + 0.0007171124452725053, + 0.0007174332858994603, + 0.0007172181503847241, + 0.0007169945747591555 + ], + "acc_eval": 0.18359375, + "epoch": 62 + }, + { + "hidden_norms": [ + 6455.17236328125, + 1355067.375, + 3142698.25, + 4041006.5, + 3627490.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009781530825421214, + 0.0007034538430161774, + 0.000703376077581197, + 0.0007118352805264294, + 0.0007080681971274316 + ], + "acc_eval": 0.189453125, + "epoch": 63 + }, + { + "hidden_norms": [ + 6454.62841796875, + 1384795.75, + 3199654.0, + 4114095.75, + 3696468.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009227422997355461, + 0.0007023688522167504, + 0.0007012909045442939, + 0.0007004260551184416, + 0.0007006779196672142 + ], + "acc_eval": 0.21484375, + "epoch": 64 + }, + { + "hidden_norms": [ + 6451.345703125, + 1420232.75, + 3260116.5, + 4190244.25, + 3768354.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008870494784787297, + 0.0007146014831960201, + 0.0007149986922740936, + 0.0007148014265112579, + 0.0007145918207243085 + ], + "acc_eval": 0.197265625, + "epoch": 65 + }, + { + "hidden_norms": [ + 6445.890625, + 1448264.875, + 3319505.0, + 4267505.0, + 3840047.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0010003555798903108, + 0.0007171350298449397, + 0.0007168895681388676, + 0.0007169176824390888, + 0.0007170233875513077 + ], + "acc_eval": 0.1591796875, + "epoch": 66 + }, + { + "hidden_norms": [ + 6440.8212890625, + 1478082.75, + 3376291.25, + 4340727.0, + 3909334.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009646597318351269, + 0.0007130720769055188, + 0.0007134011830203235, + 0.0007131980964913964, + 0.0007129770237952471 + ], + "acc_eval": 0.171875, + "epoch": 67 + }, + { + "hidden_norms": [ + 6398.03955078125, + 1508487.5, + 3436526.25, + 4417271.5, + 3981251.75 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009445869363844395, + 0.0007122856914065778, + 0.0007126569980755448, + 0.0007124742260202765, + 0.0007122504175640643 + ], + "acc_eval": 0.189453125, + "epoch": 68 + }, + { + "hidden_norms": [ + 6389.02392578125, + 1530834.625, + 3480246.5, + 4471170.0, + 4032576.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009853171650320292, + 0.0006874292739666998, + 0.0006876476109027863, + 0.0006881517474539578, + 0.0006880395230837166 + ], + "acc_eval": 0.1904296875, + "epoch": 69 + }, + { + "hidden_norms": [ + 6338.54443359375, + 1561198.875, + 3541681.5, + 4548099.0, + 4105499.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009333671187050641, + 0.0006952910916879773, + 0.0006947650690563023, + 0.0006940987077541649, + 0.0006943742628209293 + ], + "acc_eval": 0.23046875, + "epoch": 70 + }, + { + "hidden_norms": [ + 6280.18603515625, + 1585008.0, + 3589125.25, + 4608667.0, + 4162480.25 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009699579677544534, + 0.0007101434166543186, + 0.0007104446412995458, + 0.000710242718923837, + 0.0007100136135704815 + ], + "acc_eval": 0.146484375, + "epoch": 71 + }, + { + "hidden_norms": [ + 6252.455078125, + 1608187.875, + 3635014.75, + 4667478.5, + 4218253.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008955001248978078, + 0.0006863236776553094, + 0.0006864941096864641, + 0.000687020889017731, + 0.0006868807831779122 + ], + "acc_eval": 0.2431640625, + "epoch": 72 + }, + { + "hidden_norms": [ + 6201.6845703125, + 1619508.875, + 3661275.25, + 4700652.0, + 4249921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009069991065189242, + 0.0006539999740198255, + 0.0006531713879667222, + 0.0006594359292648733, + 0.000653320224955678 + ], + "acc_eval": 0.2216796875, + "epoch": 73 + }, + { + "hidden_norms": [ + 6182.8115234375, + 1632587.875, + 3679586.25, + 4722070.5, + 4271567.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009595821611583233, + 0.0007079984061419964, + 0.0007082773372530937, + 0.0007081056828610599, + 0.000707884959410876 + ], + "acc_eval": 0.193359375, + "epoch": 74 + }, + { + "hidden_norms": [ + 6153.7392578125, + 1653576.875, + 3722935.0, + 4776921.0, + 4323508.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008598894928582013, + 0.0007073319284245372, + 0.0007075938628986478, + 0.0007074539898894727, + 0.0007072555599734187 + ], + "acc_eval": 0.201171875, + "epoch": 75 + }, + { + "hidden_norms": [ + 6135.21240234375, + 1667474.375, + 3750912.75, + 4812450.5, + 4357575.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0009454588289372623, + 0.0007068001432344317, + 0.0007069715647958219, + 0.0007067638216540217, + 0.0007065933896228671 + ], + "acc_eval": 0.2158203125, + "epoch": 76 + }, + { + "hidden_norms": [ + 6085.7109375, + 1679251.75, + 3774334.5, + 4840148.5, + 4384792.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008410231093876064, + 0.0006843701121397316, + 0.0006845371681265533, + 0.00068506138632074, + 0.0006849151104688644 + ], + "acc_eval": 0.2578125, + "epoch": 77 + }, + { + "hidden_norms": [ + 6042.693359375, + 1685705.5, + 3787479.75, + 4856211.0, + 4400193.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008572259685024619, + 0.0006840305286459625, + 0.0006841861759312451, + 0.0006847094628028572, + 0.0006845552125014365 + ], + "acc_eval": 0.2568359375, + "epoch": 78 + }, + { + "hidden_norms": [ + 6003.5390625, + 1702685.5, + 3813174.5, + 4888481.0, + 4430612.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008342780056409538, + 0.0006777377566322684, + 0.0006779460818506777, + 0.0006789933540858328, + 0.0006781259435229003 + ], + "acc_eval": 0.2685546875, + "epoch": 79 + }, + { + "hidden_norms": [ + 5948.60107421875, + 1714243.125, + 3830846.5, + 4910337.5, + 4451921.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008218465954996645, + 0.0006832804065197706, + 0.0006831764476373792, + 0.0006826326716691256, + 0.0006829035119153559 + ], + "acc_eval": 0.2529296875, + "epoch": 80 + }, + { + "hidden_norms": [ + 5881.8525390625, + 1718113.375, + 3838036.5, + 4920025.5, + 4461931.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007958809728734195, + 0.000677398347761482, + 0.0006775528891012073, + 0.0006775871734134853, + 0.0006777321686968207 + ], + "acc_eval": 0.2548828125, + "epoch": 81 + }, + { + "hidden_norms": [ + 5816.7880859375, + 1723461.25, + 3850904.75, + 4936806.0, + 4478473.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008361428044736385, + 0.0006769691244699061, + 0.0006771331536583602, + 0.0006771665066480637, + 0.0006773129571229219 + ], + "acc_eval": 0.251953125, + "epoch": 82 + }, + { + "hidden_norms": [ + 5760.41845703125, + 1732135.25, + 3859576.0, + 4947171.0, + 4488986.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008036325452849269, + 0.0006821549613960087, + 0.0006806753808632493, + 0.0006799713592045009, + 0.0006802318384870887 + ], + "acc_eval": 0.2490234375, + "epoch": 83 + }, + { + "hidden_norms": [ + 5710.22998046875, + 1740014.25, + 3871992.25, + 4962337.5, + 4503463.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008278922759927809, + 0.0006754198693670332, + 0.000675307004712522, + 0.0006768241291865706, + 0.0006769676692783833 + ], + "acc_eval": 0.26171875, + "epoch": 84 + }, + { + "hidden_norms": [ + 5685.73828125, + 1745863.25, + 3880256.75, + 4973639.5, + 4514457.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008255501161329448, + 0.0006466225022450089, + 0.0006466452032327652, + 0.0006467151688411832, + 0.0006467655766755342 + ], + "acc_eval": 0.283203125, + "epoch": 85 + }, + { + "hidden_norms": [ + 5637.498046875, + 1743128.375, + 3879796.5, + 4973009.0, + 4514424.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008148956694640219, + 0.0006465681362897158, + 0.0006463592289946973, + 0.0006491504609584808, + 0.0006464755861088634 + ], + "acc_eval": 0.2587890625, + "epoch": 86 + }, + { + "hidden_norms": [ + 5601.87744140625, + 1741859.375, + 3884447.75, + 4978445.5, + 4518886.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008254973217844963, + 0.0006783050484955311, + 0.0006774527719244361, + 0.0006768335006199777, + 0.0006770920008420944 + ], + "acc_eval": 0.298828125, + "epoch": 87 + }, + { + "hidden_norms": [ + 5587.505859375, + 1748285.875, + 3887730.5, + 4982144.0, + 4523151.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008113561780191958, + 0.0006764904828742146, + 0.000676542054861784, + 0.0006762324483133852, + 0.0006764894351363182 + ], + "acc_eval": 0.2734375, + "epoch": 88 + }, + { + "hidden_norms": [ + 5553.013671875, + 1748456.75, + 3890722.0, + 4986538.5, + 4527315.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007909060223028064, + 0.0006763285491615534, + 0.0006762049742974341, + 0.0006756742368452251, + 0.000675930583383888 + ], + "acc_eval": 0.2861328125, + "epoch": 89 + }, + { + "hidden_norms": [ + 5524.611328125, + 1748210.0, + 3893003.75, + 4989732.5, + 4530436.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.000797618820797652, + 0.0006453269743360579, + 0.0006453663809224963, + 0.0006454290705733001, + 0.0006454723770730197 + ], + "acc_eval": 0.28515625, + "epoch": 90 + }, + { + "hidden_norms": [ + 5506.21923828125, + 1750958.0, + 3894639.5, + 4992073.0, + 4532399.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007834367570467293, + 0.0006762953125871718, + 0.0006754640489816666, + 0.0006748714949935675, + 0.0006751226610504091 + ], + "acc_eval": 0.2939453125, + "epoch": 91 + }, + { + "hidden_norms": [ + 5485.10791015625, + 1747546.25, + 3895030.0, + 4992480.5, + 4532805.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007779909064993262, + 0.0006450997898355126, + 0.0006451247027143836, + 0.0006455867551267147, + 0.0006452234229072928 + ], + "acc_eval": 0.2890625, + "epoch": 92 + }, + { + "hidden_norms": [ + 5464.07763671875, + 1749313.125, + 3894610.75, + 4991684.0, + 4532270.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0008090221090242267, + 0.0006661301013082266, + 0.0006646219990216196, + 0.0006726695573888719, + 0.0006649038987234235 + ], + "acc_eval": 0.283203125, + "epoch": 93 + }, + { + "hidden_norms": [ + 5451.2841796875, + 1749389.0, + 3894315.25, + 4990837.5, + 4531011.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007907215040177107, + 0.0006448677740991116, + 0.0006448915228247643, + 0.0006451430963352323, + 0.0006449950742535293 + ], + "acc_eval": 0.2958984375, + "epoch": 94 + }, + { + "hidden_norms": [ + 5437.77099609375, + 1750653.125, + 3895251.75, + 4992303.0, + 4532441.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007774807745590806, + 0.000676269584801048, + 0.0006763145211152732, + 0.0006763775018043816, + 0.000676501716952771 + ], + "acc_eval": 0.2763671875, + "epoch": 95 + }, + { + "hidden_norms": [ + 5427.34619140625, + 1751408.875, + 3894547.75, + 4991554.5, + 4532145.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797307334840298, + 0.000664835621137172, + 0.0006642266525886953, + 0.000671364541631192, + 0.0006645115208812058 + ], + "acc_eval": 0.296875, + "epoch": 96 + }, + { + "hidden_norms": [ + 5420.30615234375, + 1751757.5, + 3894027.5, + 4991042.0, + 4531674.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007797667058184743, + 0.0006446840125136077, + 0.0006447113119065762, + 0.0006447701598517597, + 0.0006448116037063301 + ], + "acc_eval": 0.2939453125, + "epoch": 97 + }, + { + "hidden_norms": [ + 5416.81396484375, + 1751629.625, + 3893959.25, + 4991021.5, + 4531639.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007706825854256749, + 0.0006446407060138881, + 0.0006406756583601236, + 0.0006447536870837212, + 0.0006393496878445148 + ], + "acc_eval": 0.306640625, + "epoch": 98 + }, + { + "hidden_norms": [ + 5415.3095703125, + 1751552.75, + 3893897.0, + 4990973.0, + 4531587.5 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007776900893077254, + 0.0006458400748670101, + 0.0006446869228966534, + 0.0006466003833338618, + 0.0006447876221500337 + ], + "acc_eval": 0.2978515625, + "epoch": 99 + }, + { + "hidden_norms": [ + 5414.92822265625, + 1751530.25, + 3893876.5, + 4990954.0, + 4531568.0 + ], + "bp_grad_norms_per_sample_med": [ + 0.0007761479937471449, + 0.0006465426995418966, + 0.0006446881452575326, + 0.0006466349004767835, + 0.0006447875639423728 + ], + "acc_eval": 0.294921875, + "epoch": 100 + } + ], + "arch": "resmlp_noln", + "seed": 42 +}
\ No newline at end of file |
