summaryrefslogtreecommitdiff
path: root/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json
diff options
context:
space:
mode:
Diffstat (limited to 'results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json')
-rw-r--r--results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json1824
1 files changed, 1824 insertions, 0 deletions
diff --git a/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json
new file mode 100644
index 0000000..7e5cb37
--- /dev/null
+++ b/results/snapshot_no_outln_v1/snapshot_fa_noln_s42.json
@@ -0,0 +1,1824 @@
+{
+ "fa_log": [
+ {
+ "hidden_norms": [
+ 8.718070030212402,
+ 8.780964851379395,
+ 8.812002182006836,
+ 8.828720092773438,
+ 8.893179893493652
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0005561555735766888,
+ 0.0005519049009308219,
+ 0.0005482902633957565,
+ 0.0005436676437966526,
+ 0.000538847001735121
+ ],
+ "acc_eval": 0.1123046875,
+ "epoch": 0
+ },
+ {
+ "hidden_norms": [
+ 736.34716796875,
+ 1637.1044921875,
+ 2033.1922607421875,
+ 2161.380859375,
+ 2126.18505859375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0006836718530394137,
+ 0.0006813183426856995,
+ 0.0006814387743361294,
+ 0.0006832550279796124,
+ 0.0006794488872401416
+ ],
+ "acc_eval": 0.1953125,
+ "epoch": 1
+ },
+ {
+ "hidden_norms": [
+ 1106.3868408203125,
+ 2963.552001953125,
+ 4087.33837890625,
+ 4421.4921875,
+ 4265.1083984375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007476353785023093,
+ 0.0007440777844749391,
+ 0.0007443943759426475,
+ 0.0007477496401406825,
+ 0.0007366884965449572
+ ],
+ "acc_eval": 0.1044921875,
+ "epoch": 2
+ },
+ {
+ "hidden_norms": [
+ 1371.9425048828125,
+ 4214.05078125,
+ 6238.47265625,
+ 6697.2333984375,
+ 6399.22314453125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000730870058760047,
+ 0.00072717375587672,
+ 0.0007270713686011732,
+ 0.0007290731882676482,
+ 0.0007233614451251924
+ ],
+ "acc_eval": 0.1943359375,
+ "epoch": 3
+ },
+ {
+ "hidden_norms": [
+ 1574.7962646484375,
+ 4805.0556640625,
+ 7044.64599609375,
+ 7593.78955078125,
+ 7215.32763671875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007098641362972558,
+ 0.0007034889422357082,
+ 0.0007031699060462415,
+ 0.0007120345253497362,
+ 0.000694308546371758
+ ],
+ "acc_eval": 0.2451171875,
+ "epoch": 4
+ },
+ {
+ "hidden_norms": [
+ 1726.088623046875,
+ 6184.34521484375,
+ 9521.791015625,
+ 10387.7236328125,
+ 9721.431640625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007400272879749537,
+ 0.0007343650795519352,
+ 0.0007334973197430372,
+ 0.0007343514007516205,
+ 0.0007319966680370271
+ ],
+ "acc_eval": 0.212890625,
+ "epoch": 5
+ },
+ {
+ "hidden_norms": [
+ 1902.689697265625,
+ 7697.52197265625,
+ 12328.0595703125,
+ 13597.1787109375,
+ 12504.158203125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007165716378949583,
+ 0.0007126733544282615,
+ 0.0007124089752323925,
+ 0.0007126083364710212,
+ 0.0007107863784767687
+ ],
+ "acc_eval": 0.15625,
+ "epoch": 6
+ },
+ {
+ "hidden_norms": [
+ 2069.750244140625,
+ 10379.2958984375,
+ 16444.7421875,
+ 18267.94921875,
+ 16595.220703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007099996437318623,
+ 0.0007088935235515237,
+ 0.0007090346189215779,
+ 0.000710709486156702,
+ 0.0007023006328381598
+ ],
+ "acc_eval": 0.154296875,
+ "epoch": 7
+ },
+ {
+ "hidden_norms": [
+ 2226.40673828125,
+ 12703.916015625,
+ 20184.30859375,
+ 22453.73828125,
+ 20183.220703125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.00072157580871135,
+ 0.0007210742915049195,
+ 0.0007212630589492619,
+ 0.0007244180305860937,
+ 0.0007163899717852473
+ ],
+ "acc_eval": 0.2236328125,
+ "epoch": 8
+ },
+ {
+ "hidden_norms": [
+ 2289.455078125,
+ 15611.2138671875,
+ 24559.412109375,
+ 27336.787109375,
+ 24451.6796875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007243232685141265,
+ 0.0007221215637400746,
+ 0.0007219284889288247,
+ 0.0007259267731569707,
+ 0.0007173537742346525
+ ],
+ "acc_eval": 0.169921875,
+ "epoch": 9
+ },
+ {
+ "hidden_norms": [
+ 2396.09814453125,
+ 19678.587890625,
+ 30417.08203125,
+ 34140.70703125,
+ 30261.052734375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007124242256395519,
+ 0.0007074667955748737,
+ 0.0007074963650666177,
+ 0.0007131542661227286,
+ 0.0007022957433946431
+ ],
+ "acc_eval": 0.1904296875,
+ "epoch": 10
+ },
+ {
+ "hidden_norms": [
+ 2467.864013671875,
+ 24019.642578125,
+ 41156.921875,
+ 46706.38671875,
+ 41256.71484375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007333463290706277,
+ 0.0007277126424014568,
+ 0.0007268521003425121,
+ 0.000731462670955807,
+ 0.0007225224399007857
+ ],
+ "acc_eval": 0.169921875,
+ "epoch": 11
+ },
+ {
+ "hidden_norms": [
+ 2518.561767578125,
+ 28957.451171875,
+ 55737.69140625,
+ 64112.609375,
+ 56246.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007202349370345473,
+ 0.0007073598098941147,
+ 0.0007049349951557815,
+ 0.0007059182389639318,
+ 0.0007044971571303904
+ ],
+ "acc_eval": 0.1513671875,
+ "epoch": 12
+ },
+ {
+ "hidden_norms": [
+ 2614.843994140625,
+ 34279.15625,
+ 74158.109375,
+ 86073.96875,
+ 75187.59375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007299556746147573,
+ 0.0007100331713445485,
+ 0.0007101728115230799,
+ 0.0007166104041971266,
+ 0.0007030466804280877
+ ],
+ "acc_eval": 0.24609375,
+ "epoch": 13
+ },
+ {
+ "hidden_norms": [
+ 2697.871337890625,
+ 41263.5390625,
+ 96222.8984375,
+ 112901.9765625,
+ 98551.3046875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007336065755225718,
+ 0.0007151410100050271,
+ 0.0007150733144953847,
+ 0.0007166287978179753,
+ 0.0007151660392992198
+ ],
+ "acc_eval": 0.134765625,
+ "epoch": 14
+ },
+ {
+ "hidden_norms": [
+ 2815.983154296875,
+ 53842.3828125,
+ 126185.5625,
+ 149526.796875,
+ 130144.4765625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007365003693848848,
+ 0.0007177364313974977,
+ 0.0007168670417740941,
+ 0.000717108603566885,
+ 0.0007130720769055188
+ ],
+ "acc_eval": 0.150390625,
+ "epoch": 15
+ },
+ {
+ "hidden_norms": [
+ 2928.448974609375,
+ 65162.98046875,
+ 153909.296875,
+ 184005.875,
+ 159483.03125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007613440393470228,
+ 0.000720723532140255,
+ 0.000720796815585345,
+ 0.0007208258030004799,
+ 0.0007211563643068075
+ ],
+ "acc_eval": 0.166015625,
+ "epoch": 16
+ },
+ {
+ "hidden_norms": [
+ 2970.975341796875,
+ 76176.9609375,
+ 179093.75,
+ 216167.875,
+ 186723.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007602480472996831,
+ 0.0007191941258497536,
+ 0.0007163456757552922,
+ 0.0007164765265770257,
+ 0.0007142137037590146
+ ],
+ "acc_eval": 0.1796875,
+ "epoch": 17
+ },
+ {
+ "hidden_norms": [
+ 3078.336181640625,
+ 91839.40625,
+ 215980.015625,
+ 263515.15625,
+ 227071.515625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007584959384985268,
+ 0.0007150565506890416,
+ 0.0007151922909542918,
+ 0.000715585716534406,
+ 0.0007152389152906835
+ ],
+ "acc_eval": 0.1767578125,
+ "epoch": 18
+ },
+ {
+ "hidden_norms": [
+ 3202.803466796875,
+ 104358.6875,
+ 248325.390625,
+ 305395.84375,
+ 262365.46875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007867171661928296,
+ 0.0007155268103815615,
+ 0.0007155817584134638,
+ 0.0007157608633860946,
+ 0.0007155768107622862
+ ],
+ "acc_eval": 0.138671875,
+ "epoch": 19
+ },
+ {
+ "hidden_norms": [
+ 3282.27490234375,
+ 117747.359375,
+ 284217.3125,
+ 351018.15625,
+ 300903.65625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007691550417803228,
+ 0.0007147297146730125,
+ 0.0007147309370338917,
+ 0.0007150261080823839,
+ 0.0007147534633986652
+ ],
+ "acc_eval": 0.1923828125,
+ "epoch": 20
+ },
+ {
+ "hidden_norms": [
+ 3394.945556640625,
+ 129443.9765625,
+ 317078.65625,
+ 393509.375,
+ 336658.40625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008442914695478976,
+ 0.0007179519161581993,
+ 0.0007190873729996383,
+ 0.000723545381333679,
+ 0.0007175213540904224
+ ],
+ "acc_eval": 0.1376953125,
+ "epoch": 21
+ },
+ {
+ "hidden_norms": [
+ 3484.2763671875,
+ 140426.171875,
+ 355086.84375,
+ 443148.09375,
+ 378501.53125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007702927687205374,
+ 0.0006826652679592371,
+ 0.0006794629734940827,
+ 0.0006826536264270544,
+ 0.0006794703076593578
+ ],
+ "acc_eval": 0.19140625,
+ "epoch": 22
+ },
+ {
+ "hidden_norms": [
+ 3529.414306640625,
+ 153612.265625,
+ 393522.9375,
+ 493183.03125,
+ 421284.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008731107809580863,
+ 0.0007047304534353316,
+ 0.0007038630428723991,
+ 0.000708943116478622,
+ 0.000701444165315479
+ ],
+ "acc_eval": 0.16796875,
+ "epoch": 23
+ },
+ {
+ "hidden_norms": [
+ 3604.90283203125,
+ 165405.75,
+ 423586.46875,
+ 533219.375,
+ 454992.90625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008110221242532134,
+ 0.0006812610663473606,
+ 0.0006812110659666359,
+ 0.0006817537359893322,
+ 0.0006813214858993888
+ ],
+ "acc_eval": 0.20703125,
+ "epoch": 24
+ },
+ {
+ "hidden_norms": [
+ 3761.85400390625,
+ 178944.296875,
+ 464984.875,
+ 587869.375,
+ 501438.21875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008038324886001647,
+ 0.0006578225293196738,
+ 0.0006502956384792924,
+ 0.000664222112391144,
+ 0.0006502254982478917
+ ],
+ "acc_eval": 0.240234375,
+ "epoch": 25
+ },
+ {
+ "hidden_norms": [
+ 3818.5869140625,
+ 193167.4375,
+ 505599.375,
+ 643764.4375,
+ 550033.3125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007956585614010692,
+ 0.0007038708426989615,
+ 0.0007025190279819071,
+ 0.0007078333292156458,
+ 0.0006988184759393334
+ ],
+ "acc_eval": 0.185546875,
+ "epoch": 26
+ },
+ {
+ "hidden_norms": [
+ 3924.1787109375,
+ 207801.1875,
+ 548741.125,
+ 701043.0625,
+ 599520.4375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009222823427990079,
+ 0.000673642847687006,
+ 0.0006724554114043713,
+ 0.0006726986612193286,
+ 0.0006725445855408907
+ ],
+ "acc_eval": 0.216796875,
+ "epoch": 27
+ },
+ {
+ "hidden_norms": [
+ 4061.806884765625,
+ 222595.921875,
+ 590807.5,
+ 755718.75,
+ 646775.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008092334610410035,
+ 0.0007093537133187056,
+ 0.0007078479393385351,
+ 0.0007069098646752536,
+ 0.0007029378321021795
+ ],
+ "acc_eval": 0.2158203125,
+ "epoch": 28
+ },
+ {
+ "hidden_norms": [
+ 4216.11083984375,
+ 237549.296875,
+ 636429.5625,
+ 816954.9375,
+ 699524.9375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008620031294412911,
+ 0.0007326522027142346,
+ 0.00072627910412848,
+ 0.000725903722923249,
+ 0.0007269763154909015
+ ],
+ "acc_eval": 0.1533203125,
+ "epoch": 29
+ },
+ {
+ "hidden_norms": [
+ 4319.05029296875,
+ 251667.5,
+ 681409.75,
+ 874567.9375,
+ 748820.1875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008448463049717247,
+ 0.0007160686072893441,
+ 0.000714016379788518,
+ 0.0007141274982132018,
+ 0.0007095346227288246
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 30
+ },
+ {
+ "hidden_norms": [
+ 4387.8330078125,
+ 268470.375,
+ 733153.125,
+ 943456.375,
+ 808793.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009849616326391697,
+ 0.0007160623208619654,
+ 0.0007154300110414624,
+ 0.0007152247708290815,
+ 0.0007160453242249787
+ ],
+ "acc_eval": 0.1884765625,
+ "epoch": 31
+ },
+ {
+ "hidden_norms": [
+ 4495.54638671875,
+ 291274.59375,
+ 806698.75,
+ 1039374.875,
+ 892062.1875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008646573405712843,
+ 0.000731874315533787,
+ 0.0007177238585427403,
+ 0.0007205329020507634,
+ 0.0007192457560449839
+ ],
+ "acc_eval": 0.17578125,
+ "epoch": 32
+ },
+ {
+ "hidden_norms": [
+ 4596.96337890625,
+ 305228.46875,
+ 848072.5625,
+ 1092268.625,
+ 937583.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009474663529545069,
+ 0.0007221641135402024,
+ 0.000721680698916316,
+ 0.0007284134044311941,
+ 0.0007212713244371116
+ ],
+ "acc_eval": 0.171875,
+ "epoch": 33
+ },
+ {
+ "hidden_norms": [
+ 4724.111328125,
+ 321366.5,
+ 891238.9375,
+ 1149886.25,
+ 987910.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009131877450272441,
+ 0.0007397676818072796,
+ 0.0007398735033348203,
+ 0.0007397927111014724,
+ 0.0007406016811728477
+ ],
+ "acc_eval": 0.125,
+ "epoch": 34
+ },
+ {
+ "hidden_norms": [
+ 4865.970703125,
+ 344027.15625,
+ 946722.0625,
+ 1219714.625,
+ 1049445.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001010064734145999,
+ 0.0007341124583035707,
+ 0.0007336883572861552,
+ 0.0007345521007664502,
+ 0.0007338698487728834
+ ],
+ "acc_eval": 0.119140625,
+ "epoch": 35
+ },
+ {
+ "hidden_norms": [
+ 5003.3857421875,
+ 373410.21875,
+ 1026535.0625,
+ 1321456.25,
+ 1139824.625
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010555180488154292,
+ 0.0007112861494533718,
+ 0.0007111895247362554,
+ 0.0007112334715202451,
+ 0.000711193191818893
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 36
+ },
+ {
+ "hidden_norms": [
+ 5121.19287109375,
+ 405646.9375,
+ 1111111.125,
+ 1430716.625,
+ 1237074.375
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010308363707736135,
+ 0.0007563655963167548,
+ 0.0007560031372122467,
+ 0.000755665882024914,
+ 0.0007561628590337932
+ ],
+ "acc_eval": 0.134765625,
+ "epoch": 37
+ },
+ {
+ "hidden_norms": [
+ 5212.7294921875,
+ 434054.15625,
+ 1180238.125,
+ 1518019.875,
+ 1314350.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001035128254443407,
+ 0.0007314062095247209,
+ 0.0007304889149963856,
+ 0.0007291524088941514,
+ 0.0007313747191801667
+ ],
+ "acc_eval": 0.140625,
+ "epoch": 38
+ },
+ {
+ "hidden_norms": [
+ 5322.74951171875,
+ 462000.6875,
+ 1248006.75,
+ 1606243.125,
+ 1392563.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009023830061778426,
+ 0.000720554031431675,
+ 0.0007195135112851858,
+ 0.0007197313825599849,
+ 0.0007196948863565922
+ ],
+ "acc_eval": 0.1708984375,
+ "epoch": 39
+ },
+ {
+ "hidden_norms": [
+ 5453.89111328125,
+ 498941.0625,
+ 1343521.0,
+ 1731177.375,
+ 1504101.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010444134240970016,
+ 0.0007362678297795355,
+ 0.0007352089160121977,
+ 0.0007340405718423426,
+ 0.0007357052527368069
+ ],
+ "acc_eval": 0.1328125,
+ "epoch": 40
+ },
+ {
+ "hidden_norms": [
+ 5515.6982421875,
+ 529817.75,
+ 1409505.625,
+ 1816151.0,
+ 1580539.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011280628386884928,
+ 0.0007231750059872866,
+ 0.0007211649208329618,
+ 0.000721275107935071,
+ 0.0007212632917799056
+ ],
+ "acc_eval": 0.1611328125,
+ "epoch": 41
+ },
+ {
+ "hidden_norms": [
+ 5617.26513671875,
+ 567492.4375,
+ 1498097.5,
+ 1931607.875,
+ 1684206.875
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010544253746047616,
+ 0.0007354306289926171,
+ 0.0007348860381171107,
+ 0.0007349851075559855,
+ 0.0007350810337811708
+ ],
+ "acc_eval": 0.1416015625,
+ "epoch": 42
+ },
+ {
+ "hidden_norms": [
+ 5740.7978515625,
+ 596215.625,
+ 1561745.25,
+ 2014107.25,
+ 1758526.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010764201870188117,
+ 0.0007244387525133789,
+ 0.000723967794328928,
+ 0.000724096957128495,
+ 0.0007241644198074937
+ ],
+ "acc_eval": 0.19921875,
+ "epoch": 43
+ },
+ {
+ "hidden_norms": [
+ 5808.19677734375,
+ 630780.3125,
+ 1636034.875,
+ 2109305.75,
+ 1845552.125
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010526466649025679,
+ 0.0007206913433037698,
+ 0.0007207048474811018,
+ 0.0007211468764580786,
+ 0.0007207895396277308
+ ],
+ "acc_eval": 0.173828125,
+ "epoch": 44
+ },
+ {
+ "hidden_norms": [
+ 5868.3583984375,
+ 673578.625,
+ 1729325.25,
+ 2227518.0,
+ 1953361.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009479392319917679,
+ 0.0007091389270499349,
+ 0.0007090644794516265,
+ 0.0007082624360918999,
+ 0.0007085782708600163
+ ],
+ "acc_eval": 0.1923828125,
+ "epoch": 45
+ },
+ {
+ "hidden_norms": [
+ 5953.82421875,
+ 720273.0,
+ 1840695.5,
+ 2372038.0,
+ 2084658.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0014002618845552206,
+ 0.0007315247785300016,
+ 0.0007256051758304238,
+ 0.0007254919619299471,
+ 0.000725599646102637
+ ],
+ "acc_eval": 0.17578125,
+ "epoch": 46
+ },
+ {
+ "hidden_norms": [
+ 6054.7861328125,
+ 758000.6875,
+ 1930354.375,
+ 2488163.75,
+ 2190582.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001109408913180232,
+ 0.0007018125616014004,
+ 0.0007016566814854741,
+ 0.000701890152413398,
+ 0.0007018494652584195
+ ],
+ "acc_eval": 0.203125,
+ "epoch": 47
+ },
+ {
+ "hidden_norms": [
+ 6155.0859375,
+ 790443.0,
+ 2009565.875,
+ 2590829.25,
+ 2285268.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010253023356199265,
+ 0.0007347314967773855,
+ 0.0007304528844542801,
+ 0.0007322027231566608,
+ 0.0007312395609915257
+ ],
+ "acc_eval": 0.154296875,
+ "epoch": 48
+ },
+ {
+ "hidden_norms": [
+ 6216.64453125,
+ 830678.125,
+ 2088773.5,
+ 2691122.0,
+ 2376731.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010403504129499197,
+ 0.0006902964669279754,
+ 0.0006906419876031578,
+ 0.0006905900663696229,
+ 0.0006906461785547435
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 49
+ },
+ {
+ "hidden_norms": [
+ 6252.98486328125,
+ 867790.1875,
+ 2159729.75,
+ 2781409.5,
+ 2460902.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0011370684951543808,
+ 0.0007390088285319507,
+ 0.0007305812323465943,
+ 0.0007310720975510776,
+ 0.0007304322207346559
+ ],
+ "acc_eval": 0.15234375,
+ "epoch": 50
+ },
+ {
+ "hidden_norms": [
+ 6294.51611328125,
+ 897267.5625,
+ 2218282.5,
+ 2858224.75,
+ 2530432.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0013790406519547105,
+ 0.0007320911972783506,
+ 0.0007304649334400892,
+ 0.0007293879170902073,
+ 0.0007303770980797708
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 51
+ },
+ {
+ "hidden_norms": [
+ 6312.2314453125,
+ 935570.375,
+ 2299086.0,
+ 2963619.0,
+ 2627515.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000999285257421434,
+ 0.0007227054447866976,
+ 0.0007246703025884926,
+ 0.0007245387532748282,
+ 0.0007243558065965772
+ ],
+ "acc_eval": 0.20703125,
+ "epoch": 52
+ },
+ {
+ "hidden_norms": [
+ 6387.30322265625,
+ 977101.125,
+ 2387243.0,
+ 3077676.25,
+ 2733147.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001396833686158061,
+ 0.0007110408041626215,
+ 0.0007093287422321737,
+ 0.000708233390469104,
+ 0.0007085108081810176
+ ],
+ "acc_eval": 0.1787109375,
+ "epoch": 53
+ },
+ {
+ "hidden_norms": [
+ 6406.59033203125,
+ 1011753.1875,
+ 2450391.25,
+ 3158275.0,
+ 2807055.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0012408416951075196,
+ 0.0007304692408069968,
+ 0.000724659999832511,
+ 0.0007247650064527988,
+ 0.0007249858463183045
+ ],
+ "acc_eval": 0.130859375,
+ "epoch": 54
+ },
+ {
+ "hidden_norms": [
+ 6396.32080078125,
+ 1051044.375,
+ 2521085.5,
+ 3249326.75,
+ 2890642.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010854896390810609,
+ 0.0006957638543099165,
+ 0.0006896257400512695,
+ 0.0006964386557228863,
+ 0.0006897017010487616
+ ],
+ "acc_eval": 0.234375,
+ "epoch": 55
+ },
+ {
+ "hidden_norms": [
+ 6413.91357421875,
+ 1083474.5,
+ 2597945.5,
+ 3348271.5,
+ 2981405.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.00098806235473603,
+ 0.000719150179065764,
+ 0.0007170068565756083,
+ 0.0007178731029853225,
+ 0.0007173708290793002
+ ],
+ "acc_eval": 0.205078125,
+ "epoch": 56
+ },
+ {
+ "hidden_norms": [
+ 6406.4228515625,
+ 1124429.875,
+ 2675529.5,
+ 3447474.25,
+ 3073241.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001149638439528644,
+ 0.0007225789595395327,
+ 0.0007212197524495423,
+ 0.0007210947806015611,
+ 0.0007211659685708582
+ ],
+ "acc_eval": 0.1494140625,
+ "epoch": 57
+ },
+ {
+ "hidden_norms": [
+ 6443.423828125,
+ 1166184.375,
+ 2758561.25,
+ 3551879.75,
+ 3171214.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.001115654013119638,
+ 0.000685695675201714,
+ 0.0006846366450190544,
+ 0.0006861463189125061,
+ 0.0006862673326395452
+ ],
+ "acc_eval": 0.2490234375,
+ "epoch": 58
+ },
+ {
+ "hidden_norms": [
+ 6477.5,
+ 1208826.0,
+ 2842194.75,
+ 3654862.0,
+ 3267617.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000923235435038805,
+ 0.0006659153732471168,
+ 0.0006642267107963562,
+ 0.0006722065154463053,
+ 0.000664416525978595
+ ],
+ "acc_eval": 0.2353515625,
+ "epoch": 59
+ },
+ {
+ "hidden_norms": [
+ 6486.1689453125,
+ 1249377.0,
+ 2928293.75,
+ 3765881.75,
+ 3370835.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008846685523167253,
+ 0.0006866253679618239,
+ 0.000686973100528121,
+ 0.0006869880016893148,
+ 0.0006870955694466829
+ ],
+ "acc_eval": 0.2373046875,
+ "epoch": 60
+ },
+ {
+ "hidden_norms": [
+ 6499.3720703125,
+ 1291233.25,
+ 3012714.75,
+ 3873429.75,
+ 3471234.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009820004925131798,
+ 0.0007174524944275618,
+ 0.0007178467349149287,
+ 0.0007176626822911203,
+ 0.0007174718775786459
+ ],
+ "acc_eval": 0.216796875,
+ "epoch": 61
+ },
+ {
+ "hidden_norms": [
+ 6486.14404296875,
+ 1327247.75,
+ 3088322.75,
+ 3971415.75,
+ 3562299.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010241338750347495,
+ 0.0007171124452725053,
+ 0.0007174332858994603,
+ 0.0007172181503847241,
+ 0.0007169945747591555
+ ],
+ "acc_eval": 0.18359375,
+ "epoch": 62
+ },
+ {
+ "hidden_norms": [
+ 6455.17236328125,
+ 1355067.375,
+ 3142698.25,
+ 4041006.5,
+ 3627490.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009781530825421214,
+ 0.0007034538430161774,
+ 0.000703376077581197,
+ 0.0007118352805264294,
+ 0.0007080681971274316
+ ],
+ "acc_eval": 0.189453125,
+ "epoch": 63
+ },
+ {
+ "hidden_norms": [
+ 6454.62841796875,
+ 1384795.75,
+ 3199654.0,
+ 4114095.75,
+ 3696468.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009227422997355461,
+ 0.0007023688522167504,
+ 0.0007012909045442939,
+ 0.0007004260551184416,
+ 0.0007006779196672142
+ ],
+ "acc_eval": 0.21484375,
+ "epoch": 64
+ },
+ {
+ "hidden_norms": [
+ 6451.345703125,
+ 1420232.75,
+ 3260116.5,
+ 4190244.25,
+ 3768354.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008870494784787297,
+ 0.0007146014831960201,
+ 0.0007149986922740936,
+ 0.0007148014265112579,
+ 0.0007145918207243085
+ ],
+ "acc_eval": 0.197265625,
+ "epoch": 65
+ },
+ {
+ "hidden_norms": [
+ 6445.890625,
+ 1448264.875,
+ 3319505.0,
+ 4267505.0,
+ 3840047.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0010003555798903108,
+ 0.0007171350298449397,
+ 0.0007168895681388676,
+ 0.0007169176824390888,
+ 0.0007170233875513077
+ ],
+ "acc_eval": 0.1591796875,
+ "epoch": 66
+ },
+ {
+ "hidden_norms": [
+ 6440.8212890625,
+ 1478082.75,
+ 3376291.25,
+ 4340727.0,
+ 3909334.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009646597318351269,
+ 0.0007130720769055188,
+ 0.0007134011830203235,
+ 0.0007131980964913964,
+ 0.0007129770237952471
+ ],
+ "acc_eval": 0.171875,
+ "epoch": 67
+ },
+ {
+ "hidden_norms": [
+ 6398.03955078125,
+ 1508487.5,
+ 3436526.25,
+ 4417271.5,
+ 3981251.75
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009445869363844395,
+ 0.0007122856914065778,
+ 0.0007126569980755448,
+ 0.0007124742260202765,
+ 0.0007122504175640643
+ ],
+ "acc_eval": 0.189453125,
+ "epoch": 68
+ },
+ {
+ "hidden_norms": [
+ 6389.02392578125,
+ 1530834.625,
+ 3480246.5,
+ 4471170.0,
+ 4032576.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009853171650320292,
+ 0.0006874292739666998,
+ 0.0006876476109027863,
+ 0.0006881517474539578,
+ 0.0006880395230837166
+ ],
+ "acc_eval": 0.1904296875,
+ "epoch": 69
+ },
+ {
+ "hidden_norms": [
+ 6338.54443359375,
+ 1561198.875,
+ 3541681.5,
+ 4548099.0,
+ 4105499.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009333671187050641,
+ 0.0006952910916879773,
+ 0.0006947650690563023,
+ 0.0006940987077541649,
+ 0.0006943742628209293
+ ],
+ "acc_eval": 0.23046875,
+ "epoch": 70
+ },
+ {
+ "hidden_norms": [
+ 6280.18603515625,
+ 1585008.0,
+ 3589125.25,
+ 4608667.0,
+ 4162480.25
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009699579677544534,
+ 0.0007101434166543186,
+ 0.0007104446412995458,
+ 0.000710242718923837,
+ 0.0007100136135704815
+ ],
+ "acc_eval": 0.146484375,
+ "epoch": 71
+ },
+ {
+ "hidden_norms": [
+ 6252.455078125,
+ 1608187.875,
+ 3635014.75,
+ 4667478.5,
+ 4218253.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008955001248978078,
+ 0.0006863236776553094,
+ 0.0006864941096864641,
+ 0.000687020889017731,
+ 0.0006868807831779122
+ ],
+ "acc_eval": 0.2431640625,
+ "epoch": 72
+ },
+ {
+ "hidden_norms": [
+ 6201.6845703125,
+ 1619508.875,
+ 3661275.25,
+ 4700652.0,
+ 4249921.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009069991065189242,
+ 0.0006539999740198255,
+ 0.0006531713879667222,
+ 0.0006594359292648733,
+ 0.000653320224955678
+ ],
+ "acc_eval": 0.2216796875,
+ "epoch": 73
+ },
+ {
+ "hidden_norms": [
+ 6182.8115234375,
+ 1632587.875,
+ 3679586.25,
+ 4722070.5,
+ 4271567.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009595821611583233,
+ 0.0007079984061419964,
+ 0.0007082773372530937,
+ 0.0007081056828610599,
+ 0.000707884959410876
+ ],
+ "acc_eval": 0.193359375,
+ "epoch": 74
+ },
+ {
+ "hidden_norms": [
+ 6153.7392578125,
+ 1653576.875,
+ 3722935.0,
+ 4776921.0,
+ 4323508.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008598894928582013,
+ 0.0007073319284245372,
+ 0.0007075938628986478,
+ 0.0007074539898894727,
+ 0.0007072555599734187
+ ],
+ "acc_eval": 0.201171875,
+ "epoch": 75
+ },
+ {
+ "hidden_norms": [
+ 6135.21240234375,
+ 1667474.375,
+ 3750912.75,
+ 4812450.5,
+ 4357575.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0009454588289372623,
+ 0.0007068001432344317,
+ 0.0007069715647958219,
+ 0.0007067638216540217,
+ 0.0007065933896228671
+ ],
+ "acc_eval": 0.2158203125,
+ "epoch": 76
+ },
+ {
+ "hidden_norms": [
+ 6085.7109375,
+ 1679251.75,
+ 3774334.5,
+ 4840148.5,
+ 4384792.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008410231093876064,
+ 0.0006843701121397316,
+ 0.0006845371681265533,
+ 0.00068506138632074,
+ 0.0006849151104688644
+ ],
+ "acc_eval": 0.2578125,
+ "epoch": 77
+ },
+ {
+ "hidden_norms": [
+ 6042.693359375,
+ 1685705.5,
+ 3787479.75,
+ 4856211.0,
+ 4400193.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008572259685024619,
+ 0.0006840305286459625,
+ 0.0006841861759312451,
+ 0.0006847094628028572,
+ 0.0006845552125014365
+ ],
+ "acc_eval": 0.2568359375,
+ "epoch": 78
+ },
+ {
+ "hidden_norms": [
+ 6003.5390625,
+ 1702685.5,
+ 3813174.5,
+ 4888481.0,
+ 4430612.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008342780056409538,
+ 0.0006777377566322684,
+ 0.0006779460818506777,
+ 0.0006789933540858328,
+ 0.0006781259435229003
+ ],
+ "acc_eval": 0.2685546875,
+ "epoch": 79
+ },
+ {
+ "hidden_norms": [
+ 5948.60107421875,
+ 1714243.125,
+ 3830846.5,
+ 4910337.5,
+ 4451921.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008218465954996645,
+ 0.0006832804065197706,
+ 0.0006831764476373792,
+ 0.0006826326716691256,
+ 0.0006829035119153559
+ ],
+ "acc_eval": 0.2529296875,
+ "epoch": 80
+ },
+ {
+ "hidden_norms": [
+ 5881.8525390625,
+ 1718113.375,
+ 3838036.5,
+ 4920025.5,
+ 4461931.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007958809728734195,
+ 0.000677398347761482,
+ 0.0006775528891012073,
+ 0.0006775871734134853,
+ 0.0006777321686968207
+ ],
+ "acc_eval": 0.2548828125,
+ "epoch": 81
+ },
+ {
+ "hidden_norms": [
+ 5816.7880859375,
+ 1723461.25,
+ 3850904.75,
+ 4936806.0,
+ 4478473.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008361428044736385,
+ 0.0006769691244699061,
+ 0.0006771331536583602,
+ 0.0006771665066480637,
+ 0.0006773129571229219
+ ],
+ "acc_eval": 0.251953125,
+ "epoch": 82
+ },
+ {
+ "hidden_norms": [
+ 5760.41845703125,
+ 1732135.25,
+ 3859576.0,
+ 4947171.0,
+ 4488986.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008036325452849269,
+ 0.0006821549613960087,
+ 0.0006806753808632493,
+ 0.0006799713592045009,
+ 0.0006802318384870887
+ ],
+ "acc_eval": 0.2490234375,
+ "epoch": 83
+ },
+ {
+ "hidden_norms": [
+ 5710.22998046875,
+ 1740014.25,
+ 3871992.25,
+ 4962337.5,
+ 4503463.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008278922759927809,
+ 0.0006754198693670332,
+ 0.000675307004712522,
+ 0.0006768241291865706,
+ 0.0006769676692783833
+ ],
+ "acc_eval": 0.26171875,
+ "epoch": 84
+ },
+ {
+ "hidden_norms": [
+ 5685.73828125,
+ 1745863.25,
+ 3880256.75,
+ 4973639.5,
+ 4514457.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008255501161329448,
+ 0.0006466225022450089,
+ 0.0006466452032327652,
+ 0.0006467151688411832,
+ 0.0006467655766755342
+ ],
+ "acc_eval": 0.283203125,
+ "epoch": 85
+ },
+ {
+ "hidden_norms": [
+ 5637.498046875,
+ 1743128.375,
+ 3879796.5,
+ 4973009.0,
+ 4514424.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008148956694640219,
+ 0.0006465681362897158,
+ 0.0006463592289946973,
+ 0.0006491504609584808,
+ 0.0006464755861088634
+ ],
+ "acc_eval": 0.2587890625,
+ "epoch": 86
+ },
+ {
+ "hidden_norms": [
+ 5601.87744140625,
+ 1741859.375,
+ 3884447.75,
+ 4978445.5,
+ 4518886.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008254973217844963,
+ 0.0006783050484955311,
+ 0.0006774527719244361,
+ 0.0006768335006199777,
+ 0.0006770920008420944
+ ],
+ "acc_eval": 0.298828125,
+ "epoch": 87
+ },
+ {
+ "hidden_norms": [
+ 5587.505859375,
+ 1748285.875,
+ 3887730.5,
+ 4982144.0,
+ 4523151.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008113561780191958,
+ 0.0006764904828742146,
+ 0.000676542054861784,
+ 0.0006762324483133852,
+ 0.0006764894351363182
+ ],
+ "acc_eval": 0.2734375,
+ "epoch": 88
+ },
+ {
+ "hidden_norms": [
+ 5553.013671875,
+ 1748456.75,
+ 3890722.0,
+ 4986538.5,
+ 4527315.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007909060223028064,
+ 0.0006763285491615534,
+ 0.0006762049742974341,
+ 0.0006756742368452251,
+ 0.000675930583383888
+ ],
+ "acc_eval": 0.2861328125,
+ "epoch": 89
+ },
+ {
+ "hidden_norms": [
+ 5524.611328125,
+ 1748210.0,
+ 3893003.75,
+ 4989732.5,
+ 4530436.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.000797618820797652,
+ 0.0006453269743360579,
+ 0.0006453663809224963,
+ 0.0006454290705733001,
+ 0.0006454723770730197
+ ],
+ "acc_eval": 0.28515625,
+ "epoch": 90
+ },
+ {
+ "hidden_norms": [
+ 5506.21923828125,
+ 1750958.0,
+ 3894639.5,
+ 4992073.0,
+ 4532399.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007834367570467293,
+ 0.0006762953125871718,
+ 0.0006754640489816666,
+ 0.0006748714949935675,
+ 0.0006751226610504091
+ ],
+ "acc_eval": 0.2939453125,
+ "epoch": 91
+ },
+ {
+ "hidden_norms": [
+ 5485.10791015625,
+ 1747546.25,
+ 3895030.0,
+ 4992480.5,
+ 4532805.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007779909064993262,
+ 0.0006450997898355126,
+ 0.0006451247027143836,
+ 0.0006455867551267147,
+ 0.0006452234229072928
+ ],
+ "acc_eval": 0.2890625,
+ "epoch": 92
+ },
+ {
+ "hidden_norms": [
+ 5464.07763671875,
+ 1749313.125,
+ 3894610.75,
+ 4991684.0,
+ 4532270.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0008090221090242267,
+ 0.0006661301013082266,
+ 0.0006646219990216196,
+ 0.0006726695573888719,
+ 0.0006649038987234235
+ ],
+ "acc_eval": 0.283203125,
+ "epoch": 93
+ },
+ {
+ "hidden_norms": [
+ 5451.2841796875,
+ 1749389.0,
+ 3894315.25,
+ 4990837.5,
+ 4531011.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007907215040177107,
+ 0.0006448677740991116,
+ 0.0006448915228247643,
+ 0.0006451430963352323,
+ 0.0006449950742535293
+ ],
+ "acc_eval": 0.2958984375,
+ "epoch": 94
+ },
+ {
+ "hidden_norms": [
+ 5437.77099609375,
+ 1750653.125,
+ 3895251.75,
+ 4992303.0,
+ 4532441.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007774807745590806,
+ 0.000676269584801048,
+ 0.0006763145211152732,
+ 0.0006763775018043816,
+ 0.000676501716952771
+ ],
+ "acc_eval": 0.2763671875,
+ "epoch": 95
+ },
+ {
+ "hidden_norms": [
+ 5427.34619140625,
+ 1751408.875,
+ 3894547.75,
+ 4991554.5,
+ 4532145.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007797307334840298,
+ 0.000664835621137172,
+ 0.0006642266525886953,
+ 0.000671364541631192,
+ 0.0006645115208812058
+ ],
+ "acc_eval": 0.296875,
+ "epoch": 96
+ },
+ {
+ "hidden_norms": [
+ 5420.30615234375,
+ 1751757.5,
+ 3894027.5,
+ 4991042.0,
+ 4531674.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007797667058184743,
+ 0.0006446840125136077,
+ 0.0006447113119065762,
+ 0.0006447701598517597,
+ 0.0006448116037063301
+ ],
+ "acc_eval": 0.2939453125,
+ "epoch": 97
+ },
+ {
+ "hidden_norms": [
+ 5416.81396484375,
+ 1751629.625,
+ 3893959.25,
+ 4991021.5,
+ 4531639.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007706825854256749,
+ 0.0006446407060138881,
+ 0.0006406756583601236,
+ 0.0006447536870837212,
+ 0.0006393496878445148
+ ],
+ "acc_eval": 0.306640625,
+ "epoch": 98
+ },
+ {
+ "hidden_norms": [
+ 5415.3095703125,
+ 1751552.75,
+ 3893897.0,
+ 4990973.0,
+ 4531587.5
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007776900893077254,
+ 0.0006458400748670101,
+ 0.0006446869228966534,
+ 0.0006466003833338618,
+ 0.0006447876221500337
+ ],
+ "acc_eval": 0.2978515625,
+ "epoch": 99
+ },
+ {
+ "hidden_norms": [
+ 5414.92822265625,
+ 1751530.25,
+ 3893876.5,
+ 4990954.0,
+ 4531568.0
+ ],
+ "bp_grad_norms_per_sample_med": [
+ 0.0007761479937471449,
+ 0.0006465426995418966,
+ 0.0006446881452575326,
+ 0.0006466349004767835,
+ 0.0006447875639423728
+ ],
+ "acc_eval": 0.294921875,
+ "epoch": 100
+ }
+ ],
+ "arch": "resmlp_noln",
+ "seed": 42
+} \ No newline at end of file