diff options
| author | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
|---|---|---|
| committer | YurenHao0426 <blackhao0426@gmail.com> | 2026-01-13 23:49:05 -0600 |
| commit | cd99d6b874d9d09b3bb87b8485cc787885af71f1 (patch) | |
| tree | 59a233959932ca0e4f12f196275e07fcf443b33f /runs/depth_scaling_asymm/cifar100_20260101-112330/results.json | |
init commit
Diffstat (limited to 'runs/depth_scaling_asymm/cifar100_20260101-112330/results.json')
| -rw-r--r-- | runs/depth_scaling_asymm/cifar100_20260101-112330/results.json | 16822 |
1 files changed, 16822 insertions, 0 deletions
diff --git a/runs/depth_scaling_asymm/cifar100_20260101-112330/results.json b/runs/depth_scaling_asymm/cifar100_20260101-112330/results.json new file mode 100644 index 0000000..6c6da3b --- /dev/null +++ b/runs/depth_scaling_asymm/cifar100_20260101-112330/results.json @@ -0,0 +1,16822 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 4.348092296829224, + "train_acc": 0.09724, + "test_loss": 3.5478567863464354, + "test_acc": 0.1787, + "lyapunov": null, + "grad_norm": 6.316536759043694, + "grad_max_sv": 4.902881336212158, + "grad_min_sv": 1.1448865706586986e-07, + "grad_condition": 88191421.7926497, + "lr": 0.0009998903417374227, + "time_sec": 17.679682731628418 + }, + { + "epoch": 2, + "train_loss": 3.49050922706604, + "train_acc": 0.1874, + "test_loss": 3.2633129741668703, + "test_acc": 0.2305, + "lyapunov": null, + "grad_norm": 4.4801349556346395, + "grad_max_sv": 3.2215479910373688, + "grad_min_sv": 8.299195606298326e-08, + "grad_condition": 121110274.52327952, + "lr": 0.0009995614150494292, + "time_sec": 15.735185623168945 + }, + { + "epoch": 3, + "train_loss": 3.0170057023620607, + "train_acc": 0.25916, + "test_loss": 2.9698277725219726, + "test_acc": 0.277, + "lyapunov": null, + "grad_norm": 3.5133664087504743, + "grad_max_sv": 2.335329008102417, + "grad_min_sv": 6.557634772974552e-08, + "grad_condition": 39177377.20397766, + "lr": 0.0009990133642141358, + "time_sec": 15.478843212127686 + }, + { + "epoch": 4, + "train_loss": 2.72460933883667, + "train_acc": 0.31376, + "test_loss": 2.5551274646759032, + "test_acc": 0.3459, + "lyapunov": null, + "grad_norm": 2.9634417699116904, + "grad_max_sv": 1.8090383648872375, + "grad_min_sv": 5.484415814827059e-08, + "grad_condition": 38079849.47138412, + "lr": 0.0009982464296247522, + "time_sec": 15.453156232833862 + }, + { + "epoch": 5, + "train_loss": 2.490703504867554, + "train_acc": 0.35894, + "test_loss": 2.7182868785858156, + "test_acc": 0.3267, + "lyapunov": null, + "grad_norm": 2.6429461818460145, + "grad_max_sv": 1.5860196590423583, + "grad_min_sv": 4.9649662298145714e-08, + "grad_condition": 58850970.75600495, + "lr": 0.0009972609476841367, + "time_sec": 15.466280460357666 + }, + { + "epoch": 6, + "train_loss": 2.3172771724700927, + "train_acc": 0.39578, + "test_loss": 2.39353342666626, + "test_acc": 0.3858, + "lyapunov": null, + "grad_norm": 2.425728150736765, + "grad_max_sv": 1.3820528209209442, + "grad_min_sv": 4.6181405355394387e-08, + "grad_condition": 48644681.68891229, + "lr": 0.000996057350657239, + "time_sec": 15.472876071929932 + }, + { + "epoch": 7, + "train_loss": 2.1795343031311036, + "train_acc": 0.42514, + "test_loss": 2.5081939483642577, + "test_acc": 0.3733, + "lyapunov": null, + "grad_norm": 2.261531612589412, + "grad_max_sv": 1.2684625327587127, + "grad_min_sv": 4.360769899069972e-08, + "grad_condition": 42250330.837381184, + "lr": 0.000994636166481494, + "time_sec": 15.466506242752075 + }, + { + "epoch": 8, + "train_loss": 2.0688308012390135, + "train_acc": 0.44974, + "test_loss": 2.4493139656066893, + "test_acc": 0.3851, + "lyapunov": null, + "grad_norm": 2.118981579627668, + "grad_max_sv": 1.159741823375225, + "grad_min_sv": 4.073619567137449e-08, + "grad_condition": 437927531.63442343, + "lr": 0.0009929980185352525, + "time_sec": 15.472336769104004 + }, + { + "epoch": 9, + "train_loss": 1.9493904537963866, + "train_acc": 0.47454, + "test_loss": 2.441312085723877, + "test_acc": 0.389, + "lyapunov": null, + "grad_norm": 1.9875075491821204, + "grad_max_sv": 1.0529514640569686, + "grad_min_sv": 3.8403542657050595e-08, + "grad_condition": 87931604.40353736, + "lr": 0.0009911436253643444, + "time_sec": 15.4936044216156 + }, + { + "epoch": 10, + "train_loss": 1.858957971572876, + "train_acc": 0.4983, + "test_loss": 2.183478004837036, + "test_acc": 0.4383, + "lyapunov": null, + "grad_norm": 1.8688341406216382, + "grad_max_sv": 0.9524922624230385, + "grad_min_sv": 3.567054506770084e-08, + "grad_condition": 37551442.84495841, + "lr": 0.0009890738003669028, + "time_sec": 15.46358847618103 + }, + { + "epoch": 11, + "train_loss": 1.7630364864730834, + "train_acc": 0.51782, + "test_loss": 3.0158682430267336, + "test_acc": 0.3359, + "lyapunov": null, + "grad_norm": 1.7816105917819214, + "grad_max_sv": 0.9029998555779457, + "grad_min_sv": 3.4386650932249904e-08, + "grad_condition": 96253986.02645789, + "lr": 0.00098678945143658, + "time_sec": 15.461369752883911 + }, + { + "epoch": 12, + "train_loss": 1.7038999611282348, + "train_acc": 0.52966, + "test_loss": 2.345099726104736, + "test_acc": 0.4116, + "lyapunov": null, + "grad_norm": 1.703439920745613, + "grad_max_sv": 0.8390393868088722, + "grad_min_sv": 3.2384037166287294e-08, + "grad_condition": 263062888.07930222, + "lr": 0.0009842915805643154, + "time_sec": 15.47589898109436 + }, + { + "epoch": 13, + "train_loss": 1.6350115670394898, + "train_acc": 0.54934, + "test_loss": 2.3178677167892454, + "test_acc": 0.4258, + "lyapunov": null, + "grad_norm": 1.627197475633154, + "grad_max_sv": 0.7804030522704124, + "grad_min_sv": 3.0640796072622935e-08, + "grad_condition": 47339680.420034245, + "lr": 0.000981581283398829, + "time_sec": 15.482157230377197 + }, + { + "epoch": 14, + "train_loss": 1.5789134158706666, + "train_acc": 0.56262, + "test_loss": 3.108631703567505, + "test_acc": 0.3341, + "lyapunov": null, + "grad_norm": 1.5815496416496932, + "grad_max_sv": 0.7780330538749695, + "grad_min_sv": 3.0241727028840204e-08, + "grad_condition": 121072879.52128251, + "lr": 0.0009786597487660333, + "time_sec": 15.469743490219116 + }, + { + "epoch": 15, + "train_loss": 1.5213708932495118, + "train_acc": 0.57622, + "test_loss": 2.1178235721588137, + "test_acc": 0.4665, + "lyapunov": null, + "grad_norm": 1.5137971406754955, + "grad_max_sv": 0.7158914238214493, + "grad_min_sv": 2.8684351333074785e-08, + "grad_condition": 31997486.936446648, + "lr": 0.0009755282581475766, + "time_sec": 15.4898362159729 + }, + { + "epoch": 16, + "train_loss": 1.466670620689392, + "train_acc": 0.58748, + "test_loss": 1.9707215017318727, + "test_acc": 0.4909, + "lyapunov": null, + "grad_norm": 1.4598686481318373, + "grad_max_sv": 0.6799994811415673, + "grad_min_sv": 2.748090726922836e-08, + "grad_condition": 67712877.74998799, + "lr": 0.0009721881851187403, + "time_sec": 15.463284254074097 + }, + { + "epoch": 17, + "train_loss": 1.4266776397705079, + "train_acc": 0.60022, + "test_loss": 1.9578287740707399, + "test_acc": 0.496, + "lyapunov": null, + "grad_norm": 1.4163199382153222, + "grad_max_sv": 0.6607045501470565, + "grad_min_sv": 2.6701706835885463e-08, + "grad_condition": 69925020.646238, + "lr": 0.0009686409947459456, + "time_sec": 15.465324878692627 + }, + { + "epoch": 18, + "train_loss": 1.3868621417999267, + "train_acc": 0.61008, + "test_loss": 1.8873281810760498, + "test_acc": 0.5122, + "lyapunov": null, + "grad_norm": 1.3780415134056272, + "grad_max_sv": 0.6475953251123429, + "grad_min_sv": 2.629753427935144e-08, + "grad_condition": 71849203.49105962, + "lr": 0.0009648882429441254, + "time_sec": 15.476778745651245 + }, + { + "epoch": 19, + "train_loss": 1.3300997947692872, + "train_acc": 0.6208, + "test_loss": 1.8625336185455321, + "test_acc": 0.5163, + "lyapunov": null, + "grad_norm": 1.3376016965348547, + "grad_max_sv": 0.6296016126871109, + "grad_min_sv": 2.534474096427264e-08, + "grad_condition": 40912774.4949669, + "lr": 0.00096093157579425, + "time_sec": 15.47281002998352 + }, + { + "epoch": 20, + "train_loss": 1.2915953662490844, + "train_acc": 0.6313, + "test_loss": 1.88144536113739, + "test_acc": 0.5061, + "lyapunov": null, + "grad_norm": 1.3064427354934414, + "grad_max_sv": 0.5868082754313946, + "grad_min_sv": 2.44614505123808e-08, + "grad_condition": 40190101.53190343, + "lr": 0.0009567727288213001, + "time_sec": 15.473944902420044 + }, + { + "epoch": 21, + "train_loss": 1.2615811933898926, + "train_acc": 0.63936, + "test_loss": 2.138494786453247, + "test_acc": 0.4639, + "lyapunov": null, + "grad_norm": 1.2742362971746195, + "grad_max_sv": 0.577499034255743, + "grad_min_sv": 2.428454916880707e-08, + "grad_condition": 34685614.15402056, + "lr": 0.0009524135262330095, + "time_sec": 15.476754188537598 + }, + { + "epoch": 22, + "train_loss": 1.2293620531463623, + "train_acc": 0.6453, + "test_loss": 1.8758944011688232, + "test_acc": 0.5147, + "lyapunov": null, + "grad_norm": 1.252289309007294, + "grad_max_sv": 0.570976011455059, + "grad_min_sv": 2.3561374129510426e-08, + "grad_condition": 48751943.11700691, + "lr": 0.0009478558801197061, + "time_sec": 15.473217487335205 + }, + { + "epoch": 23, + "train_loss": 1.1897959590911866, + "train_acc": 0.65626, + "test_loss": 1.8954246566772461, + "test_acc": 0.5211, + "lyapunov": null, + "grad_norm": 1.2259155434497018, + "grad_max_sv": 0.5599369831383229, + "grad_min_sv": 2.2801355227530795e-08, + "grad_condition": 52092903.5694242, + "lr": 0.000943101789615607, + "time_sec": 15.473440170288086 + }, + { + "epoch": 24, + "train_loss": 1.1551566465377807, + "train_acc": 0.665, + "test_loss": 1.896939277267456, + "test_acc": 0.5226, + "lyapunov": null, + "grad_norm": 1.2022612803404449, + "grad_max_sv": 0.5331769093871117, + "grad_min_sv": 2.2077526620062348e-08, + "grad_condition": 154376470.85049906, + "lr": 0.0009381533400219313, + "time_sec": 15.473422765731812 + }, + { + "epoch": 25, + "train_loss": 1.13716111492157, + "train_acc": 0.66968, + "test_loss": 1.9673876178741454, + "test_acc": 0.5073, + "lyapunov": null, + "grad_norm": 1.1814644477570717, + "grad_max_sv": 0.5192016668617725, + "grad_min_sv": 2.207178118607267e-08, + "grad_condition": 32052263.833083443, + "lr": 0.0009330127018922189, + "time_sec": 15.463173151016235 + }, + { + "epoch": 26, + "train_loss": 1.0986487645339966, + "train_acc": 0.6787, + "test_loss": 1.7822764610290527, + "test_acc": 0.5433, + "lyapunov": null, + "grad_norm": 1.1543031476624748, + "grad_max_sv": 0.5173374325037002, + "grad_min_sv": 2.149504294557403e-08, + "grad_condition": 47084637.545989394, + "lr": 0.000927682130080253, + "time_sec": 15.460694313049316 + }, + { + "epoch": 27, + "train_loss": 1.0663320102691651, + "train_acc": 0.6865, + "test_loss": 1.8293514751434325, + "test_acc": 0.533, + "lyapunov": null, + "grad_norm": 1.1345054831803263, + "grad_max_sv": 0.4966191992163658, + "grad_min_sv": 2.08524984349201e-08, + "grad_condition": 45914156.60470325, + "lr": 0.0009221639627510072, + "time_sec": 15.467730045318604 + }, + { + "epoch": 28, + "train_loss": 1.0501069176864624, + "train_acc": 0.68934, + "test_loss": 2.0238259536743164, + "test_acc": 0.5084, + "lyapunov": null, + "grad_norm": 1.1176238593171397, + "grad_max_sv": 0.489936176687479, + "grad_min_sv": 2.0258219826652103e-08, + "grad_condition": 52549899.42960344, + "lr": 0.0009164606203550494, + "time_sec": 15.526809692382812 + }, + { + "epoch": 29, + "train_loss": 1.0180758087921142, + "train_acc": 0.69862, + "test_loss": 1.8129717712402345, + "test_acc": 0.5511, + "lyapunov": null, + "grad_norm": 1.0978329669563418, + "grad_max_sv": 0.49835110902786256, + "grad_min_sv": 2.0405637433853347e-08, + "grad_condition": 716037506.8371468, + "lr": 0.0009105746045668516, + "time_sec": 15.492526054382324 + }, + { + "epoch": 30, + "train_loss": 0.9951805596923828, + "train_acc": 0.7055, + "test_loss": 1.746192921257019, + "test_acc": 0.5623, + "lyapunov": null, + "grad_norm": 1.0796441895567979, + "grad_max_sv": 0.47773563787341117, + "grad_min_sv": 1.9923237732071692e-08, + "grad_condition": 316108467.8828658, + "lr": 0.0009045084971874733, + "time_sec": 15.470518827438354 + }, + { + "epoch": 31, + "train_loss": 0.9780883857536316, + "train_acc": 0.70904, + "test_loss": 1.7732117160797118, + "test_acc": 0.558, + "lyapunov": null, + "grad_norm": 1.0645091607080823, + "grad_max_sv": 0.46556121930480004, + "grad_min_sv": 1.9688543108527246e-08, + "grad_condition": 174238515.18129045, + "lr": 0.0008982649590120977, + "time_sec": 15.477237224578857 + }, + { + "epoch": 32, + "train_loss": 0.9519822745513916, + "train_acc": 0.71686, + "test_loss": 1.7432144353866577, + "test_acc": 0.5575, + "lyapunov": null, + "grad_norm": 1.0432923508174365, + "grad_max_sv": 0.46001894399523735, + "grad_min_sv": 1.928787157004508e-08, + "grad_condition": 84996179.20525053, + "lr": 0.0008918467286629196, + "time_sec": 15.482601881027222 + }, + { + "epoch": 33, + "train_loss": 0.9250898433685303, + "train_acc": 0.7218, + "test_loss": 1.7904945095062257, + "test_acc": 0.556, + "lyapunov": null, + "grad_norm": 1.0314496073989632, + "grad_max_sv": 0.45169909074902537, + "grad_min_sv": 1.9128463927403638e-08, + "grad_condition": 68691111.76926772, + "lr": 0.0008852566213878943, + "time_sec": 15.519761800765991 + }, + { + "epoch": 34, + "train_loss": 0.9152010176086426, + "train_acc": 0.72778, + "test_loss": 1.835019757270813, + "test_acc": 0.5553, + "lyapunov": null, + "grad_norm": 1.0226948793120243, + "grad_max_sv": 0.44521483927965166, + "grad_min_sv": 1.8672882064196816e-08, + "grad_condition": 72631593.89558022, + "lr": 0.000878497527825878, + "time_sec": 15.492830753326416 + }, + { + "epoch": 35, + "train_loss": 0.8909054629325867, + "train_acc": 0.72998, + "test_loss": 1.8686577810287475, + "test_acc": 0.5431, + "lyapunov": null, + "grad_norm": 1.0060209353905554, + "grad_max_sv": 0.428337212651968, + "grad_min_sv": 1.8221278065555514e-08, + "grad_condition": 54925799.50217812, + "lr": 0.000871572412738697, + "time_sec": 15.495248556137085 + }, + { + "epoch": 36, + "train_loss": 0.8669569097518921, + "train_acc": 0.7396, + "test_loss": 1.8778275032043457, + "test_acc": 0.5506, + "lyapunov": null, + "grad_norm": 0.9935254761598353, + "grad_max_sv": 0.42610192447900774, + "grad_min_sv": 1.789830566673034e-08, + "grad_condition": 65521171.05971684, + "lr": 0.0008644843137107055, + "time_sec": 15.501812219619751 + }, + { + "epoch": 37, + "train_loss": 0.8407849538421631, + "train_acc": 0.74404, + "test_loss": 1.884768021965027, + "test_acc": 0.5558, + "lyapunov": null, + "grad_norm": 0.983358047025113, + "grad_max_sv": 0.429234990477562, + "grad_min_sv": 1.8252723432699015e-08, + "grad_condition": 312919609.17862236, + "lr": 0.0008572363398164014, + "time_sec": 15.485287427902222 + }, + { + "epoch": 38, + "train_loss": 0.8223714313125611, + "train_acc": 0.74734, + "test_loss": 1.8372897932052612, + "test_acc": 0.5581, + "lyapunov": null, + "grad_norm": 0.9730686293969507, + "grad_max_sv": 0.43215164765715597, + "grad_min_sv": 1.805779136082597e-08, + "grad_condition": 111631952.08398516, + "lr": 0.0008498316702566826, + "time_sec": 15.495893239974976 + }, + { + "epoch": 39, + "train_loss": 0.8224841629219055, + "train_acc": 0.7495, + "test_loss": 1.8123548791885375, + "test_acc": 0.5623, + "lyapunov": null, + "grad_norm": 0.9689754376402935, + "grad_max_sv": 0.41914472356438637, + "grad_min_sv": 1.7533556316562392e-08, + "grad_condition": 50149472.40203967, + "lr": 0.0008422735529643442, + "time_sec": 15.51100492477417 + }, + { + "epoch": 40, + "train_loss": 0.8005770356750488, + "train_acc": 0.75588, + "test_loss": 1.9014682191848755, + "test_acc": 0.5541, + "lyapunov": null, + "grad_norm": 0.9508080469971997, + "grad_max_sv": 0.42388487085700033, + "grad_min_sv": 1.762832624032859e-08, + "grad_condition": 346358468.0799734, + "lr": 0.0008345653031794289, + "time_sec": 15.498661279678345 + }, + { + "epoch": 41, + "train_loss": 0.7747948072814942, + "train_acc": 0.76342, + "test_loss": 1.8567888566970825, + "test_acc": 0.5642, + "lyapunov": null, + "grad_norm": 0.9372391115065106, + "grad_max_sv": 0.4081222198903561, + "grad_min_sv": 1.7018125511580885e-08, + "grad_condition": 61876276.47604829, + "lr": 0.0008267103019950526, + "time_sec": 15.5028657913208 + }, + { + "epoch": 42, + "train_loss": 0.7694620947647095, + "train_acc": 0.76502, + "test_loss": 1.8408411359786987, + "test_acc": 0.5591, + "lyapunov": null, + "grad_norm": 0.9326717735984488, + "grad_max_sv": 0.41085106804966925, + "grad_min_sv": 1.7216302598821454e-08, + "grad_condition": 43901470.16833824, + "lr": 0.0008187119948743447, + "time_sec": 15.496897459030151 + }, + { + "epoch": 43, + "train_loss": 0.7424543988418579, + "train_acc": 0.77306, + "test_loss": 1.809230382347107, + "test_acc": 0.571, + "lyapunov": null, + "grad_norm": 0.9131307159835452, + "grad_max_sv": 0.40560107976198195, + "grad_min_sv": 1.6559755318563962e-08, + "grad_condition": 374063353.4207941, + "lr": 0.000810573890139155, + "time_sec": 15.487475872039795 + }, + { + "epoch": 44, + "train_loss": 0.7239759206962585, + "train_acc": 0.77538, + "test_loss": 1.7808053987503052, + "test_acc": 0.5793, + "lyapunov": null, + "grad_norm": 0.9060005234187932, + "grad_max_sv": 0.39045327603816987, + "grad_min_sv": 1.6347653778933656e-08, + "grad_condition": 175023718.92676198, + "lr": 0.0008022995574311873, + "time_sec": 15.478513240814209 + }, + { + "epoch": 45, + "train_loss": 0.709962793712616, + "train_acc": 0.77894, + "test_loss": 1.9501771980285645, + "test_acc": 0.5602, + "lyapunov": null, + "grad_norm": 0.8987907360568149, + "grad_max_sv": 0.39080821722745895, + "grad_min_sv": 1.634847552334229e-08, + "grad_condition": 38169444.05614711, + "lr": 0.0007938926261462363, + "time_sec": 15.49375057220459 + }, + { + "epoch": 46, + "train_loss": 0.7000335352516174, + "train_acc": 0.78202, + "test_loss": 1.9276861065864563, + "test_acc": 0.563, + "lyapunov": null, + "grad_norm": 0.8939654390908522, + "grad_max_sv": 0.3900447376072407, + "grad_min_sv": 1.6118415283213062e-08, + "grad_condition": 201079781.287968, + "lr": 0.0007853567838422158, + "time_sec": 15.506261825561523 + }, + { + "epoch": 47, + "train_loss": 0.6843666355323792, + "train_acc": 0.78712, + "test_loss": 1.8863512687683106, + "test_acc": 0.5648, + "lyapunov": null, + "grad_norm": 0.8860846821543104, + "grad_max_sv": 0.38012751266360284, + "grad_min_sv": 1.5984218158706515e-08, + "grad_condition": 363331609.5318787, + "lr": 0.0007766957746216719, + "time_sec": 15.481945991516113 + }, + { + "epoch": 48, + "train_loss": 0.6651840719032288, + "train_acc": 0.79232, + "test_loss": 1.826128447341919, + "test_acc": 0.5815, + "lyapunov": null, + "grad_norm": 0.8702032066364243, + "grad_max_sv": 0.37026465982198714, + "grad_min_sv": 1.544788876539638e-08, + "grad_condition": 1805163796.8757565, + "lr": 0.0007679133974894982, + "time_sec": 15.52286958694458 + }, + { + "epoch": 49, + "train_loss": 0.6528418668937683, + "train_acc": 0.79534, + "test_loss": 1.8805492639541626, + "test_acc": 0.5748, + "lyapunov": null, + "grad_norm": 0.8668040159369109, + "grad_max_sv": 0.3801993615925312, + "grad_min_sv": 1.5647269831914333e-08, + "grad_condition": 52007972.99755625, + "lr": 0.000759013504686565, + "time_sec": 15.518036127090454 + }, + { + "epoch": 50, + "train_loss": 0.6436834973526001, + "train_acc": 0.7997, + "test_loss": 1.793442686843872, + "test_acc": 0.5833, + "lyapunov": null, + "grad_norm": 0.8597198609492746, + "grad_max_sv": 0.37670152857899664, + "grad_min_sv": 1.5507358382387677e-08, + "grad_condition": 427721692.1185082, + "lr": 0.0007499999999999998, + "time_sec": 15.534092426300049 + }, + { + "epoch": 51, + "train_loss": 0.6239418637657166, + "train_acc": 0.80486, + "test_loss": 1.9321050287246704, + "test_acc": 0.5702, + "lyapunov": null, + "grad_norm": 0.8414343547264628, + "grad_max_sv": 0.3712430141866207, + "grad_min_sv": 1.5363422166663614e-08, + "grad_condition": 365943262.8213007, + "lr": 0.0007408768370508575, + "time_sec": 15.527155876159668 + }, + { + "epoch": 52, + "train_loss": 0.6170344979095459, + "train_acc": 0.80566, + "test_loss": 1.7804856214523315, + "test_acc": 0.588, + "lyapunov": null, + "grad_norm": 0.8457147724415158, + "grad_max_sv": 0.36000491231679915, + "grad_min_sv": 1.510340268962018e-08, + "grad_condition": 55532260.257321715, + "lr": 0.0007316480175599307, + "time_sec": 15.508218765258789 + }, + { + "epoch": 53, + "train_loss": 0.6110373974990845, + "train_acc": 0.8104, + "test_loss": 2.008984780883789, + "test_acc": 0.5633, + "lyapunov": null, + "grad_norm": 0.8288727311238714, + "grad_max_sv": 0.3595147252082825, + "grad_min_sv": 1.5030111735758744e-08, + "grad_condition": 51249181.30750112, + "lr": 0.0007223175895924635, + "time_sec": 15.506837129592896 + }, + { + "epoch": 54, + "train_loss": 0.5891339810752869, + "train_acc": 0.81566, + "test_loss": 1.8466287677764892, + "test_acc": 0.578, + "lyapunov": null, + "grad_norm": 0.8213597411734475, + "grad_max_sv": 0.3565825395286083, + "grad_min_sv": 1.4749719501978495e-08, + "grad_condition": 570713779.6923382, + "lr": 0.0007128896457825361, + "time_sec": 15.501415491104126 + }, + { + "epoch": 55, + "train_loss": 0.5801966732025147, + "train_acc": 0.81848, + "test_loss": 1.8548430694580078, + "test_acc": 0.5809, + "lyapunov": null, + "grad_norm": 0.815116092241223, + "grad_max_sv": 0.36071729883551595, + "grad_min_sv": 1.4880934259310642e-08, + "grad_condition": 334242266.9087108, + "lr": 0.0007033683215378998, + "time_sec": 15.510899066925049 + }, + { + "epoch": 56, + "train_loss": 0.569889211063385, + "train_acc": 0.82134, + "test_loss": 1.8169442867279053, + "test_acc": 0.5857, + "lyapunov": null, + "grad_norm": 0.8134294920256526, + "grad_max_sv": 0.3643924631178379, + "grad_min_sv": 1.5098616617734152e-08, + "grad_condition": 592439727.9387308, + "lr": 0.0006937577932260512, + "time_sec": 15.496611595153809 + }, + { + "epoch": 57, + "train_loss": 0.5602374402427673, + "train_acc": 0.82158, + "test_loss": 1.915207731628418, + "test_acc": 0.5802, + "lyapunov": null, + "grad_norm": 0.8103201963167868, + "grad_max_sv": 0.3596944443881512, + "grad_min_sv": 1.4392631711435122e-08, + "grad_condition": 84052786.33799395, + "lr": 0.0006840622763423388, + "time_sec": 15.500912427902222 + }, + { + "epoch": 58, + "train_loss": 0.5363558686447144, + "train_acc": 0.83006, + "test_loss": 1.9087711734771728, + "test_acc": 0.579, + "lyapunov": null, + "grad_norm": 0.7940934690943876, + "grad_max_sv": 0.3485556967556477, + "grad_min_sv": 1.4054249935363528e-08, + "grad_condition": 99578456.52402398, + "lr": 0.0006742860236609073, + "time_sec": 15.499320268630981 + }, + { + "epoch": 59, + "train_loss": 0.5240596619415283, + "train_acc": 0.83386, + "test_loss": 1.8847876579284668, + "test_acc": 0.5849, + "lyapunov": null, + "grad_norm": 0.7848942902344976, + "grad_max_sv": 0.3444338757544756, + "grad_min_sv": 1.4203639615807326e-08, + "grad_condition": 1006017198.7685986, + "lr": 0.0006644333233692913, + "time_sec": 15.51360535621643 + }, + { + "epoch": 60, + "train_loss": 0.5250089431381225, + "train_acc": 0.83314, + "test_loss": 1.8497852947235107, + "test_acc": 0.5934, + "lyapunov": null, + "grad_norm": 0.78894564972248, + "grad_max_sv": 0.35073093622922896, + "grad_min_sv": 1.3935465524236857e-08, + "grad_condition": 88013656.03250492, + "lr": 0.0006545084971874734, + "time_sec": 15.508491516113281 + }, + { + "epoch": 61, + "train_loss": 0.5165614600944519, + "train_acc": 0.83506, + "test_loss": 1.8630810359954835, + "test_acc": 0.5874, + "lyapunov": null, + "grad_norm": 0.7829768565092297, + "grad_max_sv": 0.3336628802120686, + "grad_min_sv": 1.3946549117481444e-08, + "grad_condition": 180242934.78653836, + "lr": 0.0006445158984722354, + "time_sec": 15.503038167953491 + }, + { + "epoch": 62, + "train_loss": 0.500950801115036, + "train_acc": 0.83966, + "test_loss": 1.8171254947662354, + "test_acc": 0.5999, + "lyapunov": null, + "grad_norm": 0.7677509624143988, + "grad_max_sv": 0.3256234541535378, + "grad_min_sv": 1.3750762319075793e-08, + "grad_condition": 64445933.52390041, + "lr": 0.0006344599103076324, + "time_sec": 15.505617618560791 + }, + { + "epoch": 63, + "train_loss": 0.48925278188705446, + "train_acc": 0.84414, + "test_loss": 1.9641206827163695, + "test_acc": 0.5824, + "lyapunov": null, + "grad_norm": 0.7625502199233959, + "grad_max_sv": 0.3294233627617359, + "grad_min_sv": 1.32725306221243e-08, + "grad_condition": 1228963257.7671177, + "lr": 0.0006243449435824269, + "time_sec": 15.529828071594238 + }, + { + "epoch": 64, + "train_loss": 0.48350829057693484, + "train_acc": 0.84334, + "test_loss": 1.9596610692977905, + "test_acc": 0.5774, + "lyapunov": null, + "grad_norm": 0.7632750006619222, + "grad_max_sv": 0.3282707162201405, + "grad_min_sv": 1.3222439235009708e-08, + "grad_condition": 124220191.9706742, + "lr": 0.0006141754350553275, + "time_sec": 15.521306037902832 + }, + { + "epoch": 65, + "train_loss": 0.4709274704360962, + "train_acc": 0.84992, + "test_loss": 1.8849371217727662, + "test_acc": 0.5929, + "lyapunov": null, + "grad_norm": 0.7514320426924211, + "grad_max_sv": 0.3312883138656616, + "grad_min_sv": 1.352077347374636e-08, + "grad_condition": 135157839.23060852, + "lr": 0.0006039558454088793, + "time_sec": 15.500089168548584 + }, + { + "epoch": 66, + "train_loss": 0.4579773247909546, + "train_acc": 0.85246, + "test_loss": 1.9383041584968568, + "test_acc": 0.5795, + "lyapunov": null, + "grad_norm": 0.7398296341112965, + "grad_max_sv": 0.32728378027677535, + "grad_min_sv": 1.3280565344621006e-08, + "grad_condition": 870917269.6899513, + "lr": 0.000593690657292862, + "time_sec": 15.498245477676392 + }, + { + "epoch": 67, + "train_loss": 0.4509772509765625, + "train_acc": 0.85632, + "test_loss": 1.9290270626068116, + "test_acc": 0.5832, + "lyapunov": null, + "grad_norm": 0.733532607565585, + "grad_max_sv": 0.3176191322505474, + "grad_min_sv": 1.2820620155827924e-08, + "grad_condition": 563528143.6689861, + "lr": 0.0005833843733580507, + "time_sec": 15.513327360153198 + }, + { + "epoch": 68, + "train_loss": 0.44296426357269286, + "train_acc": 0.85874, + "test_loss": 1.9557575977325439, + "test_acc": 0.5895, + "lyapunov": null, + "grad_norm": 0.7313567414469692, + "grad_max_sv": 0.3311334565281868, + "grad_min_sv": 1.299003317134506e-08, + "grad_condition": 57636313.192167915, + "lr": 0.0005730415142812054, + "time_sec": 15.521730422973633 + }, + { + "epoch": 69, + "train_loss": 0.43896515016555787, + "train_acc": 0.85892, + "test_loss": 1.960878660583496, + "test_acc": 0.5868, + "lyapunov": null, + "grad_norm": 0.7340093422433535, + "grad_max_sv": 0.3193955574184656, + "grad_min_sv": 1.2791151784291576e-08, + "grad_condition": 100597916.68063782, + "lr": 0.0005626666167821517, + "time_sec": 15.51311707496643 + }, + { + "epoch": 70, + "train_loss": 0.4285468480491638, + "train_acc": 0.86298, + "test_loss": 1.9584955738067626, + "test_acc": 0.591, + "lyapunov": null, + "grad_norm": 0.7244061253185728, + "grad_max_sv": 0.31838734485208986, + "grad_min_sv": 1.2623370689458097e-08, + "grad_condition": 256671325.86986813, + "lr": 0.0005522642316338265, + "time_sec": 15.545679569244385 + }, + { + "epoch": 71, + "train_loss": 0.4232082028102875, + "train_acc": 0.863, + "test_loss": 1.9168709438323974, + "test_acc": 0.5946, + "lyapunov": null, + "grad_norm": 0.7235116987420683, + "grad_max_sv": 0.3361910209059715, + "grad_min_sv": 1.3065330882943912e-08, + "grad_condition": 539616293.1861387, + "lr": 0.0005418389216661573, + "time_sec": 15.529778480529785 + }, + { + "epoch": 72, + "train_loss": 0.40893464082717895, + "train_acc": 0.8671, + "test_loss": 1.9778603734970093, + "test_acc": 0.5917, + "lyapunov": null, + "grad_norm": 0.7120788606908913, + "grad_max_sv": 0.3133332245051861, + "grad_min_sv": 1.2864244934573943e-08, + "grad_condition": 599875620.9980721, + "lr": 0.0005313952597646563, + "time_sec": 15.501370429992676 + }, + { + "epoch": 73, + "train_loss": 0.4073019913864136, + "train_acc": 0.86922, + "test_loss": 1.8993178993225097, + "test_acc": 0.6036, + "lyapunov": null, + "grad_norm": 0.7054800561985982, + "grad_max_sv": 0.32210378982126714, + "grad_min_sv": 1.2598049555162874e-08, + "grad_condition": 609078116.1228421, + "lr": 0.0005209378268645994, + "time_sec": 15.514087915420532 + }, + { + "epoch": 74, + "train_loss": 0.38610194705963136, + "train_acc": 0.87514, + "test_loss": 1.9717372917175293, + "test_acc": 0.5877, + "lyapunov": null, + "grad_norm": 0.6876754791376803, + "grad_max_sv": 0.30587312653660775, + "grad_min_sv": 1.228859272620758e-08, + "grad_condition": 287047740.76686746, + "lr": 0.0005104712099416781, + "time_sec": 15.521286249160767 + }, + { + "epoch": 75, + "train_loss": 0.38415311262130736, + "train_acc": 0.87532, + "test_loss": 1.9978297256469726, + "test_acc": 0.5873, + "lyapunov": null, + "grad_norm": 0.6901352414114731, + "grad_max_sv": 0.30640832521021366, + "grad_min_sv": 1.2382189768650464e-08, + "grad_condition": 89574244.76284985, + "lr": 0.0004999999999999996, + "time_sec": 15.522554159164429 + }, + { + "epoch": 76, + "train_loss": 0.38036803808212283, + "train_acc": 0.87676, + "test_loss": 1.9114773050308227, + "test_acc": 0.5941, + "lyapunov": null, + "grad_norm": 0.6862042555811976, + "grad_max_sv": 0.30668022595345973, + "grad_min_sv": 1.2098685775799311e-08, + "grad_condition": 79753720.75813168, + "lr": 0.0004895287900583212, + "time_sec": 15.500049591064453 + }, + { + "epoch": 77, + "train_loss": 0.37699529049873354, + "train_acc": 0.8755, + "test_loss": 1.9144949556350708, + "test_acc": 0.6035, + "lyapunov": null, + "grad_norm": 0.6869175270134545, + "grad_max_sv": 0.30233032815158367, + "grad_min_sv": 1.210133520196388e-08, + "grad_condition": 86138637.5204114, + "lr": 0.0004790621731353997, + "time_sec": 15.553943395614624 + }, + { + "epoch": 78, + "train_loss": 0.3636139490318298, + "train_acc": 0.88226, + "test_loss": 1.9924920860290527, + "test_acc": 0.5927, + "lyapunov": null, + "grad_norm": 0.6711688569608495, + "grad_max_sv": 0.29902654588222505, + "grad_min_sv": 1.1863716191731766e-08, + "grad_condition": 88817475.8392382, + "lr": 0.000468604740235343, + "time_sec": 15.530450820922852 + }, + { + "epoch": 79, + "train_loss": 0.362152115983963, + "train_acc": 0.88426, + "test_loss": 1.924188154411316, + "test_acc": 0.598, + "lyapunov": null, + "grad_norm": 0.6714773282743005, + "grad_max_sv": 0.29965595006942747, + "grad_min_sv": 1.1964831648906583e-08, + "grad_condition": 902616195.7149051, + "lr": 0.00045816107833384175, + "time_sec": 15.498046636581421 + }, + { + "epoch": 80, + "train_loss": 0.35668459805488584, + "train_acc": 0.88318, + "test_loss": 1.9200622287750244, + "test_acc": 0.5961, + "lyapunov": null, + "grad_norm": 0.6691406173146984, + "grad_max_sv": 0.30350013412535193, + "grad_min_sv": 1.2079031691623194e-08, + "grad_condition": 208431932.92374653, + "lr": 0.0004477357683661729, + "time_sec": 15.500086307525635 + }, + { + "epoch": 81, + "train_loss": 0.3465567926597595, + "train_acc": 0.88642, + "test_loss": 1.9750726140975952, + "test_acc": 0.5909, + "lyapunov": null, + "grad_norm": 0.6600906573823067, + "grad_max_sv": 0.3025949317961931, + "grad_min_sv": 1.1841972132921319e-08, + "grad_condition": 833170767.4888487, + "lr": 0.00043733338321784746, + "time_sec": 15.528315544128418 + }, + { + "epoch": 82, + "train_loss": 0.3412511627674103, + "train_acc": 0.88932, + "test_loss": 1.9702592422485352, + "test_acc": 0.5983, + "lyapunov": null, + "grad_norm": 0.6534470838362898, + "grad_max_sv": 0.281625871360302, + "grad_min_sv": 1.1298424867564605e-08, + "grad_condition": 245256269.73618746, + "lr": 0.0004269584857187939, + "time_sec": 15.54018759727478 + }, + { + "epoch": 83, + "train_loss": 0.32986866790771485, + "train_acc": 0.89278, + "test_loss": 1.9833718214035034, + "test_acc": 0.5983, + "lyapunov": null, + "grad_norm": 0.6472964118800569, + "grad_max_sv": 0.2898814812302589, + "grad_min_sv": 1.1219894397937468e-08, + "grad_condition": 67348047.22944725, + "lr": 0.0004166156266419484, + "time_sec": 15.523268938064575 + }, + { + "epoch": 84, + "train_loss": 0.32046857831954956, + "train_acc": 0.89464, + "test_loss": 1.9931445137023927, + "test_acc": 0.5976, + "lyapunov": null, + "grad_norm": 0.6387491891164032, + "grad_max_sv": 0.2859178498387337, + "grad_min_sv": 1.1112689026274158e-08, + "grad_condition": 532191414.5407898, + "lr": 0.0004063093427071373, + "time_sec": 15.5046226978302 + }, + { + "epoch": 85, + "train_loss": 0.31971281969070436, + "train_acc": 0.89616, + "test_loss": 1.919898393058777, + "test_acc": 0.6034, + "lyapunov": null, + "grad_norm": 0.6349502290101287, + "grad_max_sv": 0.2895286176353693, + "grad_min_sv": 1.114760893840749e-08, + "grad_condition": 1708507357.4309907, + "lr": 0.0003960441545911199, + "time_sec": 15.50874662399292 + }, + { + "epoch": 86, + "train_loss": 0.314735742893219, + "train_acc": 0.89802, + "test_loss": 1.9826490537643433, + "test_acc": 0.6039, + "lyapunov": null, + "grad_norm": 0.6374095409599659, + "grad_max_sv": 0.29547037966549394, + "grad_min_sv": 1.1427597929134642e-08, + "grad_condition": 249196257.17434186, + "lr": 0.0003858245649446718, + "time_sec": 15.518042802810669 + }, + { + "epoch": 87, + "train_loss": 0.3056777443599701, + "train_acc": 0.90104, + "test_loss": 2.015980870628357, + "test_acc": 0.5982, + "lyapunov": null, + "grad_norm": 0.6267239770409858, + "grad_max_sv": 0.29190454818308353, + "grad_min_sv": 1.1234584110458944e-08, + "grad_condition": 1983104332.2605565, + "lr": 0.00037565505641757235, + "time_sec": 15.49971318244934 + }, + { + "epoch": 88, + "train_loss": 0.3044772444725037, + "train_acc": 0.90106, + "test_loss": 2.005346726799011, + "test_acc": 0.6026, + "lyapunov": null, + "grad_norm": 0.6293105806437898, + "grad_max_sv": 0.2927882194519043, + "grad_min_sv": 1.12210154674941e-08, + "grad_condition": 178904778.3418693, + "lr": 0.00036554008969236695, + "time_sec": 15.495405673980713 + }, + { + "epoch": 89, + "train_loss": 0.30109511434555053, + "train_acc": 0.90188, + "test_loss": 1.998448072052002, + "test_acc": 0.6034, + "lyapunov": null, + "grad_norm": 0.6266125109308321, + "grad_max_sv": 0.29103793352842333, + "grad_min_sv": 1.1148633635108679e-08, + "grad_condition": 893976917.5132227, + "lr": 0.0003554841015277638, + "time_sec": 15.50434947013855 + }, + { + "epoch": 90, + "train_loss": 0.28917674076080324, + "train_acc": 0.90682, + "test_loss": 1.9980867877960204, + "test_acc": 0.6012, + "lyapunov": null, + "grad_norm": 0.6127659289231001, + "grad_max_sv": 0.29112574011087416, + "grad_min_sv": 1.1166155032202307e-08, + "grad_condition": 348701496.86000526, + "lr": 0.000345491502812526, + "time_sec": 15.520820617675781 + }, + { + "epoch": 91, + "train_loss": 0.2823534561729431, + "train_acc": 0.90822, + "test_loss": 1.9809785503387451, + "test_acc": 0.6052, + "lyapunov": null, + "grad_norm": 0.606268342013339, + "grad_max_sv": 0.27696173191070556, + "grad_min_sv": 1.0846671113454859e-08, + "grad_condition": 248996494.78191227, + "lr": 0.0003355666766307081, + "time_sec": 15.745567321777344 + }, + { + "epoch": 92, + "train_loss": 0.28228991139411924, + "train_acc": 0.91008, + "test_loss": 2.0131442947387694, + "test_acc": 0.6001, + "lyapunov": null, + "grad_norm": 0.6064057382091922, + "grad_max_sv": 0.277644307166338, + "grad_min_sv": 1.0798128024722132e-08, + "grad_condition": 406311701.1258798, + "lr": 0.00032571397633909225, + "time_sec": 15.527170181274414 + }, + { + "epoch": 93, + "train_loss": 0.2772208102607727, + "train_acc": 0.91184, + "test_loss": 2.0510717596054078, + "test_acc": 0.5952, + "lyapunov": null, + "grad_norm": 0.603398829043512, + "grad_max_sv": 0.2785311110317707, + "grad_min_sv": 1.0620686785936529e-08, + "grad_condition": 159246942.28978306, + "lr": 0.00031593772365766094, + "time_sec": 15.521395206451416 + }, + { + "epoch": 94, + "train_loss": 0.2721544520187378, + "train_acc": 0.91266, + "test_loss": 2.044207299041748, + "test_acc": 0.5963, + "lyapunov": null, + "grad_norm": 0.597776334868791, + "grad_max_sv": 0.2813128184527159, + "grad_min_sv": 1.032634765595758e-08, + "grad_condition": 320344963.9972409, + "lr": 0.0003062422067739483, + "time_sec": 15.535969257354736 + }, + { + "epoch": 95, + "train_loss": 0.2562399788665771, + "train_acc": 0.91636, + "test_loss": 2.1072509820938112, + "test_acc": 0.5953, + "lyapunov": null, + "grad_norm": 0.5775561165196347, + "grad_max_sv": 0.27824114337563516, + "grad_min_sv": 1.0481623234420353e-08, + "grad_condition": 474004359.26671135, + "lr": 0.00029663167846209965, + "time_sec": 15.517311334609985 + }, + { + "epoch": 96, + "train_loss": 0.2625131010723114, + "train_acc": 0.9142, + "test_loss": 2.035417915725708, + "test_acc": 0.604, + "lyapunov": null, + "grad_norm": 0.5877203581399221, + "grad_max_sv": 0.28129979483783246, + "grad_min_sv": 1.0502568877773787e-08, + "grad_condition": 177356414.63757357, + "lr": 0.00028711035421746345, + "time_sec": 15.521276950836182 + }, + { + "epoch": 97, + "train_loss": 0.2552481310462952, + "train_acc": 0.9173, + "test_loss": 1.9491484304428102, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.5816116237706002, + "grad_max_sv": 0.27597419619560243, + "grad_min_sv": 1.0369440153409904e-08, + "grad_condition": 153072053.30610082, + "lr": 0.00027768241040753615, + "time_sec": 15.518199920654297 + }, + { + "epoch": 98, + "train_loss": 0.2514290081501007, + "train_acc": 0.91774, + "test_loss": 1.9556513019561768, + "test_acc": 0.6144, + "lyapunov": null, + "grad_norm": 0.5786453355425705, + "grad_max_sv": 0.25863444767892363, + "grad_min_sv": 9.982682687079137e-09, + "grad_condition": 323898207.1043015, + "lr": 0.00026835198244006903, + "time_sec": 15.518558025360107 + }, + { + "epoch": 99, + "train_loss": 0.24542429465293883, + "train_acc": 0.92078, + "test_loss": 2.0414382596969602, + "test_acc": 0.6093, + "lyapunov": null, + "grad_norm": 0.5720561260068352, + "grad_max_sv": 0.2730622936040163, + "grad_min_sv": 1.0236981595745931e-08, + "grad_condition": 73009111.50173582, + "lr": 0.0002591231629491421, + "time_sec": 15.516184568405151 + }, + { + "epoch": 100, + "train_loss": 0.2419339677333832, + "train_acc": 0.92168, + "test_loss": 2.0001620481491087, + "test_acc": 0.615, + "lyapunov": null, + "grad_norm": 0.5656963959074934, + "grad_max_sv": 0.2690838035196066, + "grad_min_sv": 1.0369351413283546e-08, + "grad_condition": 325100290.9819474, + "lr": 0.0002499999999999997, + "time_sec": 15.516221761703491 + }, + { + "epoch": 101, + "train_loss": 0.23517837069511413, + "train_acc": 0.92362, + "test_loss": 2.0624069427490235, + "test_acc": 0.6006, + "lyapunov": null, + "grad_norm": 0.5588551885657764, + "grad_max_sv": 0.26636214926838875, + "grad_min_sv": 9.985110372735806e-09, + "grad_condition": 152593330.29256034, + "lr": 0.00024098649531343477, + "time_sec": 15.525659799575806 + }, + { + "epoch": 102, + "train_loss": 0.23243571233749388, + "train_acc": 0.92494, + "test_loss": 2.050922277832031, + "test_acc": 0.6071, + "lyapunov": null, + "grad_norm": 0.555094837720988, + "grad_max_sv": 0.2671301085501909, + "grad_min_sv": 9.489460735148495e-09, + "grad_condition": 975172257.3566437, + "lr": 0.0002320866025105016, + "time_sec": 15.512139797210693 + }, + { + "epoch": 103, + "train_loss": 0.22915385756969453, + "train_acc": 0.92618, + "test_loss": 2.0090701560974122, + "test_acc": 0.6102, + "lyapunov": null, + "grad_norm": 0.551643622576711, + "grad_max_sv": 0.26358814239501954, + "grad_min_sv": 9.903819275135706e-09, + "grad_condition": 8450881945.308035, + "lr": 0.0002233042253783278, + "time_sec": 15.51590085029602 + }, + { + "epoch": 104, + "train_loss": 0.22301624965667724, + "train_acc": 0.929, + "test_loss": 2.0414324163436888, + "test_acc": 0.6097, + "lyapunov": null, + "grad_norm": 0.547361757777093, + "grad_max_sv": 0.2635317210108042, + "grad_min_sv": 9.868235632663237e-09, + "grad_condition": 918464158.4766433, + "lr": 0.000214643216157784, + "time_sec": 15.517698764801025 + }, + { + "epoch": 105, + "train_loss": 0.21800282436847687, + "train_acc": 0.92888, + "test_loss": 2.006334408760071, + "test_acc": 0.6108, + "lyapunov": null, + "grad_norm": 0.5441245707971135, + "grad_max_sv": 0.2652390133589506, + "grad_min_sv": 9.775255871067018e-09, + "grad_condition": 1728037982.0008423, + "lr": 0.00020610737385376332, + "time_sec": 15.521651268005371 + }, + { + "epoch": 106, + "train_loss": 0.22170533905029297, + "train_acc": 0.92766, + "test_loss": 2.0015246070861816, + "test_acc": 0.6151, + "lyapunov": null, + "grad_norm": 0.5504732473005655, + "grad_max_sv": 0.2658932194113731, + "grad_min_sv": 9.836566865553675e-09, + "grad_condition": 187622343.96039546, + "lr": 0.00019770044256881242, + "time_sec": 15.52303409576416 + }, + { + "epoch": 107, + "train_loss": 0.21625425663948059, + "train_acc": 0.92998, + "test_loss": 2.0188750885009767, + "test_acc": 0.6132, + "lyapunov": null, + "grad_norm": 0.5416895117176501, + "grad_max_sv": 0.25219607427716256, + "grad_min_sv": 9.366761803773077e-09, + "grad_condition": 260260509.50687146, + "lr": 0.0001894261098608447, + "time_sec": 15.538499593734741 + }, + { + "epoch": 108, + "train_loss": 0.20747127439498902, + "train_acc": 0.93344, + "test_loss": 1.992410384941101, + "test_acc": 0.6181, + "lyapunov": null, + "grad_norm": 0.5312872760984289, + "grad_max_sv": 0.26626099497079847, + "grad_min_sv": 9.742697032379816e-09, + "grad_condition": 241868081.8815055, + "lr": 0.000181288005125655, + "time_sec": 15.520596027374268 + }, + { + "epoch": 109, + "train_loss": 0.21061437376976014, + "train_acc": 0.93212, + "test_loss": 2.0430712549209593, + "test_acc": 0.6121, + "lyapunov": null, + "grad_norm": 0.53793437376293, + "grad_max_sv": 0.26196735054254533, + "grad_min_sv": 9.911649283440849e-09, + "grad_condition": 196778424.3729182, + "lr": 0.0001732896980049473, + "time_sec": 15.514817953109741 + }, + { + "epoch": 110, + "train_loss": 0.20801750651359557, + "train_acc": 0.93272, + "test_loss": 2.0129987867355346, + "test_acc": 0.6136, + "lyapunov": null, + "grad_norm": 0.5345111757966097, + "grad_max_sv": 0.2620788164436817, + "grad_min_sv": 9.685049608479378e-09, + "grad_condition": 442982408.6181739, + "lr": 0.00016543469682057076, + "time_sec": 15.524093389511108 + }, + { + "epoch": 111, + "train_loss": 0.20387941056251527, + "train_acc": 0.93432, + "test_loss": 2.017576940536499, + "test_acc": 0.6171, + "lyapunov": null, + "grad_norm": 0.5265383831682404, + "grad_max_sv": 0.2475517351180315, + "grad_min_sv": 9.334722057222771e-09, + "grad_condition": 520706944.53767884, + "lr": 0.00015772644703565552, + "time_sec": 15.520273685455322 + }, + { + "epoch": 112, + "train_loss": 0.20065601328372956, + "train_acc": 0.93514, + "test_loss": 2.0878772733688353, + "test_acc": 0.6091, + "lyapunov": null, + "grad_norm": 0.5235410807678327, + "grad_max_sv": 0.2556714225560427, + "grad_min_sv": 9.592023909182901e-09, + "grad_condition": 295083197.1946956, + "lr": 0.00015016832974331713, + "time_sec": 15.510764837265015 + }, + { + "epoch": 113, + "train_loss": 0.1982079153442383, + "train_acc": 0.93612, + "test_loss": 2.047266570854187, + "test_acc": 0.6181, + "lyapunov": null, + "grad_norm": 0.5197176578777744, + "grad_max_sv": 0.25255175642669203, + "grad_min_sv": 9.308845385150311e-09, + "grad_condition": 520055211.6428779, + "lr": 0.00014276366018359834, + "time_sec": 15.705829381942749 + }, + { + "epoch": 114, + "train_loss": 0.19655517510414122, + "train_acc": 0.93708, + "test_loss": 2.0292094760894774, + "test_acc": 0.6144, + "lyapunov": null, + "grad_norm": 0.5181527372855724, + "grad_max_sv": 0.25922506861388683, + "grad_min_sv": 9.507550523431274e-09, + "grad_condition": 332806274.6985155, + "lr": 0.00013551568628929425, + "time_sec": 15.525954723358154 + }, + { + "epoch": 115, + "train_loss": 0.18803977591514587, + "train_acc": 0.93928, + "test_loss": 2.0187850973129273, + "test_acc": 0.6152, + "lyapunov": null, + "grad_norm": 0.5114058292617459, + "grad_max_sv": 0.2462628223001957, + "grad_min_sv": 9.353905294090265e-09, + "grad_condition": 1483441837.69936, + "lr": 0.00012842758726130276, + "time_sec": 15.518154859542847 + }, + { + "epoch": 116, + "train_loss": 0.18797869988918303, + "train_acc": 0.93912, + "test_loss": 2.084369885826111, + "test_acc": 0.6095, + "lyapunov": null, + "grad_norm": 0.5077819115434521, + "grad_max_sv": 0.25109760873019693, + "grad_min_sv": 8.964496494212256e-09, + "grad_condition": 298276978.79912215, + "lr": 0.0001215024721741218, + "time_sec": 15.520355939865112 + }, + { + "epoch": 117, + "train_loss": 0.18214592965126036, + "train_acc": 0.94196, + "test_loss": 2.034072047996521, + "test_acc": 0.6169, + "lyapunov": null, + "grad_norm": 0.49960618612788865, + "grad_max_sv": 0.25671581737697124, + "grad_min_sv": 9.445877218535077e-09, + "grad_condition": 1803107586.0713096, + "lr": 0.00011474337861210538, + "time_sec": 15.5315523147583 + }, + { + "epoch": 118, + "train_loss": 0.18415243848800658, + "train_acc": 0.93992, + "test_loss": 2.082629474067688, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.5036047735021936, + "grad_max_sv": 0.24121248573064805, + "grad_min_sv": 8.989532489320911e-09, + "grad_condition": 1883514828.3661075, + "lr": 0.00010815327133708009, + "time_sec": 15.565385580062866 + }, + { + "epoch": 119, + "train_loss": 0.18069743538856506, + "train_acc": 0.94234, + "test_loss": 2.0749569414138795, + "test_acc": 0.6104, + "lyapunov": null, + "grad_norm": 0.4967845602516186, + "grad_max_sv": 0.24950436390936376, + "grad_min_sv": 9.221202780431564e-09, + "grad_condition": 275651167.2776666, + "lr": 0.00010173504098790182, + "time_sec": 15.531636476516724 + }, + { + "epoch": 120, + "train_loss": 0.1800184269142151, + "train_acc": 0.9418, + "test_loss": 2.063923722267151, + "test_acc": 0.6149, + "lyapunov": null, + "grad_norm": 0.5000634640274525, + "grad_max_sv": 0.2467968337237835, + "grad_min_sv": 9.10186292138633e-09, + "grad_condition": 420120780.22859687, + "lr": 9.549150281252629e-05, + "time_sec": 15.545646905899048 + }, + { + "epoch": 121, + "train_loss": 0.1746319353055954, + "train_acc": 0.94524, + "test_loss": 2.031014646720886, + "test_acc": 0.6202, + "lyapunov": null, + "grad_norm": 0.4894634649372604, + "grad_max_sv": 0.24847413785755634, + "grad_min_sv": 9.111916768203901e-09, + "grad_condition": 529933823.1357336, + "lr": 8.942539543314794e-05, + "time_sec": 15.525688648223877 + }, + { + "epoch": 122, + "train_loss": 0.1720413486146927, + "train_acc": 0.94558, + "test_loss": 2.0709302186965943, + "test_acc": 0.6107, + "lyapunov": null, + "grad_norm": 0.4872422158802626, + "grad_max_sv": 0.25410806462168695, + "grad_min_sv": 9.372779969513134e-09, + "grad_condition": 129683199.58735898, + "lr": 8.353937964495024e-05, + "time_sec": 15.53614616394043 + }, + { + "epoch": 123, + "train_loss": 0.167387109708786, + "train_acc": 0.94716, + "test_loss": 2.04781618976593, + "test_acc": 0.621, + "lyapunov": null, + "grad_norm": 0.47867845277837057, + "grad_max_sv": 0.24308387711644172, + "grad_min_sv": 8.83432009590561e-09, + "grad_condition": 446940201.78913987, + "lr": 7.783603724899243e-05, + "time_sec": 15.534965991973877 + }, + { + "epoch": 124, + "train_loss": 0.17369194811820984, + "train_acc": 0.9434, + "test_loss": 2.080777750968933, + "test_acc": 0.6137, + "lyapunov": null, + "grad_norm": 0.4915299120514337, + "grad_max_sv": 0.24491641744971276, + "grad_min_sv": 8.973002642667129e-09, + "grad_condition": 968560910.7177868, + "lr": 7.231786991974666e-05, + "time_sec": 15.534366130828857 + }, + { + "epoch": 125, + "train_loss": 0.17029917016983032, + "train_acc": 0.94574, + "test_loss": 2.0687435190200807, + "test_acc": 0.6157, + "lyapunov": null, + "grad_norm": 0.4850020461380622, + "grad_max_sv": 0.24593175910413265, + "grad_min_sv": 8.810581337420631e-09, + "grad_condition": 165938611.54228717, + "lr": 6.698729810778072e-05, + "time_sec": 15.55061674118042 + }, + { + "epoch": 126, + "train_loss": 0.1665445522928238, + "train_acc": 0.94674, + "test_loss": 2.0515053030014037, + "test_acc": 0.6187, + "lyapunov": null, + "grad_norm": 0.48056912270271285, + "grad_max_sv": 0.23969021812081337, + "grad_min_sv": 8.827286746693327e-09, + "grad_condition": 1743247825.2921212, + "lr": 6.184665997806817e-05, + "time_sec": 15.531169652938843 + }, + { + "epoch": 127, + "train_loss": 0.16487963933944702, + "train_acc": 0.94836, + "test_loss": 2.033387902641296, + "test_acc": 0.6198, + "lyapunov": null, + "grad_norm": 0.47729941792361885, + "grad_max_sv": 0.2343486487865448, + "grad_min_sv": 8.995271932876748e-09, + "grad_condition": 606828641.3185183, + "lr": 5.6898210384392595e-05, + "time_sec": 15.539721250534058 + }, + { + "epoch": 128, + "train_loss": 0.16376567732810973, + "train_acc": 0.94834, + "test_loss": 2.0975912773132324, + "test_acc": 0.6112, + "lyapunov": null, + "grad_norm": 0.47555669561822944, + "grad_max_sv": 0.2403645869344473, + "grad_min_sv": 8.86344721578395e-09, + "grad_condition": 1871409158.001809, + "lr": 5.214411988029363e-05, + "time_sec": 15.523812055587769 + }, + { + "epoch": 129, + "train_loss": 0.16381013206005096, + "train_acc": 0.94882, + "test_loss": 2.0344886224746705, + "test_acc": 0.6205, + "lyapunov": null, + "grad_norm": 0.47811068127125184, + "grad_max_sv": 0.2321129973977804, + "grad_min_sv": 8.809577021736195e-09, + "grad_condition": 674841641.2549579, + "lr": 4.7586473766990294e-05, + "time_sec": 15.542162656784058 + }, + { + "epoch": 130, + "train_loss": 0.1587965604352951, + "train_acc": 0.95018, + "test_loss": 2.039856211090088, + "test_acc": 0.6198, + "lyapunov": null, + "grad_norm": 0.46996704308372744, + "grad_max_sv": 0.24367436692118644, + "grad_min_sv": 8.878338260412334e-09, + "grad_condition": 3107522776.3953853, + "lr": 4.32272711786996e-05, + "time_sec": 15.518379926681519 + }, + { + "epoch": 131, + "train_loss": 0.16415684640884398, + "train_acc": 0.94804, + "test_loss": 2.0716621114730835, + "test_acc": 0.6177, + "lyapunov": null, + "grad_norm": 0.477860267933493, + "grad_max_sv": 0.23813350014388562, + "grad_min_sv": 8.676938825780134e-09, + "grad_condition": 186204488.74284863, + "lr": 3.906842420574966e-05, + "time_sec": 15.52889084815979 + }, + { + "epoch": 132, + "train_loss": 0.1586827588367462, + "train_acc": 0.94982, + "test_loss": 2.053567728805542, + "test_acc": 0.6199, + "lyapunov": null, + "grad_norm": 0.4697672382287586, + "grad_max_sv": 0.2426899142563343, + "grad_min_sv": 8.828440787385545e-09, + "grad_condition": 1012659868.4686158, + "lr": 3.5111757055874305e-05, + "time_sec": 15.524049282073975 + }, + { + "epoch": 133, + "train_loss": 0.15553737973690032, + "train_acc": 0.95082, + "test_loss": 2.043516174507141, + "test_acc": 0.6191, + "lyapunov": null, + "grad_norm": 0.4649067986135626, + "grad_max_sv": 0.24401309713721275, + "grad_min_sv": 8.961552855574292e-09, + "grad_condition": 1162757970.0586789, + "lr": 3.1359005254054254e-05, + "time_sec": 15.536059856414795 + }, + { + "epoch": 134, + "train_loss": 0.15784678574085237, + "train_acc": 0.9499, + "test_loss": 2.03684903011322, + "test_acc": 0.6189, + "lyapunov": null, + "grad_norm": 0.4686730421924603, + "grad_max_sv": 0.23595759123563767, + "grad_min_sv": 8.586731024010303e-09, + "grad_condition": 4315274102.848023, + "lr": 2.7811814881259484e-05, + "time_sec": 15.534076690673828 + }, + { + "epoch": 135, + "train_loss": 0.15442110489368438, + "train_acc": 0.95192, + "test_loss": 2.0882527042388914, + "test_acc": 0.6147, + "lyapunov": null, + "grad_norm": 0.4615131055534514, + "grad_max_sv": 0.2321950040757656, + "grad_min_sv": 8.617836743177176e-09, + "grad_condition": 99470014.62201284, + "lr": 2.4471741852423218e-05, + "time_sec": 15.554243803024292 + }, + { + "epoch": 136, + "train_loss": 0.15938658513069154, + "train_acc": 0.95014, + "test_loss": 2.0193495433807374, + "test_acc": 0.619, + "lyapunov": null, + "grad_norm": 0.46997706784197274, + "grad_max_sv": 0.24588101021945477, + "grad_min_sv": 8.594699345537e-09, + "grad_condition": 299854790.23102367, + "lr": 2.1340251233966362e-05, + "time_sec": 15.515581130981445 + }, + { + "epoch": 137, + "train_loss": 0.15305941107273102, + "train_acc": 0.95102, + "test_loss": 2.085107785606384, + "test_acc": 0.6178, + "lyapunov": null, + "grad_norm": 0.4651082031381239, + "grad_max_sv": 0.23546294569969178, + "grad_min_sv": 8.641280193082048e-09, + "grad_condition": 1355468630.1220336, + "lr": 1.8418716601170932e-05, + "time_sec": 15.523824691772461 + }, + { + "epoch": 138, + "train_loss": 0.15521952202796935, + "train_acc": 0.95138, + "test_loss": 2.05961570148468, + "test_acc": 0.621, + "lyapunov": null, + "grad_norm": 0.4655707979434113, + "grad_max_sv": 0.22249948792159557, + "grad_min_sv": 8.559314398871517e-09, + "grad_condition": 523110775.45855033, + "lr": 1.570841943568445e-05, + "time_sec": 15.527312755584717 + }, + { + "epoch": 139, + "train_loss": 0.15613153836250304, + "train_acc": 0.94964, + "test_loss": 2.0917256591796876, + "test_acc": 0.6145, + "lyapunov": null, + "grad_norm": 0.4685524417915432, + "grad_max_sv": 0.23622551932930946, + "grad_min_sv": 8.448936071386512e-09, + "grad_condition": 381309760.86173236, + "lr": 1.3210548563419845e-05, + "time_sec": 15.53156852722168 + }, + { + "epoch": 140, + "train_loss": 0.15750930822372436, + "train_acc": 0.95076, + "test_loss": 2.0336023241043093, + "test_acc": 0.6231, + "lyapunov": null, + "grad_norm": 0.46956356170298885, + "grad_max_sv": 0.24571651183068752, + "grad_min_sv": 8.880518665268025e-09, + "grad_condition": 446576930.15414965, + "lr": 1.0926199633097203e-05, + "time_sec": 15.513741731643677 + }, + { + "epoch": 141, + "train_loss": 0.15634389350891112, + "train_acc": 0.95178, + "test_loss": 2.0461313623428343, + "test_acc": 0.6206, + "lyapunov": null, + "grad_norm": 0.4667179789960613, + "grad_max_sv": 0.2333354063332081, + "grad_min_sv": 8.735082636959725e-09, + "grad_condition": 2773787337.949284, + "lr": 8.856374635655688e-06, + "time_sec": 15.527939558029175 + }, + { + "epoch": 142, + "train_loss": 0.1522996149158478, + "train_acc": 0.95188, + "test_loss": 2.036745939064026, + "test_acc": 0.6191, + "lyapunov": null, + "grad_norm": 0.45971196350477606, + "grad_max_sv": 0.23409303948283194, + "grad_min_sv": 8.654798093845651e-09, + "grad_condition": 899766914.5561358, + "lr": 7.001981464747503e-06, + "time_sec": 15.528279781341553 + }, + { + "epoch": 143, + "train_loss": 0.15602009796380997, + "train_acc": 0.95086, + "test_loss": 2.030546005439758, + "test_acc": 0.6179, + "lyapunov": null, + "grad_norm": 0.46698211747670393, + "grad_max_sv": 0.2427021000534296, + "grad_min_sv": 8.880018779116672e-09, + "grad_condition": 2005668849.0321355, + "lr": 5.3638335185058295e-06, + "time_sec": 15.519719362258911 + }, + { + "epoch": 144, + "train_loss": 0.15405357198238373, + "train_acc": 0.95214, + "test_loss": 2.0480900999069216, + "test_acc": 0.6225, + "lyapunov": null, + "grad_norm": 0.4619783068969592, + "grad_max_sv": 0.24754497669637204, + "grad_min_sv": 9.022524723482569e-09, + "grad_condition": 472769507.4774891, + "lr": 3.942649342761114e-06, + "time_sec": 15.538635015487671 + }, + { + "epoch": 145, + "train_loss": 0.15324831766605376, + "train_acc": 0.95236, + "test_loss": 2.0383225648880003, + "test_acc": 0.6217, + "lyapunov": null, + "grad_norm": 0.46106192343039926, + "grad_max_sv": 0.23626826107501983, + "grad_min_sv": 8.604992432687843e-09, + "grad_condition": 1211825093.7054877, + "lr": 2.7390523158633524e-06, + "time_sec": 15.542897939682007 + }, + { + "epoch": 146, + "train_loss": 0.15349729721069336, + "train_acc": 0.9521, + "test_loss": 2.0096838916778563, + "test_acc": 0.6241, + "lyapunov": null, + "grad_norm": 0.4615822267692517, + "grad_max_sv": 0.23966375291347503, + "grad_min_sv": 8.838330253866516e-09, + "grad_condition": 685922400.3184944, + "lr": 1.7535703752478133e-06, + "time_sec": 15.519303321838379 + }, + { + "epoch": 147, + "train_loss": 0.15039199693679808, + "train_acc": 0.95362, + "test_loss": 2.0573708726882933, + "test_acc": 0.6207, + "lyapunov": null, + "grad_norm": 0.4572591547952713, + "grad_max_sv": 0.2330123759806156, + "grad_min_sv": 8.66143673887215e-09, + "grad_condition": 1329748658.9084074, + "lr": 9.866357858642196e-07, + "time_sec": 15.523812532424927 + }, + { + "epoch": 148, + "train_loss": 0.15033800620317458, + "train_acc": 0.95234, + "test_loss": 2.0463861759185793, + "test_acc": 0.6186, + "lyapunov": null, + "grad_norm": 0.45711357740306113, + "grad_max_sv": 0.2265869051218033, + "grad_min_sv": 8.489472146479878e-09, + "grad_condition": 764759274.1337291, + "lr": 4.38584950570808e-07, + "time_sec": 15.51754641532898 + }, + { + "epoch": 149, + "train_loss": 0.15091258768081664, + "train_acc": 0.95256, + "test_loss": 2.0271072778701784, + "test_acc": 0.6188, + "lyapunov": null, + "grad_norm": 0.4574063447607332, + "grad_max_sv": 0.23711176067590714, + "grad_min_sv": 8.619700593825432e-09, + "grad_condition": 2609529945.0149875, + "lr": 1.096582625772501e-07, + "time_sec": 15.518434286117554 + }, + { + "epoch": 150, + "train_loss": 0.153145382938385, + "train_acc": 0.95224, + "test_loss": 2.03473729095459, + "test_acc": 0.6182, + "lyapunov": null, + "grad_norm": 0.46046361312569684, + "grad_max_sv": 0.22179042883217334, + "grad_min_sv": 8.465783018335969e-09, + "grad_condition": 1154619433.2746358, + "lr": 0.0, + "time_sec": 15.527158737182617 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 4.604280056762695, + "train_acc": 0.06204, + "test_loss": 4.320657266998291, + "test_acc": 0.0698, + "lyapunov": null, + "grad_norm": 6.299548945029663, + "grad_max_sv": 5.383423590660096, + "grad_min_sv": 1.0969439819819016e-07, + "grad_condition": 135387683.66756994, + "lr": 0.0009998903417374227, + "time_sec": 32.66659903526306 + }, + { + "epoch": 2, + "train_loss": 3.8911869562530517, + "train_acc": 0.12252, + "test_loss": 3.901215605163574, + "test_acc": 0.1102, + "lyapunov": null, + "grad_norm": 4.7289084274834625, + "grad_max_sv": 4.045294773578644, + "grad_min_sv": 8.59628614957586e-08, + "grad_condition": 54316925.08787592, + "lr": 0.0009995614150494292, + "time_sec": 32.55902910232544 + }, + { + "epoch": 3, + "train_loss": 3.5447918058776855, + "train_acc": 0.16864, + "test_loss": 3.5751065971374514, + "test_acc": 0.1632, + "lyapunov": null, + "grad_norm": 3.9235192359291027, + "grad_max_sv": 3.218869465589523, + "grad_min_sv": 7.25899491738069e-08, + "grad_condition": 59713400.674747445, + "lr": 0.0009990133642141358, + "time_sec": 32.56558012962341 + }, + { + "epoch": 4, + "train_loss": 3.285915934448242, + "train_acc": 0.20564, + "test_loss": 3.4154525535583495, + "test_acc": 0.1808, + "lyapunov": null, + "grad_norm": 3.2931939429390655, + "grad_max_sv": 2.48674353659153, + "grad_min_sv": 6.094367343001394e-08, + "grad_condition": 49578785.90593137, + "lr": 0.0009982464296247522, + "time_sec": 32.57981467247009 + }, + { + "epoch": 5, + "train_loss": 3.049801904296875, + "train_acc": 0.2475, + "test_loss": 3.380838261413574, + "test_acc": 0.2067, + "lyapunov": null, + "grad_norm": 2.7585548587495836, + "grad_max_sv": 1.9313260614871979, + "grad_min_sv": 5.103909220399716e-08, + "grad_condition": 117086071.43576927, + "lr": 0.0009972609476841367, + "time_sec": 32.564860582351685 + }, + { + "epoch": 6, + "train_loss": 2.861402225112915, + "train_acc": 0.28052, + "test_loss": 3.1182963836669924, + "test_acc": 0.2393, + "lyapunov": null, + "grad_norm": 2.365169286939716, + "grad_max_sv": 1.514634570479393, + "grad_min_sv": 4.377452151871353e-08, + "grad_condition": 42685906.70361744, + "lr": 0.000996057350657239, + "time_sec": 32.57882595062256 + }, + { + "epoch": 7, + "train_loss": 2.683069683303833, + "train_acc": 0.31566, + "test_loss": 2.857948400115967, + "test_acc": 0.2899, + "lyapunov": null, + "grad_norm": 2.0678830204526424, + "grad_max_sv": 1.2104690104722977, + "grad_min_sv": 3.849874057187952e-08, + "grad_condition": 83742051.18670955, + "lr": 0.000994636166481494, + "time_sec": 32.585235834121704 + }, + { + "epoch": 8, + "train_loss": 2.5299233337402343, + "train_acc": 0.34444, + "test_loss": 3.000171680831909, + "test_acc": 0.2752, + "lyapunov": null, + "grad_norm": 1.874555701802065, + "grad_max_sv": 1.0279113829135895, + "grad_min_sv": 3.509024343872902e-08, + "grad_condition": 55390142.1353655, + "lr": 0.0009929980185352525, + "time_sec": 32.69047737121582 + }, + { + "epoch": 9, + "train_loss": 2.4147268306732177, + "train_acc": 0.3694, + "test_loss": 2.543715224456787, + "test_acc": 0.3455, + "lyapunov": null, + "grad_norm": 1.7485138229937156, + "grad_max_sv": 0.9131708398461342, + "grad_min_sv": 3.287046465294541e-08, + "grad_condition": 39656658.27812234, + "lr": 0.0009911436253643444, + "time_sec": 32.57169961929321 + }, + { + "epoch": 10, + "train_loss": 2.2967233794403077, + "train_acc": 0.39298, + "test_loss": 2.6548849906921386, + "test_acc": 0.3353, + "lyapunov": null, + "grad_norm": 1.6282804367899422, + "grad_max_sv": 0.782713083922863, + "grad_min_sv": 3.019940961190848e-08, + "grad_condition": 36873848.007240444, + "lr": 0.0009890738003669028, + "time_sec": 32.577866077423096 + }, + { + "epoch": 11, + "train_loss": 2.192351549682617, + "train_acc": 0.41852, + "test_loss": 2.3893451919555666, + "test_acc": 0.3824, + "lyapunov": null, + "grad_norm": 1.5518898048516216, + "grad_max_sv": 0.7297310382127762, + "grad_min_sv": 2.9274875311402494e-08, + "grad_condition": 81724146.83842216, + "lr": 0.00098678945143658, + "time_sec": 32.599745750427246 + }, + { + "epoch": 12, + "train_loss": 2.117909373779297, + "train_acc": 0.4337, + "test_loss": 2.522136171722412, + "test_acc": 0.3587, + "lyapunov": null, + "grad_norm": 1.4842631514558458, + "grad_max_sv": 0.66500775963068, + "grad_min_sv": 2.8010595395921988e-08, + "grad_condition": 35670339.18143847, + "lr": 0.0009842915805643154, + "time_sec": 32.62933874130249 + }, + { + "epoch": 13, + "train_loss": 2.035253409576416, + "train_acc": 0.45344, + "test_loss": 2.391997838592529, + "test_acc": 0.3805, + "lyapunov": null, + "grad_norm": 1.4422903854957079, + "grad_max_sv": 0.6408356204628944, + "grad_min_sv": 2.7295970482510425e-08, + "grad_condition": 43720876.000019774, + "lr": 0.000981581283398829, + "time_sec": 32.557313442230225 + }, + { + "epoch": 14, + "train_loss": 1.9614996997451781, + "train_acc": 0.46826, + "test_loss": 2.3329195419311524, + "test_acc": 0.4028, + "lyapunov": null, + "grad_norm": 1.3741944023253918, + "grad_max_sv": 0.6013172835111618, + "grad_min_sv": 2.5733794781213072e-08, + "grad_condition": 36069642.478253104, + "lr": 0.0009786597487660333, + "time_sec": 32.58955407142639 + }, + { + "epoch": 15, + "train_loss": 1.8944761297988892, + "train_acc": 0.48526, + "test_loss": 2.2367286880493165, + "test_acc": 0.4236, + "lyapunov": null, + "grad_norm": 1.3219592289498192, + "grad_max_sv": 0.5812912411987782, + "grad_min_sv": 2.4716666779944773e-08, + "grad_condition": 29281331.50836698, + "lr": 0.0009755282581475766, + "time_sec": 32.56029748916626 + }, + { + "epoch": 16, + "train_loss": 1.8379625350189208, + "train_acc": 0.49608, + "test_loss": 2.1963637313842774, + "test_acc": 0.4284, + "lyapunov": null, + "grad_norm": 1.2908175006695335, + "grad_max_sv": 0.5532825239002704, + "grad_min_sv": 2.4336655729539913e-08, + "grad_condition": 42358304.72716427, + "lr": 0.0009721881851187403, + "time_sec": 32.54909014701843 + }, + { + "epoch": 17, + "train_loss": 1.7670473766326904, + "train_acc": 0.51538, + "test_loss": 2.1328998752593993, + "test_acc": 0.4452, + "lyapunov": null, + "grad_norm": 1.2440997761596901, + "grad_max_sv": 0.5198108039796352, + "grad_min_sv": 2.3273317767413813e-08, + "grad_condition": 35998824.48422967, + "lr": 0.0009686409947459456, + "time_sec": 32.55762696266174 + }, + { + "epoch": 18, + "train_loss": 1.7253368561553954, + "train_acc": 0.52444, + "test_loss": 2.245950330352783, + "test_acc": 0.4284, + "lyapunov": null, + "grad_norm": 1.214902512911659, + "grad_max_sv": 0.5048692628741265, + "grad_min_sv": 2.2689030459988047e-08, + "grad_condition": 49317544.599824145, + "lr": 0.0009648882429441254, + "time_sec": 32.5514817237854 + }, + { + "epoch": 19, + "train_loss": 1.6694325649261474, + "train_acc": 0.5342, + "test_loss": 2.19226961517334, + "test_acc": 0.4387, + "lyapunov": null, + "grad_norm": 1.1750671216974986, + "grad_max_sv": 0.4863507993519306, + "grad_min_sv": 2.2075054092324244e-08, + "grad_condition": 97502207.70501134, + "lr": 0.00096093157579425, + "time_sec": 32.55115628242493 + }, + { + "epoch": 20, + "train_loss": 1.617248278427124, + "train_acc": 0.5473, + "test_loss": 2.143247143173218, + "test_acc": 0.453, + "lyapunov": null, + "grad_norm": 1.1445750522907119, + "grad_max_sv": 0.4708236537873745, + "grad_min_sv": 2.1383133666508236e-08, + "grad_condition": 30242603.347623855, + "lr": 0.0009567727288213001, + "time_sec": 32.56135654449463 + }, + { + "epoch": 21, + "train_loss": 1.5802922723007202, + "train_acc": 0.557, + "test_loss": 2.0990093154907226, + "test_acc": 0.4651, + "lyapunov": null, + "grad_norm": 1.1146123139527973, + "grad_max_sv": 0.45539517551660535, + "grad_min_sv": 2.1216313506045025e-08, + "grad_condition": 32120917.787080377, + "lr": 0.0009524135262330095, + "time_sec": 32.58874869346619 + }, + { + "epoch": 22, + "train_loss": 1.540067174949646, + "train_acc": 0.56592, + "test_loss": 2.0439955375671386, + "test_acc": 0.4707, + "lyapunov": null, + "grad_norm": 1.0888616623198637, + "grad_max_sv": 0.43293082937598226, + "grad_min_sv": 2.0197447772596356e-08, + "grad_condition": 51667507.409315005, + "lr": 0.0009478558801197061, + "time_sec": 32.57522892951965 + }, + { + "epoch": 23, + "train_loss": 1.5045368173980713, + "train_acc": 0.57686, + "test_loss": 2.0701497230529786, + "test_acc": 0.4729, + "lyapunov": null, + "grad_norm": 1.0823066547637195, + "grad_max_sv": 0.4348363593220711, + "grad_min_sv": 2.0215574525472847e-08, + "grad_condition": 38846769.86075296, + "lr": 0.000943101789615607, + "time_sec": 32.58562135696411 + }, + { + "epoch": 24, + "train_loss": 1.464451589126587, + "train_acc": 0.58532, + "test_loss": 2.2039865215301515, + "test_acc": 0.4486, + "lyapunov": null, + "grad_norm": 1.0523927832685198, + "grad_max_sv": 0.41661558151245115, + "grad_min_sv": 1.950878351086871e-08, + "grad_condition": 34416119.9412758, + "lr": 0.0009381533400219313, + "time_sec": 32.563148736953735 + }, + { + "epoch": 25, + "train_loss": 1.4205649266052247, + "train_acc": 0.59388, + "test_loss": 2.1708908073425293, + "test_acc": 0.4631, + "lyapunov": null, + "grad_norm": 1.0237955167104829, + "grad_max_sv": 0.41313874199986456, + "grad_min_sv": 1.9160673876000846e-08, + "grad_condition": 116069222.65926342, + "lr": 0.0009330127018922189, + "time_sec": 32.58251953125 + }, + { + "epoch": 26, + "train_loss": 1.3801667861938476, + "train_acc": 0.60904, + "test_loss": 2.141048712158203, + "test_acc": 0.4804, + "lyapunov": null, + "grad_norm": 1.003894338084706, + "grad_max_sv": 0.39152884259819987, + "grad_min_sv": 1.85417132805496e-08, + "grad_condition": 149070926.97039393, + "lr": 0.000927682130080253, + "time_sec": 32.58069562911987 + }, + { + "epoch": 27, + "train_loss": 1.3742198986053467, + "train_acc": 0.6049, + "test_loss": 2.1493278324127196, + "test_acc": 0.4766, + "lyapunov": null, + "grad_norm": 1.0025464883815882, + "grad_max_sv": 0.3876075059175491, + "grad_min_sv": 1.830616184195222e-08, + "grad_condition": 35882215.67392446, + "lr": 0.0009221639627510072, + "time_sec": 32.56836271286011 + }, + { + "epoch": 28, + "train_loss": 1.320306241645813, + "train_acc": 0.6196, + "test_loss": 2.1034063312530518, + "test_acc": 0.4844, + "lyapunov": null, + "grad_norm": 0.9735499274270826, + "grad_max_sv": 0.3877687506377697, + "grad_min_sv": 1.8286890105835564e-08, + "grad_condition": 335682383.9298244, + "lr": 0.0009164606203550494, + "time_sec": 32.57155418395996 + }, + { + "epoch": 29, + "train_loss": 1.2960155849075317, + "train_acc": 0.6256, + "test_loss": 2.1984372549057007, + "test_acc": 0.4692, + "lyapunov": null, + "grad_norm": 0.9613960934578316, + "grad_max_sv": 0.3829047717154026, + "grad_min_sv": 1.7720739411974938e-08, + "grad_condition": 36256976.72962162, + "lr": 0.0009105746045668516, + "time_sec": 32.55882430076599 + }, + { + "epoch": 30, + "train_loss": 1.276566519241333, + "train_acc": 0.62918, + "test_loss": 2.3138665813446044, + "test_acc": 0.4615, + "lyapunov": null, + "grad_norm": 0.9496542327680724, + "grad_max_sv": 0.37292894124984743, + "grad_min_sv": 1.7765610841463662e-08, + "grad_condition": 48990654.53726908, + "lr": 0.0009045084971874733, + "time_sec": 32.57599472999573 + }, + { + "epoch": 31, + "train_loss": 1.2222671955871582, + "train_acc": 0.64256, + "test_loss": 2.1691656875610352, + "test_acc": 0.4809, + "lyapunov": null, + "grad_norm": 0.9328591067251968, + "grad_max_sv": 0.3668631583452225, + "grad_min_sv": 1.731717505781827e-08, + "grad_condition": 30411660.235134684, + "lr": 0.0008982649590120977, + "time_sec": 32.56551241874695 + }, + { + "epoch": 32, + "train_loss": 1.2110996068191529, + "train_acc": 0.64794, + "test_loss": 2.214646379852295, + "test_acc": 0.4829, + "lyapunov": null, + "grad_norm": 0.930727366359918, + "grad_max_sv": 0.3651597030460835, + "grad_min_sv": 1.725773807192965e-08, + "grad_condition": 25901528.27644656, + "lr": 0.0008918467286629196, + "time_sec": 32.56990313529968 + }, + { + "epoch": 33, + "train_loss": 1.1722402347946168, + "train_acc": 0.6566, + "test_loss": 2.2246903633117676, + "test_acc": 0.4846, + "lyapunov": null, + "grad_norm": 0.9124985410949377, + "grad_max_sv": 0.35901916325092315, + "grad_min_sv": 1.6734816802102536e-08, + "grad_condition": 84184024.35994068, + "lr": 0.0008852566213878943, + "time_sec": 32.58838510513306 + }, + { + "epoch": 34, + "train_loss": 1.1472361179351807, + "train_acc": 0.66254, + "test_loss": 2.1493885478973387, + "test_acc": 0.4941, + "lyapunov": null, + "grad_norm": 0.8981676912068559, + "grad_max_sv": 0.34216810315847396, + "grad_min_sv": 1.6077876746622975e-08, + "grad_condition": 36468768.92296384, + "lr": 0.000878497527825878, + "time_sec": 32.57939434051514 + }, + { + "epoch": 35, + "train_loss": 1.1205655740356446, + "train_acc": 0.66956, + "test_loss": 2.163042925453186, + "test_acc": 0.4954, + "lyapunov": null, + "grad_norm": 0.8860645128225066, + "grad_max_sv": 0.3396616868674755, + "grad_min_sv": 1.607423450074308e-08, + "grad_condition": 144981538.90034992, + "lr": 0.000871572412738697, + "time_sec": 32.57995939254761 + }, + { + "epoch": 36, + "train_loss": 1.1019499723815918, + "train_acc": 0.67338, + "test_loss": 2.1101196655273435, + "test_acc": 0.508, + "lyapunov": null, + "grad_norm": 0.8837215741761234, + "grad_max_sv": 0.3453404136002064, + "grad_min_sv": 1.6300073393815674e-08, + "grad_condition": 39609134.3745661, + "lr": 0.0008644843137107055, + "time_sec": 32.610419511795044 + }, + { + "epoch": 37, + "train_loss": 1.0685892918777466, + "train_acc": 0.68264, + "test_loss": 2.166209588623047, + "test_acc": 0.5007, + "lyapunov": null, + "grad_norm": 0.8688858809651051, + "grad_max_sv": 0.3433241851627827, + "grad_min_sv": 1.6007609650054573e-08, + "grad_condition": 775786281.5340235, + "lr": 0.0008572363398164014, + "time_sec": 32.565879583358765 + }, + { + "epoch": 38, + "train_loss": 1.0574775017929077, + "train_acc": 0.68396, + "test_loss": 2.222346786689758, + "test_acc": 0.5, + "lyapunov": null, + "grad_norm": 0.8639145605396845, + "grad_max_sv": 0.3388586565852165, + "grad_min_sv": 1.583358475998331e-08, + "grad_condition": 34039562.91252621, + "lr": 0.0008498316702566826, + "time_sec": 32.57612729072571 + }, + { + "epoch": 39, + "train_loss": 1.0226109420394898, + "train_acc": 0.69532, + "test_loss": 2.190898861312866, + "test_acc": 0.502, + "lyapunov": null, + "grad_norm": 0.8542002974927076, + "grad_max_sv": 0.3443542592227459, + "grad_min_sv": 1.5959563168244095e-08, + "grad_condition": 59986387.77119949, + "lr": 0.0008422735529643442, + "time_sec": 32.57960486412048 + }, + { + "epoch": 40, + "train_loss": 1.0001259584808349, + "train_acc": 0.70102, + "test_loss": 2.25260383605957, + "test_acc": 0.4998, + "lyapunov": null, + "grad_norm": 0.8465843258509351, + "grad_max_sv": 0.33337946608662605, + "grad_min_sv": 1.5467166557259216e-08, + "grad_condition": 37113133.49315401, + "lr": 0.0008345653031794289, + "time_sec": 32.61366534233093 + }, + { + "epoch": 41, + "train_loss": 0.980431226234436, + "train_acc": 0.70476, + "test_loss": 2.1930856651306154, + "test_acc": 0.5111, + "lyapunov": null, + "grad_norm": 0.8344894111462177, + "grad_max_sv": 0.3344740740954876, + "grad_min_sv": 1.5184292248560104e-08, + "grad_condition": 42849773.682712145, + "lr": 0.0008267103019950526, + "time_sec": 32.604257106781006 + }, + { + "epoch": 42, + "train_loss": 0.9617984279251098, + "train_acc": 0.71146, + "test_loss": 2.2299947700500486, + "test_acc": 0.506, + "lyapunov": null, + "grad_norm": 0.8242242603947335, + "grad_max_sv": 0.3212660253047943, + "grad_min_sv": 1.4864016899610033e-08, + "grad_condition": 73401477.5678053, + "lr": 0.0008187119948743447, + "time_sec": 32.6293363571167 + }, + { + "epoch": 43, + "train_loss": 0.9384816081619263, + "train_acc": 0.71576, + "test_loss": 2.1490371479034422, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.8237477937232076, + "grad_max_sv": 0.3244126185774803, + "grad_min_sv": 1.494453279390906e-08, + "grad_condition": 58033299.26618519, + "lr": 0.000810573890139155, + "time_sec": 32.59305548667908 + }, + { + "epoch": 44, + "train_loss": 0.9152639833831787, + "train_acc": 0.72254, + "test_loss": 2.227645333480835, + "test_acc": 0.515, + "lyapunov": null, + "grad_norm": 0.8114307246954692, + "grad_max_sv": 0.32891099974513055, + "grad_min_sv": 1.470089587857909e-08, + "grad_condition": 187882457.4560508, + "lr": 0.0008022995574311873, + "time_sec": 32.56365776062012 + }, + { + "epoch": 45, + "train_loss": 0.8937730826950073, + "train_acc": 0.72926, + "test_loss": 2.257075512313843, + "test_acc": 0.5171, + "lyapunov": null, + "grad_norm": 0.7991066773444042, + "grad_max_sv": 0.310314255207777, + "grad_min_sv": 1.442440034638004e-08, + "grad_condition": 67545918.8595486, + "lr": 0.0007938926261462363, + "time_sec": 32.56998062133789 + }, + { + "epoch": 46, + "train_loss": 0.8821200103569031, + "train_acc": 0.73168, + "test_loss": 2.312848774147034, + "test_acc": 0.5052, + "lyapunov": null, + "grad_norm": 0.7987404367629951, + "grad_max_sv": 0.31381460800766947, + "grad_min_sv": 1.427665476706752e-08, + "grad_condition": 147171178.65022224, + "lr": 0.0007853567838422158, + "time_sec": 32.57842302322388 + }, + { + "epoch": 47, + "train_loss": 0.8545298266983032, + "train_acc": 0.73686, + "test_loss": 2.2923807540893555, + "test_acc": 0.5057, + "lyapunov": null, + "grad_norm": 0.7859231581178334, + "grad_max_sv": 0.31694323718547823, + "grad_min_sv": 1.4505229091466009e-08, + "grad_condition": 93313806.69758794, + "lr": 0.0007766957746216719, + "time_sec": 32.56472444534302 + }, + { + "epoch": 48, + "train_loss": 0.8375117244720459, + "train_acc": 0.74296, + "test_loss": 2.350985548019409, + "test_acc": 0.5065, + "lyapunov": null, + "grad_norm": 0.7733144016514287, + "grad_max_sv": 0.31536148227751254, + "grad_min_sv": 1.3926250694989983e-08, + "grad_condition": 138817686.6846688, + "lr": 0.0007679133974894982, + "time_sec": 32.562721490859985 + }, + { + "epoch": 49, + "train_loss": 0.8223947568511963, + "train_acc": 0.74656, + "test_loss": 2.268610196495056, + "test_acc": 0.509, + "lyapunov": null, + "grad_norm": 0.7708191932209156, + "grad_max_sv": 0.3082855362445116, + "grad_min_sv": 1.424878183428624e-08, + "grad_condition": 48064293.176824205, + "lr": 0.000759013504686565, + "time_sec": 32.59068489074707 + }, + { + "epoch": 50, + "train_loss": 0.8102355616569519, + "train_acc": 0.75154, + "test_loss": 2.303807855987549, + "test_acc": 0.5172, + "lyapunov": null, + "grad_norm": 0.7678857639968419, + "grad_max_sv": 0.30606309957802297, + "grad_min_sv": 1.401376939977328e-08, + "grad_condition": 66554378.026006415, + "lr": 0.0007499999999999998, + "time_sec": 32.61594772338867 + }, + { + "epoch": 51, + "train_loss": 0.7894559608268737, + "train_acc": 0.75788, + "test_loss": 2.3806381210327148, + "test_acc": 0.5067, + "lyapunov": null, + "grad_norm": 0.7578995070890107, + "grad_max_sv": 0.2958958923816681, + "grad_min_sv": 1.3479759735507413e-08, + "grad_condition": 59071539.288179755, + "lr": 0.0007408768370508575, + "time_sec": 32.58355736732483 + }, + { + "epoch": 52, + "train_loss": 0.7807610025405883, + "train_acc": 0.7587, + "test_loss": 2.335085013961792, + "test_acc": 0.5175, + "lyapunov": null, + "grad_norm": 0.7536291786486181, + "grad_max_sv": 0.3058082439005375, + "grad_min_sv": 1.4062500508851828e-08, + "grad_condition": 89488373.11429313, + "lr": 0.0007316480175599307, + "time_sec": 32.58504581451416 + }, + { + "epoch": 53, + "train_loss": 0.7639712882995605, + "train_acc": 0.76632, + "test_loss": 2.2413758136749267, + "test_acc": 0.529, + "lyapunov": null, + "grad_norm": 0.7437671807956605, + "grad_max_sv": 0.2986128095537424, + "grad_min_sv": 1.3716437835195604e-08, + "grad_condition": 153765004.26652625, + "lr": 0.0007223175895924635, + "time_sec": 32.599562883377075 + }, + { + "epoch": 54, + "train_loss": 0.7342572978401184, + "train_acc": 0.77172, + "test_loss": 2.3813604881286623, + "test_acc": 0.5211, + "lyapunov": null, + "grad_norm": 0.7415334115465683, + "grad_max_sv": 0.2952877823263407, + "grad_min_sv": 1.3237078199702934e-08, + "grad_condition": 158912190.85988137, + "lr": 0.0007128896457825361, + "time_sec": 32.58093762397766 + }, + { + "epoch": 55, + "train_loss": 0.7243311285591125, + "train_acc": 0.77394, + "test_loss": 2.5364841087341308, + "test_acc": 0.4919, + "lyapunov": null, + "grad_norm": 0.7336077653545635, + "grad_max_sv": 0.30250501483678816, + "grad_min_sv": 1.3610404020827915e-08, + "grad_condition": 80425531.55629282, + "lr": 0.0007033683215378998, + "time_sec": 32.64418268203735 + }, + { + "epoch": 56, + "train_loss": 0.7082911996078491, + "train_acc": 0.77956, + "test_loss": 2.494243837738037, + "test_acc": 0.5119, + "lyapunov": null, + "grad_norm": 0.7290174142670145, + "grad_max_sv": 0.2945553746074438, + "grad_min_sv": 1.3041360513894872e-08, + "grad_condition": 131633091.2577754, + "lr": 0.0006937577932260512, + "time_sec": 32.61989617347717 + }, + { + "epoch": 57, + "train_loss": 0.6861382236289978, + "train_acc": 0.7852, + "test_loss": 2.4704931076049803, + "test_acc": 0.518, + "lyapunov": null, + "grad_norm": 0.7189100733167055, + "grad_max_sv": 0.2928345203399658, + "grad_min_sv": 1.3202054537260477e-08, + "grad_condition": 122301802.04377504, + "lr": 0.0006840622763423388, + "time_sec": 32.601600885391235 + }, + { + "epoch": 58, + "train_loss": 0.6700656919956207, + "train_acc": 0.79076, + "test_loss": 2.505882039642334, + "test_acc": 0.5131, + "lyapunov": null, + "grad_norm": 0.7086978020515203, + "grad_max_sv": 0.28342925757169724, + "grad_min_sv": 1.2833174680912385e-08, + "grad_condition": 67698817.82937825, + "lr": 0.0006742860236609073, + "time_sec": 32.58192586898804 + }, + { + "epoch": 59, + "train_loss": 0.6577284108161926, + "train_acc": 0.79492, + "test_loss": 2.491006435775757, + "test_acc": 0.5155, + "lyapunov": null, + "grad_norm": 0.7069652566379913, + "grad_max_sv": 0.2849778015166521, + "grad_min_sv": 1.2662411319475097e-08, + "grad_condition": 54369902.95066987, + "lr": 0.0006644333233692913, + "time_sec": 32.601956605911255 + }, + { + "epoch": 60, + "train_loss": 0.6429468762397766, + "train_acc": 0.7985, + "test_loss": 2.4342385992050173, + "test_acc": 0.5281, + "lyapunov": null, + "grad_norm": 0.6950269523418225, + "grad_max_sv": 0.2759479142725468, + "grad_min_sv": 1.2526198570604087e-08, + "grad_condition": 1003668275.7453331, + "lr": 0.0006545084971874734, + "time_sec": 32.593979835510254 + }, + { + "epoch": 61, + "train_loss": 0.6316694467926025, + "train_acc": 0.80204, + "test_loss": 2.572236448669434, + "test_acc": 0.5228, + "lyapunov": null, + "grad_norm": 0.6953930381951806, + "grad_max_sv": 0.2823780722916126, + "grad_min_sv": 1.2607634538338957e-08, + "grad_condition": 910241325.2806966, + "lr": 0.0006445158984722354, + "time_sec": 32.63531136512756 + }, + { + "epoch": 62, + "train_loss": 0.6084016784477234, + "train_acc": 0.80756, + "test_loss": 2.528528450965881, + "test_acc": 0.5249, + "lyapunov": null, + "grad_norm": 0.6902039343361056, + "grad_max_sv": 0.2754691679030657, + "grad_min_sv": 1.2385301192095743e-08, + "grad_condition": 124171966.43343556, + "lr": 0.0006344599103076324, + "time_sec": 32.646347761154175 + }, + { + "epoch": 63, + "train_loss": 0.6006980142784119, + "train_acc": 0.81018, + "test_loss": 2.438706118583679, + "test_acc": 0.5266, + "lyapunov": null, + "grad_norm": 0.6822637884805373, + "grad_max_sv": 0.276136140525341, + "grad_min_sv": 1.2456568440621928e-08, + "grad_condition": 41258405.402897015, + "lr": 0.0006243449435824269, + "time_sec": 32.60796880722046 + }, + { + "epoch": 64, + "train_loss": 0.585920947380066, + "train_acc": 0.81566, + "test_loss": 2.505697784423828, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.6743129224923755, + "grad_max_sv": 0.26691033616662024, + "grad_min_sv": 1.2091218234630552e-08, + "grad_condition": 57195642.756296314, + "lr": 0.0006141754350553275, + "time_sec": 32.621875286102295 + }, + { + "epoch": 65, + "train_loss": 0.5716569157028198, + "train_acc": 0.81832, + "test_loss": 2.488600128173828, + "test_acc": 0.5221, + "lyapunov": null, + "grad_norm": 0.6747582168048405, + "grad_max_sv": 0.2778852738440037, + "grad_min_sv": 1.2316326589503767e-08, + "grad_condition": 66617009.51688242, + "lr": 0.0006039558454088793, + "time_sec": 32.58805871009827 + }, + { + "epoch": 66, + "train_loss": 0.5558187670326233, + "train_acc": 0.82442, + "test_loss": 2.455172736740112, + "test_acc": 0.5327, + "lyapunov": null, + "grad_norm": 0.6650651562580321, + "grad_max_sv": 0.27054035626351836, + "grad_min_sv": 1.1980440989180913e-08, + "grad_condition": 263553333.63889045, + "lr": 0.000593690657292862, + "time_sec": 32.61953616142273 + }, + { + "epoch": 67, + "train_loss": 0.5372648673820496, + "train_acc": 0.82802, + "test_loss": 2.5111166515350343, + "test_acc": 0.5259, + "lyapunov": null, + "grad_norm": 0.6598459109898526, + "grad_max_sv": 0.26995205879211426, + "grad_min_sv": 1.1711705713568498e-08, + "grad_condition": 40680262.666348636, + "lr": 0.0005833843733580507, + "time_sec": 32.596007108688354 + }, + { + "epoch": 68, + "train_loss": 0.529928300704956, + "train_acc": 0.83184, + "test_loss": 2.505376844024658, + "test_acc": 0.5324, + "lyapunov": null, + "grad_norm": 0.6554247710983278, + "grad_max_sv": 0.2640453014522791, + "grad_min_sv": 1.16465385096437e-08, + "grad_condition": 196611022.55457097, + "lr": 0.0005730415142812054, + "time_sec": 32.589977502822876 + }, + { + "epoch": 69, + "train_loss": 0.5270337955570221, + "train_acc": 0.83232, + "test_loss": 2.6256065521240233, + "test_acc": 0.5197, + "lyapunov": null, + "grad_norm": 0.6567252289857295, + "grad_max_sv": 0.2711860008537769, + "grad_min_sv": 1.1960956241034368e-08, + "grad_condition": 561898784.4199932, + "lr": 0.0005626666167821517, + "time_sec": 32.5863139629364 + }, + { + "epoch": 70, + "train_loss": 0.5109112097549439, + "train_acc": 0.8354, + "test_loss": 2.5708269050598145, + "test_acc": 0.5302, + "lyapunov": null, + "grad_norm": 0.646381173102848, + "grad_max_sv": 0.27013656310737133, + "grad_min_sv": 1.1766451666391648e-08, + "grad_condition": 259686356.85246676, + "lr": 0.0005522642316338265, + "time_sec": 32.601078033447266 + }, + { + "epoch": 71, + "train_loss": 0.49452698835372927, + "train_acc": 0.84226, + "test_loss": 2.5480498626708985, + "test_acc": 0.5341, + "lyapunov": null, + "grad_norm": 0.6360062848670928, + "grad_max_sv": 0.26699192114174364, + "grad_min_sv": 1.1295523278341807e-08, + "grad_condition": 5391854944.622183, + "lr": 0.0005418389216661573, + "time_sec": 32.60187101364136 + }, + { + "epoch": 72, + "train_loss": 0.48291658142089844, + "train_acc": 0.84586, + "test_loss": 2.659250145339966, + "test_acc": 0.5273, + "lyapunov": null, + "grad_norm": 0.6354901528331942, + "grad_max_sv": 0.26031049638986586, + "grad_min_sv": 1.1230092526043345e-08, + "grad_condition": 88239876.70399968, + "lr": 0.0005313952597646563, + "time_sec": 32.61269569396973 + }, + { + "epoch": 73, + "train_loss": 0.4778318354034424, + "train_acc": 0.8473, + "test_loss": 2.5874798002243042, + "test_acc": 0.5314, + "lyapunov": null, + "grad_norm": 0.6300098949086598, + "grad_max_sv": 0.26232460178434847, + "grad_min_sv": 1.134239846749957e-08, + "grad_condition": 105944680.31289935, + "lr": 0.0005209378268645994, + "time_sec": 32.613691091537476 + }, + { + "epoch": 74, + "train_loss": 0.46288997037887575, + "train_acc": 0.85288, + "test_loss": 2.5993505474090575, + "test_acc": 0.5337, + "lyapunov": null, + "grad_norm": 0.6215157272690962, + "grad_max_sv": 0.26828358359634874, + "grad_min_sv": 1.1235708100021391e-08, + "grad_condition": 41868662.72964181, + "lr": 0.0005104712099416781, + "time_sec": 32.61982536315918 + }, + { + "epoch": 75, + "train_loss": 0.45871317274093626, + "train_acc": 0.85266, + "test_loss": 2.6259676776885987, + "test_acc": 0.5345, + "lyapunov": null, + "grad_norm": 0.6170925610226076, + "grad_max_sv": 0.2573466833680868, + "grad_min_sv": 1.104757565784445e-08, + "grad_condition": 212140699.82071534, + "lr": 0.0004999999999999996, + "time_sec": 32.598039627075195 + }, + { + "epoch": 76, + "train_loss": 0.45109452469825745, + "train_acc": 0.85454, + "test_loss": 2.665439921569824, + "test_acc": 0.5303, + "lyapunov": null, + "grad_norm": 0.6161744946755234, + "grad_max_sv": 0.25873752422630786, + "grad_min_sv": 1.1002691283393782e-08, + "grad_condition": 1052469961.0162939, + "lr": 0.0004895287900583212, + "time_sec": 32.58305859565735 + }, + { + "epoch": 77, + "train_loss": 0.43257994356155394, + "train_acc": 0.86046, + "test_loss": 2.702251711654663, + "test_acc": 0.526, + "lyapunov": null, + "grad_norm": 0.607726688787837, + "grad_max_sv": 0.26136815659701823, + "grad_min_sv": 1.0734200759157653e-08, + "grad_condition": 189329156.27802238, + "lr": 0.0004790621731353997, + "time_sec": 32.59784960746765 + }, + { + "epoch": 78, + "train_loss": 0.41896025703430173, + "train_acc": 0.86472, + "test_loss": 2.671762952804565, + "test_acc": 0.5336, + "lyapunov": null, + "grad_norm": 0.5957655893318665, + "grad_max_sv": 0.2534705221652985, + "grad_min_sv": 1.0711852985699488e-08, + "grad_condition": 191261118.43217826, + "lr": 0.000468604740235343, + "time_sec": 32.62303113937378 + }, + { + "epoch": 79, + "train_loss": 0.40766072305679324, + "train_acc": 0.86786, + "test_loss": 2.584160025596619, + "test_acc": 0.5417, + "lyapunov": null, + "grad_norm": 0.5933439762516267, + "grad_max_sv": 0.2529820345342159, + "grad_min_sv": 1.1027942445340776e-08, + "grad_condition": 38680465.32555069, + "lr": 0.00045816107833384175, + "time_sec": 32.64057159423828 + }, + { + "epoch": 80, + "train_loss": 0.395585339012146, + "train_acc": 0.8719, + "test_loss": 2.6836016262054443, + "test_acc": 0.5338, + "lyapunov": null, + "grad_norm": 0.5915283577904045, + "grad_max_sv": 0.2511633686721325, + "grad_min_sv": 1.074133903124913e-08, + "grad_condition": 579600714.0219278, + "lr": 0.0004477357683661729, + "time_sec": 32.63526272773743 + }, + { + "epoch": 81, + "train_loss": 0.39450348417282105, + "train_acc": 0.87178, + "test_loss": 2.5824236192703247, + "test_acc": 0.5448, + "lyapunov": null, + "grad_norm": 0.5885071131780099, + "grad_max_sv": 0.25625271871685984, + "grad_min_sv": 1.0501880514518502e-08, + "grad_condition": 124784334.66343915, + "lr": 0.00043733338321784746, + "time_sec": 32.604066610336304 + }, + { + "epoch": 82, + "train_loss": 0.3872408880805969, + "train_acc": 0.87422, + "test_loss": 2.6602687486648557, + "test_acc": 0.5352, + "lyapunov": null, + "grad_norm": 0.5833408041873426, + "grad_max_sv": 0.2544650699943304, + "grad_min_sv": 1.0623962720494873e-08, + "grad_condition": 134511278.94006854, + "lr": 0.0004269584857187939, + "time_sec": 32.63341236114502 + }, + { + "epoch": 83, + "train_loss": 0.3692175518798828, + "train_acc": 0.8823, + "test_loss": 2.6812981620788574, + "test_acc": 0.5354, + "lyapunov": null, + "grad_norm": 0.571242006609448, + "grad_max_sv": 0.2509057328104973, + "grad_min_sv": 1.0469137029164855e-08, + "grad_condition": 133735555.98911181, + "lr": 0.0004166156266419484, + "time_sec": 32.600364685058594 + }, + { + "epoch": 84, + "train_loss": 0.36960686668396, + "train_acc": 0.8806, + "test_loss": 2.6419603324890137, + "test_acc": 0.5453, + "lyapunov": null, + "grad_norm": 0.5733982210439359, + "grad_max_sv": 0.25141631327569486, + "grad_min_sv": 1.0406415923511908e-08, + "grad_condition": 126933629.16775417, + "lr": 0.0004063093427071373, + "time_sec": 32.60528612136841 + }, + { + "epoch": 85, + "train_loss": 0.3596297464942932, + "train_acc": 0.88366, + "test_loss": 2.716620068740845, + "test_acc": 0.5395, + "lyapunov": null, + "grad_norm": 0.5676461114412606, + "grad_max_sv": 0.24900777079164982, + "grad_min_sv": 1.0182381811286654e-08, + "grad_condition": 508099869.8504903, + "lr": 0.0003960441545911199, + "time_sec": 32.61734056472778 + }, + { + "epoch": 86, + "train_loss": 0.3471255212688446, + "train_acc": 0.88682, + "test_loss": 2.6910045627593995, + "test_acc": 0.5395, + "lyapunov": null, + "grad_norm": 0.5548265984779118, + "grad_max_sv": 0.23751378245651722, + "grad_min_sv": 9.806933828904186e-09, + "grad_condition": 127564160.08711353, + "lr": 0.0003858245649446718, + "time_sec": 32.59777784347534 + }, + { + "epoch": 87, + "train_loss": 0.3406936288833618, + "train_acc": 0.8891, + "test_loss": 2.744849885940552, + "test_acc": 0.5429, + "lyapunov": null, + "grad_norm": 0.5555218429462011, + "grad_max_sv": 0.2389649160206318, + "grad_min_sv": 9.80964975061914e-09, + "grad_condition": 889623886.9749553, + "lr": 0.00037565505641757235, + "time_sec": 32.603169679641724 + }, + { + "epoch": 88, + "train_loss": 0.332358439912796, + "train_acc": 0.89152, + "test_loss": 2.7001221378326417, + "test_acc": 0.5481, + "lyapunov": null, + "grad_norm": 0.550628932039783, + "grad_max_sv": 0.24251497723162174, + "grad_min_sv": 9.773675100493983e-09, + "grad_condition": 85698012.51102474, + "lr": 0.00036554008969236695, + "time_sec": 32.60269355773926 + }, + { + "epoch": 89, + "train_loss": 0.31770461375236514, + "train_acc": 0.89674, + "test_loss": 2.826695262527466, + "test_acc": 0.5359, + "lyapunov": null, + "grad_norm": 0.5452633910908743, + "grad_max_sv": 0.2457874234765768, + "grad_min_sv": 1.0011228396625271e-08, + "grad_condition": 115516500.1980664, + "lr": 0.0003554841015277638, + "time_sec": 32.615172147750854 + }, + { + "epoch": 90, + "train_loss": 0.3198126357555389, + "train_acc": 0.89686, + "test_loss": 2.761284243011475, + "test_acc": 0.5383, + "lyapunov": null, + "grad_norm": 0.5420260505535877, + "grad_max_sv": 0.2379120856523514, + "grad_min_sv": 9.806707615064857e-09, + "grad_condition": 292496720.3714178, + "lr": 0.000345491502812526, + "time_sec": 32.60730767250061 + }, + { + "epoch": 91, + "train_loss": 0.31583098639965057, + "train_acc": 0.89624, + "test_loss": 2.798471709060669, + "test_acc": 0.5389, + "lyapunov": null, + "grad_norm": 0.541688273995152, + "grad_max_sv": 0.2411293275654316, + "grad_min_sv": 9.842002349441745e-09, + "grad_condition": 859517900.635659, + "lr": 0.0003355666766307081, + "time_sec": 32.59173631668091 + }, + { + "epoch": 92, + "train_loss": 0.30620651626586914, + "train_acc": 0.89982, + "test_loss": 2.8147284172058105, + "test_acc": 0.5372, + "lyapunov": null, + "grad_norm": 0.534845986324325, + "grad_max_sv": 0.2446113031357527, + "grad_min_sv": 9.80392773058253e-09, + "grad_condition": 318006434.8637026, + "lr": 0.00032571397633909225, + "time_sec": 32.625818729400635 + }, + { + "epoch": 93, + "train_loss": 0.2942564325428009, + "train_acc": 0.9027, + "test_loss": 2.7974524646759034, + "test_acc": 0.5458, + "lyapunov": null, + "grad_norm": 0.5258623807030809, + "grad_max_sv": 0.23323353454470636, + "grad_min_sv": 9.338492477830445e-09, + "grad_condition": 179043441.62085792, + "lr": 0.00031593772365766094, + "time_sec": 32.64636468887329 + }, + { + "epoch": 94, + "train_loss": 0.29325305396080015, + "train_acc": 0.90696, + "test_loss": 2.7924257678985596, + "test_acc": 0.5399, + "lyapunov": null, + "grad_norm": 0.5223436049599501, + "grad_max_sv": 0.23972665779292585, + "grad_min_sv": 9.572742014005153e-09, + "grad_condition": 829147220.8115915, + "lr": 0.0003062422067739483, + "time_sec": 32.63534426689148 + }, + { + "epoch": 95, + "train_loss": 0.2819689624214172, + "train_acc": 0.90976, + "test_loss": 2.925028160858154, + "test_acc": 0.5349, + "lyapunov": null, + "grad_norm": 0.5142202374019095, + "grad_max_sv": 0.2272823579609394, + "grad_min_sv": 9.26979293529133e-09, + "grad_condition": 746493228.5809206, + "lr": 0.00029663167846209965, + "time_sec": 32.632474184036255 + }, + { + "epoch": 96, + "train_loss": 0.2815214267730713, + "train_acc": 0.90818, + "test_loss": 2.834438822937012, + "test_acc": 0.5361, + "lyapunov": null, + "grad_norm": 0.5120345521537165, + "grad_max_sv": 0.23016531057655812, + "grad_min_sv": 9.260385527062182e-09, + "grad_condition": 233123428.8839547, + "lr": 0.00028711035421746345, + "time_sec": 32.61351776123047 + }, + { + "epoch": 97, + "train_loss": 0.2686532742404938, + "train_acc": 0.91288, + "test_loss": 2.7868608379364015, + "test_acc": 0.5454, + "lyapunov": null, + "grad_norm": 0.50888083523268, + "grad_max_sv": 0.23386715427041055, + "grad_min_sv": 9.24353042355136e-09, + "grad_condition": 480824699.4459009, + "lr": 0.00027768241040753615, + "time_sec": 32.597689628601074 + }, + { + "epoch": 98, + "train_loss": 0.26857261137008664, + "train_acc": 0.9114, + "test_loss": 2.8518635543823243, + "test_acc": 0.5437, + "lyapunov": null, + "grad_norm": 0.5090536597227022, + "grad_max_sv": 0.22117703258991242, + "grad_min_sv": 8.954814682826662e-09, + "grad_condition": 523046386.34619534, + "lr": 0.00026835198244006903, + "time_sec": 32.608073472976685 + }, + { + "epoch": 99, + "train_loss": 0.25366373962402344, + "train_acc": 0.91882, + "test_loss": 2.8721565658569337, + "test_acc": 0.543, + "lyapunov": null, + "grad_norm": 0.49238261306821557, + "grad_max_sv": 0.2156506847590208, + "grad_min_sv": 8.781873435826509e-09, + "grad_condition": 904102693.0135263, + "lr": 0.0002591231629491421, + "time_sec": 32.61784863471985 + }, + { + "epoch": 100, + "train_loss": 0.24887621872901916, + "train_acc": 0.91974, + "test_loss": 2.921920951461792, + "test_acc": 0.5361, + "lyapunov": null, + "grad_norm": 0.4888254012066189, + "grad_max_sv": 0.2262551225721836, + "grad_min_sv": 9.07711106217608e-09, + "grad_condition": 2378158119.157684, + "lr": 0.0002499999999999997, + "time_sec": 32.63064646720886 + }, + { + "epoch": 101, + "train_loss": 0.2486992248916626, + "train_acc": 0.92078, + "test_loss": 2.84906298789978, + "test_acc": 0.546, + "lyapunov": null, + "grad_norm": 0.49044990509199843, + "grad_max_sv": 0.2249086916446686, + "grad_min_sv": 8.942711630455583e-09, + "grad_condition": 368518315.458243, + "lr": 0.00024098649531343477, + "time_sec": 32.61569309234619 + }, + { + "epoch": 102, + "train_loss": 0.24084433520317078, + "train_acc": 0.92134, + "test_loss": 2.8644924999237062, + "test_acc": 0.5466, + "lyapunov": null, + "grad_norm": 0.4835634789382412, + "grad_max_sv": 0.22181024961173534, + "grad_min_sv": 8.71543736290746e-09, + "grad_condition": 729146084.7030591, + "lr": 0.0002320866025105016, + "time_sec": 32.61780500411987 + }, + { + "epoch": 103, + "train_loss": 0.23572091526031494, + "train_acc": 0.9245, + "test_loss": 2.8849633934020997, + "test_acc": 0.5462, + "lyapunov": null, + "grad_norm": 0.47616360717681877, + "grad_max_sv": 0.21196404211223124, + "grad_min_sv": 8.353945581216632e-09, + "grad_condition": 474656759.6437806, + "lr": 0.0002233042253783278, + "time_sec": 32.613890647888184 + }, + { + "epoch": 104, + "train_loss": 0.2249231512260437, + "train_acc": 0.92648, + "test_loss": 2.9231421543121336, + "test_acc": 0.5417, + "lyapunov": null, + "grad_norm": 0.47192872655679174, + "grad_max_sv": 0.214255590736866, + "grad_min_sv": 8.505988313570536e-09, + "grad_condition": 289197672.1924402, + "lr": 0.000214643216157784, + "time_sec": 32.601218938827515 + }, + { + "epoch": 105, + "train_loss": 0.22248219745159148, + "train_acc": 0.9281, + "test_loss": 2.9562902782440186, + "test_acc": 0.5427, + "lyapunov": null, + "grad_norm": 0.4698308403081668, + "grad_max_sv": 0.22572967931628227, + "grad_min_sv": 8.526192928743314e-09, + "grad_condition": 1450261253.9932175, + "lr": 0.00020610737385376332, + "time_sec": 32.612290382385254 + }, + { + "epoch": 106, + "train_loss": 0.21623054056167604, + "train_acc": 0.92962, + "test_loss": 2.908762315750122, + "test_acc": 0.5446, + "lyapunov": null, + "grad_norm": 0.46340711985172833, + "grad_max_sv": 0.21638907827436923, + "grad_min_sv": 8.416883249314638e-09, + "grad_condition": 255468039.70825052, + "lr": 0.00019770044256881242, + "time_sec": 32.612945318222046 + }, + { + "epoch": 107, + "train_loss": 0.21244655453205108, + "train_acc": 0.93246, + "test_loss": 2.974463511657715, + "test_acc": 0.5384, + "lyapunov": null, + "grad_norm": 0.4594548274355528, + "grad_max_sv": 0.22012278363108634, + "grad_min_sv": 8.49774636952922e-09, + "grad_condition": 2473361556.8977194, + "lr": 0.0001894261098608447, + "time_sec": 32.62226438522339 + }, + { + "epoch": 108, + "train_loss": 0.2094324759197235, + "train_acc": 0.93186, + "test_loss": 2.8919307563781738, + "test_acc": 0.5468, + "lyapunov": null, + "grad_norm": 0.4576154748028718, + "grad_max_sv": 0.2116704247891903, + "grad_min_sv": 8.391172841922153e-09, + "grad_condition": 466352424.25916034, + "lr": 0.000181288005125655, + "time_sec": 32.6186683177948 + }, + { + "epoch": 109, + "train_loss": 0.20401785006046294, + "train_acc": 0.93418, + "test_loss": 2.957660815048218, + "test_acc": 0.539, + "lyapunov": null, + "grad_norm": 0.4546298422322962, + "grad_max_sv": 0.21849206127226353, + "grad_min_sv": 8.682296616380203e-09, + "grad_condition": 191940882.5588118, + "lr": 0.0001732896980049473, + "time_sec": 32.628432273864746 + }, + { + "epoch": 110, + "train_loss": 0.20467783069610596, + "train_acc": 0.9347, + "test_loss": 2.958277463912964, + "test_acc": 0.5437, + "lyapunov": null, + "grad_norm": 0.4527691780730168, + "grad_max_sv": 0.20565569326281546, + "grad_min_sv": 8.186116849185146e-09, + "grad_condition": 362737702.71097183, + "lr": 0.00016543469682057076, + "time_sec": 32.61425018310547 + }, + { + "epoch": 111, + "train_loss": 0.1963657117843628, + "train_acc": 0.93738, + "test_loss": 2.912566703796387, + "test_acc": 0.5453, + "lyapunov": null, + "grad_norm": 0.4442740357567778, + "grad_max_sv": 0.20528529062867165, + "grad_min_sv": 7.897949131502324e-09, + "grad_condition": 332879126.46642524, + "lr": 0.00015772644703565552, + "time_sec": 32.640437841415405 + }, + { + "epoch": 112, + "train_loss": 0.19529674465417862, + "train_acc": 0.93706, + "test_loss": 2.9921934005737305, + "test_acc": 0.5439, + "lyapunov": null, + "grad_norm": 0.4472859282028686, + "grad_max_sv": 0.21485005132853985, + "grad_min_sv": 8.123189853593854e-09, + "grad_condition": 1264491045.958951, + "lr": 0.00015016832974331713, + "time_sec": 32.62719178199768 + }, + { + "epoch": 113, + "train_loss": 0.19033806517124177, + "train_acc": 0.93864, + "test_loss": 2.982124820327759, + "test_acc": 0.5437, + "lyapunov": null, + "grad_norm": 0.44136667096649934, + "grad_max_sv": 0.21058676335960627, + "grad_min_sv": 8.165891918036905e-09, + "grad_condition": 312331837.29792935, + "lr": 0.00014276366018359834, + "time_sec": 32.62637948989868 + }, + { + "epoch": 114, + "train_loss": 0.1861744700717926, + "train_acc": 0.9415, + "test_loss": 2.9888067501068116, + "test_acc": 0.5439, + "lyapunov": null, + "grad_norm": 0.4352864374741274, + "grad_max_sv": 0.20403808429837228, + "grad_min_sv": 7.826812852777115e-09, + "grad_condition": 157749511.7241363, + "lr": 0.00013551568628929425, + "time_sec": 32.61394190788269 + }, + { + "epoch": 115, + "train_loss": 0.17919604228019714, + "train_acc": 0.94228, + "test_loss": 2.9267702087402343, + "test_acc": 0.5533, + "lyapunov": null, + "grad_norm": 0.4303078691865104, + "grad_max_sv": 0.21317217014729978, + "grad_min_sv": 7.932376714335499e-09, + "grad_condition": 130563128.16561177, + "lr": 0.00012842758726130276, + "time_sec": 32.59867215156555 + }, + { + "epoch": 116, + "train_loss": 0.1819922329044342, + "train_acc": 0.9421, + "test_loss": 2.9711815841674807, + "test_acc": 0.5465, + "lyapunov": null, + "grad_norm": 0.43180962461173705, + "grad_max_sv": 0.22204699292778968, + "grad_min_sv": 8.152687410540802e-09, + "grad_condition": 465179275.152493, + "lr": 0.0001215024721741218, + "time_sec": 32.63067364692688 + }, + { + "epoch": 117, + "train_loss": 0.1775187094783783, + "train_acc": 0.94306, + "test_loss": 2.9692884788513183, + "test_acc": 0.5485, + "lyapunov": null, + "grad_norm": 0.42535422696695824, + "grad_max_sv": 0.20696271434426308, + "grad_min_sv": 7.841850190731802e-09, + "grad_condition": 340204799.15066475, + "lr": 0.00011474337861210538, + "time_sec": 32.682225465774536 + }, + { + "epoch": 118, + "train_loss": 0.1782768397474289, + "train_acc": 0.94228, + "test_loss": 2.9190274017333984, + "test_acc": 0.5529, + "lyapunov": null, + "grad_norm": 0.4288690474100953, + "grad_max_sv": 0.20459303073585033, + "grad_min_sv": 7.852907129212925e-09, + "grad_condition": 413565999.92345744, + "lr": 0.00010815327133708009, + "time_sec": 32.6104941368103 + }, + { + "epoch": 119, + "train_loss": 0.17245361244678498, + "train_acc": 0.94452, + "test_loss": 2.9115855850219727, + "test_acc": 0.5518, + "lyapunov": null, + "grad_norm": 0.42115534183071457, + "grad_max_sv": 0.20364198610186576, + "grad_min_sv": 7.842290997188895e-09, + "grad_condition": 4300198879.021836, + "lr": 0.00010173504098790182, + "time_sec": 32.599159479141235 + }, + { + "epoch": 120, + "train_loss": 0.16841998175621034, + "train_acc": 0.9465, + "test_loss": 2.9750044021606445, + "test_acc": 0.5509, + "lyapunov": null, + "grad_norm": 0.4139970919760924, + "grad_max_sv": 0.21118448078632354, + "grad_min_sv": 7.870022611139622e-09, + "grad_condition": 588234398.5889165, + "lr": 9.549150281252629e-05, + "time_sec": 32.60773468017578 + }, + { + "epoch": 121, + "train_loss": 0.1674146131658554, + "train_acc": 0.94722, + "test_loss": 3.043567562866211, + "test_acc": 0.5401, + "lyapunov": null, + "grad_norm": 0.4140688259905283, + "grad_max_sv": 0.19524961337447166, + "grad_min_sv": 7.740067117572789e-09, + "grad_condition": 294042234.42343616, + "lr": 8.942539543314794e-05, + "time_sec": 32.605161905288696 + }, + { + "epoch": 122, + "train_loss": 0.16243593076705934, + "train_acc": 0.94846, + "test_loss": 2.929161159515381, + "test_acc": 0.5544, + "lyapunov": null, + "grad_norm": 0.4069435316400916, + "grad_max_sv": 0.1928358545526862, + "grad_min_sv": 7.721300553786966e-09, + "grad_condition": 1492464032.2227066, + "lr": 8.353937964495024e-05, + "time_sec": 32.641791105270386 + }, + { + "epoch": 123, + "train_loss": 0.1584806259393692, + "train_acc": 0.94938, + "test_loss": 3.1013183868408203, + "test_acc": 0.5441, + "lyapunov": null, + "grad_norm": 0.4074794428211969, + "grad_max_sv": 0.19953589588403703, + "grad_min_sv": 7.50950879795792e-09, + "grad_condition": 963926565.1466379, + "lr": 7.783603724899243e-05, + "time_sec": 32.63674283027649 + }, + { + "epoch": 124, + "train_loss": 0.15840048369407653, + "train_acc": 0.9494, + "test_loss": 3.02653837890625, + "test_acc": 0.5519, + "lyapunov": null, + "grad_norm": 0.4076422491058348, + "grad_max_sv": 0.2066960282623768, + "grad_min_sv": 7.477964763082447e-09, + "grad_condition": 442993334.53740203, + "lr": 7.231786991974666e-05, + "time_sec": 32.61531352996826 + }, + { + "epoch": 125, + "train_loss": 0.15796427134990693, + "train_acc": 0.9492, + "test_loss": 3.0291555103302, + "test_acc": 0.547, + "lyapunov": null, + "grad_norm": 0.4074327913561712, + "grad_max_sv": 0.20506599061191083, + "grad_min_sv": 7.742264148888345e-09, + "grad_condition": 174320401.78922492, + "lr": 6.698729810778072e-05, + "time_sec": 32.616377115249634 + }, + { + "epoch": 126, + "train_loss": 0.15587055792808532, + "train_acc": 0.94994, + "test_loss": 3.0593951934814454, + "test_acc": 0.5475, + "lyapunov": null, + "grad_norm": 0.40499205379602254, + "grad_max_sv": 0.20328918769955634, + "grad_min_sv": 7.676706426616719e-09, + "grad_condition": 1609865519.3051925, + "lr": 6.184665997806817e-05, + "time_sec": 32.61218738555908 + }, + { + "epoch": 127, + "train_loss": 0.1515829546546936, + "train_acc": 0.95164, + "test_loss": 2.997521667098999, + "test_acc": 0.5527, + "lyapunov": null, + "grad_norm": 0.3980720784578974, + "grad_max_sv": 0.20609603635966778, + "grad_min_sv": 7.607568789811877e-09, + "grad_condition": 467148050.5049923, + "lr": 5.6898210384392595e-05, + "time_sec": 32.59871435165405 + }, + { + "epoch": 128, + "train_loss": 0.15070208614826203, + "train_acc": 0.95202, + "test_loss": 2.989130591583252, + "test_acc": 0.5478, + "lyapunov": null, + "grad_norm": 0.4001034661246295, + "grad_max_sv": 0.1990298792719841, + "grad_min_sv": 7.700730269807106e-09, + "grad_condition": 1087373342.1502237, + "lr": 5.214411988029363e-05, + "time_sec": 32.64661478996277 + }, + { + "epoch": 129, + "train_loss": 0.1532275314569473, + "train_acc": 0.95156, + "test_loss": 3.076161633300781, + "test_acc": 0.5428, + "lyapunov": null, + "grad_norm": 0.39710317166706477, + "grad_max_sv": 0.2050964504480362, + "grad_min_sv": 7.753612097250589e-09, + "grad_condition": 177848968.01384813, + "lr": 4.7586473766990294e-05, + "time_sec": 32.619911193847656 + }, + { + "epoch": 130, + "train_loss": 0.14840273664474488, + "train_acc": 0.95386, + "test_loss": 3.0291847702026367, + "test_acc": 0.5514, + "lyapunov": null, + "grad_norm": 0.3943339950090642, + "grad_max_sv": 0.20189184583723546, + "grad_min_sv": 7.418064280288045e-09, + "grad_condition": 225551543.43719563, + "lr": 4.32272711786996e-05, + "time_sec": 32.61198544502258 + }, + { + "epoch": 131, + "train_loss": 0.1431949885225296, + "train_acc": 0.95528, + "test_loss": 3.027348929977417, + "test_acc": 0.5507, + "lyapunov": null, + "grad_norm": 0.38711994826678314, + "grad_max_sv": 0.19673722572624683, + "grad_min_sv": 7.518409088564434e-09, + "grad_condition": 1146835061.4670472, + "lr": 3.906842420574966e-05, + "time_sec": 32.61335587501526 + }, + { + "epoch": 132, + "train_loss": 0.1487313818216324, + "train_acc": 0.95322, + "test_loss": 3.0886004333496095, + "test_acc": 0.5461, + "lyapunov": null, + "grad_norm": 0.395507713545241, + "grad_max_sv": 0.20544077269732952, + "grad_min_sv": 7.573043920433565e-09, + "grad_condition": 168877391.5952191, + "lr": 3.5111757055874305e-05, + "time_sec": 32.5999391078949 + }, + { + "epoch": 133, + "train_loss": 0.14615771746635436, + "train_acc": 0.95264, + "test_loss": 3.000204067611694, + "test_acc": 0.5534, + "lyapunov": null, + "grad_norm": 0.3932909447553781, + "grad_max_sv": 0.18928411398082973, + "grad_min_sv": 7.371471794906034e-09, + "grad_condition": 362753839.3369804, + "lr": 3.1359005254054254e-05, + "time_sec": 32.6199426651001 + }, + { + "epoch": 134, + "train_loss": 0.14433889319181442, + "train_acc": 0.95458, + "test_loss": 3.007744090270996, + "test_acc": 0.5535, + "lyapunov": null, + "grad_norm": 0.38729299837720393, + "grad_max_sv": 0.1966633189469576, + "grad_min_sv": 7.389140074115508e-09, + "grad_condition": 474683811.0722334, + "lr": 2.7811814881259484e-05, + "time_sec": 32.66906452178955 + }, + { + "epoch": 135, + "train_loss": 0.14040502546787262, + "train_acc": 0.95526, + "test_loss": 2.9782509716033934, + "test_acc": 0.5519, + "lyapunov": null, + "grad_norm": 0.3837181152764762, + "grad_max_sv": 0.19970894865691663, + "grad_min_sv": 7.428829410741772e-09, + "grad_condition": 568455087.6695989, + "lr": 2.4471741852423218e-05, + "time_sec": 32.612287521362305 + }, + { + "epoch": 136, + "train_loss": 0.14493111051797866, + "train_acc": 0.95468, + "test_loss": 3.0520059284210204, + "test_acc": 0.5481, + "lyapunov": null, + "grad_norm": 0.39055918813288093, + "grad_max_sv": 0.20612289309501647, + "grad_min_sv": 7.689209627608634e-09, + "grad_condition": 670288720.96072, + "lr": 2.1340251233966362e-05, + "time_sec": 32.61230111122131 + }, + { + "epoch": 137, + "train_loss": 0.1412872414493561, + "train_acc": 0.95532, + "test_loss": 2.9926007400512695, + "test_acc": 0.5538, + "lyapunov": null, + "grad_norm": 0.3847438191608403, + "grad_max_sv": 0.1935590598732233, + "grad_min_sv": 7.3988825210688506e-09, + "grad_condition": 818122774.676174, + "lr": 1.8418716601170932e-05, + "time_sec": 32.63673734664917 + }, + { + "epoch": 138, + "train_loss": 0.1368464488697052, + "train_acc": 0.95786, + "test_loss": 3.0026862827301026, + "test_acc": 0.5541, + "lyapunov": null, + "grad_norm": 0.3793276651282968, + "grad_max_sv": 0.2012945655733347, + "grad_min_sv": 7.351351802645234e-09, + "grad_condition": 363599415.4796465, + "lr": 1.570841943568445e-05, + "time_sec": 32.59603404998779 + }, + { + "epoch": 139, + "train_loss": 0.1389853618478775, + "train_acc": 0.95644, + "test_loss": 3.04127444152832, + "test_acc": 0.5497, + "lyapunov": null, + "grad_norm": 0.38369680042825305, + "grad_max_sv": 0.1901318434625864, + "grad_min_sv": 7.190909153147098e-09, + "grad_condition": 1063192542.6047398, + "lr": 1.3210548563419845e-05, + "time_sec": 32.623175382614136 + }, + { + "epoch": 140, + "train_loss": 0.13792312327384948, + "train_acc": 0.95614, + "test_loss": 3.004412171936035, + "test_acc": 0.5534, + "lyapunov": null, + "grad_norm": 0.37904522036307264, + "grad_max_sv": 0.19201667234301567, + "grad_min_sv": 7.376605424202435e-09, + "grad_condition": 1234012097.4190845, + "lr": 1.0926199633097203e-05, + "time_sec": 32.630115270614624 + }, + { + "epoch": 141, + "train_loss": 0.1407741106414795, + "train_acc": 0.95654, + "test_loss": 3.0456832256317137, + "test_acc": 0.5511, + "lyapunov": null, + "grad_norm": 0.38330137862093777, + "grad_max_sv": 0.19592518154531718, + "grad_min_sv": 7.054394128222507e-09, + "grad_condition": 86708521.56413671, + "lr": 8.856374635655688e-06, + "time_sec": 32.61585021018982 + }, + { + "epoch": 142, + "train_loss": 0.1388852431154251, + "train_acc": 0.95632, + "test_loss": 3.063602409744263, + "test_acc": 0.5478, + "lyapunov": null, + "grad_norm": 0.3828568546417417, + "grad_max_sv": 0.1969303483143449, + "grad_min_sv": 7.518555048707278e-09, + "grad_condition": 678890293.0423553, + "lr": 7.001981464747503e-06, + "time_sec": 32.630441427230835 + }, + { + "epoch": 143, + "train_loss": 0.13581469515800476, + "train_acc": 0.9579, + "test_loss": 3.0148553092956543, + "test_acc": 0.5538, + "lyapunov": null, + "grad_norm": 0.37580622771801075, + "grad_max_sv": 0.18920586220920085, + "grad_min_sv": 7.312373946242665e-09, + "grad_condition": 360908520.84421337, + "lr": 5.3638335185058295e-06, + "time_sec": 32.64005398750305 + }, + { + "epoch": 144, + "train_loss": 0.1397603491592407, + "train_acc": 0.9547, + "test_loss": 3.017238700866699, + "test_acc": 0.5514, + "lyapunov": null, + "grad_norm": 0.3851319102923484, + "grad_max_sv": 0.19529533758759499, + "grad_min_sv": 7.18097194788922e-09, + "grad_condition": 274499937.83092636, + "lr": 3.942649342761114e-06, + "time_sec": 32.60517716407776 + }, + { + "epoch": 145, + "train_loss": 0.13670911428451538, + "train_acc": 0.95648, + "test_loss": 3.0282860946655275, + "test_acc": 0.5508, + "lyapunov": null, + "grad_norm": 0.37783913784420287, + "grad_max_sv": 0.19311878457665443, + "grad_min_sv": 7.273629627901489e-09, + "grad_condition": 2161793817.455667, + "lr": 2.7390523158633524e-06, + "time_sec": 32.614171266555786 + }, + { + "epoch": 146, + "train_loss": 0.1391296845769882, + "train_acc": 0.95668, + "test_loss": 3.0094220054626466, + "test_acc": 0.5501, + "lyapunov": null, + "grad_norm": 0.37960085678866656, + "grad_max_sv": 0.18867351226508616, + "grad_min_sv": 7.0429120130072884e-09, + "grad_condition": 483257361.70673215, + "lr": 1.7535703752478133e-06, + "time_sec": 32.59815835952759 + }, + { + "epoch": 147, + "train_loss": 0.13715074803590774, + "train_acc": 0.95716, + "test_loss": 3.018283353805542, + "test_acc": 0.5494, + "lyapunov": null, + "grad_norm": 0.3750663523004214, + "grad_max_sv": 0.19733735918998718, + "grad_min_sv": 7.336720725349341e-09, + "grad_condition": 639022830.9873111, + "lr": 9.866357858642196e-07, + "time_sec": 32.63532900810242 + }, + { + "epoch": 148, + "train_loss": 0.13438899482250213, + "train_acc": 0.95838, + "test_loss": 3.0480747367858885, + "test_acc": 0.5511, + "lyapunov": null, + "grad_norm": 0.374029090307932, + "grad_max_sv": 0.19485083129256964, + "grad_min_sv": 7.2787410602915756e-09, + "grad_condition": 1280998842.4402964, + "lr": 4.38584950570808e-07, + "time_sec": 32.61666941642761 + }, + { + "epoch": 149, + "train_loss": 0.1355752257716656, + "train_acc": 0.95742, + "test_loss": 3.020583014678955, + "test_acc": 0.5479, + "lyapunov": null, + "grad_norm": 0.3742080999065961, + "grad_max_sv": 0.18681482430547475, + "grad_min_sv": 7.387960459213656e-09, + "grad_condition": 886872133.6824732, + "lr": 1.096582625772501e-07, + "time_sec": 32.62542963027954 + }, + { + "epoch": 150, + "train_loss": 0.13964056191444396, + "train_acc": 0.95646, + "test_loss": 3.1249655624389647, + "test_acc": 0.5464, + "lyapunov": null, + "grad_norm": 0.3794352519997707, + "grad_max_sv": 0.2051174059510231, + "grad_min_sv": 7.552300875884155e-09, + "grad_condition": 4688136301.586805, + "lr": 0.0, + "time_sec": 32.61311602592468 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 4.857979267883301, + "train_acc": 0.03128, + "test_loss": 4.8280028671264645, + "test_acc": 0.0162, + "lyapunov": null, + "grad_norm": 5.914070912211268, + "grad_max_sv": 5.325387370586395, + "grad_min_sv": 9.769405192663893e-08, + "grad_condition": 1337497985.1511102, + "lr": 0.0009998903417374227, + "time_sec": 49.62461066246033 + }, + { + "epoch": 2, + "train_loss": 4.336386154098511, + "train_acc": 0.05714, + "test_loss": 4.968493894958496, + "test_acc": 0.0197, + "lyapunov": null, + "grad_norm": 4.4863167388537235, + "grad_max_sv": 3.9469796657562255, + "grad_min_sv": 7.601632206477583e-08, + "grad_condition": 129963899.4749479, + "lr": 0.0009995614150494292, + "time_sec": 49.636900901794434 + }, + { + "epoch": 3, + "train_loss": 4.062883013763428, + "train_acc": 0.08342, + "test_loss": 4.448897337341308, + "test_acc": 0.037, + "lyapunov": null, + "grad_norm": 3.6333047310988777, + "grad_max_sv": 3.0409141004085543, + "grad_min_sv": 6.369543137374478e-08, + "grad_condition": 59962043.95176021, + "lr": 0.0009990133642141358, + "time_sec": 49.63047957420349 + }, + { + "epoch": 4, + "train_loss": 3.8605975818634035, + "train_acc": 0.10722, + "test_loss": 4.516425963592529, + "test_acc": 0.0415, + "lyapunov": null, + "grad_norm": 3.020259734680317, + "grad_max_sv": 2.476314604282379, + "grad_min_sv": 5.230481114892882e-08, + "grad_condition": 51922675.56557977, + "lr": 0.0009982464296247522, + "time_sec": 49.61615824699402 + }, + { + "epoch": 5, + "train_loss": 3.6876567860412597, + "train_acc": 0.13404, + "test_loss": 4.7616854064941405, + "test_acc": 0.0373, + "lyapunov": null, + "grad_norm": 2.454606191256652, + "grad_max_sv": 1.8841783970594406, + "grad_min_sv": 4.2170166864030635e-08, + "grad_condition": 61784571.5567351, + "lr": 0.0009972609476841367, + "time_sec": 49.621190309524536 + }, + { + "epoch": 6, + "train_loss": 3.5600004296875, + "train_acc": 0.15464, + "test_loss": 4.541135731506348, + "test_acc": 0.0565, + "lyapunov": null, + "grad_norm": 2.047081522054368, + "grad_max_sv": 1.4700775474309922, + "grad_min_sv": 3.5812032206372636e-08, + "grad_condition": 47166242.58068286, + "lr": 0.000996057350657239, + "time_sec": 49.63187623023987 + }, + { + "epoch": 7, + "train_loss": 3.453279203033447, + "train_acc": 0.17224, + "test_loss": 4.9032746643066405, + "test_acc": 0.0512, + "lyapunov": null, + "grad_norm": 1.7128403586652834, + "grad_max_sv": 1.1189136162400246, + "grad_min_sv": 3.018336235394159e-08, + "grad_condition": 41920446.3053714, + "lr": 0.000994636166481494, + "time_sec": 49.60520005226135 + }, + { + "epoch": 8, + "train_loss": 3.36041114944458, + "train_acc": 0.1888, + "test_loss": 4.752816521453857, + "test_acc": 0.0648, + "lyapunov": null, + "grad_norm": 1.4850467477612923, + "grad_max_sv": 0.8669481813907624, + "grad_min_sv": 2.6475041869922223e-08, + "grad_condition": 37599938.73602452, + "lr": 0.0009929980185352525, + "time_sec": 49.618135929107666 + }, + { + "epoch": 9, + "train_loss": 3.286079960784912, + "train_acc": 0.20154, + "test_loss": 5.178885292053223, + "test_acc": 0.0623, + "lyapunov": null, + "grad_norm": 1.342261473440063, + "grad_max_sv": 0.7033843606710434, + "grad_min_sv": 2.384479090948577e-08, + "grad_condition": 141440858.58776602, + "lr": 0.0009911436253643444, + "time_sec": 49.62771654129028 + }, + { + "epoch": 10, + "train_loss": 3.2129677861022947, + "train_acc": 0.2144, + "test_loss": 5.0195522842407225, + "test_acc": 0.0622, + "lyapunov": null, + "grad_norm": 1.2503967032062735, + "grad_max_sv": 0.6261777065694332, + "grad_min_sv": 2.239258505704056e-08, + "grad_condition": 118005336.87045276, + "lr": 0.0009890738003669028, + "time_sec": 49.60965371131897 + }, + { + "epoch": 11, + "train_loss": 3.162713228683472, + "train_acc": 0.22544, + "test_loss": 4.962263533020019, + "test_acc": 0.0779, + "lyapunov": null, + "grad_norm": 1.1906728267056432, + "grad_max_sv": 0.5766806580126286, + "grad_min_sv": 2.144448115332098e-08, + "grad_condition": 68570214.69490463, + "lr": 0.00098678945143658, + "time_sec": 49.638447284698486 + }, + { + "epoch": 12, + "train_loss": 3.107430252532959, + "train_acc": 0.23672, + "test_loss": 5.273008836364746, + "test_acc": 0.0622, + "lyapunov": null, + "grad_norm": 1.1141405269120466, + "grad_max_sv": 0.5137097157537938, + "grad_min_sv": 2.047304612853851e-08, + "grad_condition": 58656857.58404706, + "lr": 0.0009842915805643154, + "time_sec": 49.64548635482788 + }, + { + "epoch": 13, + "train_loss": 3.054518303833008, + "train_acc": 0.24298, + "test_loss": 4.751382202148437, + "test_acc": 0.0805, + "lyapunov": null, + "grad_norm": 1.056334374659988, + "grad_max_sv": 0.4537819892168045, + "grad_min_sv": 1.9099582219961332e-08, + "grad_condition": 40473913.58753422, + "lr": 0.000981581283398829, + "time_sec": 49.62596035003662 + }, + { + "epoch": 14, + "train_loss": 3.0128901699066164, + "train_acc": 0.2535, + "test_loss": 5.3179588119506835, + "test_acc": 0.0894, + "lyapunov": null, + "grad_norm": 1.0060720335526403, + "grad_max_sv": 0.4221613615751266, + "grad_min_sv": 1.8469374840623944e-08, + "grad_condition": 27648316.070058893, + "lr": 0.0009786597487660333, + "time_sec": 49.63119626045227 + }, + { + "epoch": 15, + "train_loss": 2.9737020013427733, + "train_acc": 0.26082, + "test_loss": 6.165470205688477, + "test_acc": 0.0593, + "lyapunov": null, + "grad_norm": 0.9787012560859192, + "grad_max_sv": 0.39918764010071756, + "grad_min_sv": 1.789977660815456e-08, + "grad_condition": 32066062.312103875, + "lr": 0.0009755282581475766, + "time_sec": 49.61084794998169 + }, + { + "epoch": 16, + "train_loss": 2.9363278299713134, + "train_acc": 0.2678, + "test_loss": 7.10851273803711, + "test_acc": 0.0421, + "lyapunov": null, + "grad_norm": 0.9372246408127133, + "grad_max_sv": 0.38435717970132827, + "grad_min_sv": 1.733210386878348e-08, + "grad_condition": 24088715.267205216, + "lr": 0.0009721881851187403, + "time_sec": 49.61706733703613 + }, + { + "epoch": 17, + "train_loss": 2.911891692504883, + "train_acc": 0.27176, + "test_loss": 6.38866512298584, + "test_acc": 0.0601, + "lyapunov": null, + "grad_norm": 0.9126706344355823, + "grad_max_sv": 0.3579227849841118, + "grad_min_sv": 1.667584251102694e-08, + "grad_condition": 47679489.14127077, + "lr": 0.0009686409947459456, + "time_sec": 49.62139368057251 + }, + { + "epoch": 18, + "train_loss": 2.8810440801239015, + "train_acc": 0.2804, + "test_loss": 6.160967282104492, + "test_acc": 0.0718, + "lyapunov": null, + "grad_norm": 0.8853626149459919, + "grad_max_sv": 0.36028596982359884, + "grad_min_sv": 1.644115990712125e-08, + "grad_condition": 52172419.08719461, + "lr": 0.0009648882429441254, + "time_sec": 49.61437940597534 + }, + { + "epoch": 19, + "train_loss": 2.845276382827759, + "train_acc": 0.28578, + "test_loss": 5.377824464416504, + "test_acc": 0.0852, + "lyapunov": null, + "grad_norm": 0.859853543351059, + "grad_max_sv": 0.33440142646431925, + "grad_min_sv": 1.5989740054234146e-08, + "grad_condition": 23981566.09987827, + "lr": 0.00096093157579425, + "time_sec": 49.60141611099243 + }, + { + "epoch": 20, + "train_loss": 2.8133937200927734, + "train_acc": 0.29282, + "test_loss": 6.930623114013672, + "test_acc": 0.061, + "lyapunov": null, + "grad_norm": 0.8428428790749917, + "grad_max_sv": 0.3265179105103016, + "grad_min_sv": 1.569473392637466e-08, + "grad_condition": 52730874.60876007, + "lr": 0.0009567727288213001, + "time_sec": 49.62118935585022 + }, + { + "epoch": 21, + "train_loss": 2.792502545776367, + "train_acc": 0.29682, + "test_loss": 7.603221396636963, + "test_acc": 0.0601, + "lyapunov": null, + "grad_norm": 0.8301062641843454, + "grad_max_sv": 0.3209334272891283, + "grad_min_sv": 1.5400497213602372e-08, + "grad_condition": 32858821.905855753, + "lr": 0.0009524135262330095, + "time_sec": 49.61830496788025 + }, + { + "epoch": 22, + "train_loss": 2.763432760696411, + "train_acc": 0.30106, + "test_loss": 7.683717921447754, + "test_acc": 0.0632, + "lyapunov": null, + "grad_norm": 0.8155075807756811, + "grad_max_sv": 0.31464248038828374, + "grad_min_sv": 1.523456016894187e-08, + "grad_condition": 22807354.246203102, + "lr": 0.0009478558801197061, + "time_sec": 49.62720441818237 + }, + { + "epoch": 23, + "train_loss": 2.7460695344543455, + "train_acc": 0.3031, + "test_loss": 5.747795407867431, + "test_acc": 0.0819, + "lyapunov": null, + "grad_norm": 0.7966165231048401, + "grad_max_sv": 0.29990778900682924, + "grad_min_sv": 1.4812020640575519e-08, + "grad_condition": 26907900.924312055, + "lr": 0.000943101789615607, + "time_sec": 49.620564699172974 + }, + { + "epoch": 24, + "train_loss": 2.713617621231079, + "train_acc": 0.31124, + "test_loss": 6.716322633361816, + "test_acc": 0.08, + "lyapunov": null, + "grad_norm": 0.7863969132473815, + "grad_max_sv": 0.3049128696322441, + "grad_min_sv": 1.4714444074304112e-08, + "grad_condition": 23621111.366144888, + "lr": 0.0009381533400219313, + "time_sec": 49.6185462474823 + }, + { + "epoch": 25, + "train_loss": 2.692608075027466, + "train_acc": 0.3135, + "test_loss": 6.315327671813965, + "test_acc": 0.0773, + "lyapunov": null, + "grad_norm": 0.7780809028085155, + "grad_max_sv": 0.28820848651230335, + "grad_min_sv": 1.4556970873158548e-08, + "grad_condition": 22925885.469558023, + "lr": 0.0009330127018922189, + "time_sec": 49.63029909133911 + }, + { + "epoch": 26, + "train_loss": 2.6578130314636232, + "train_acc": 0.32226, + "test_loss": 7.161731970214844, + "test_acc": 0.074, + "lyapunov": null, + "grad_norm": 0.7600241350813963, + "grad_max_sv": 0.27918743565678594, + "grad_min_sv": 1.41998530961418e-08, + "grad_condition": 24836498.868989673, + "lr": 0.000927682130080253, + "time_sec": 49.61888551712036 + }, + { + "epoch": 27, + "train_loss": 2.6360860138702393, + "train_acc": 0.3281, + "test_loss": 6.265446292114258, + "test_acc": 0.072, + "lyapunov": null, + "grad_norm": 0.7503860366874832, + "grad_max_sv": 0.27820607759058474, + "grad_min_sv": 1.403503115116056e-08, + "grad_condition": 43704568.438496746, + "lr": 0.0009221639627510072, + "time_sec": 49.6322455406189 + }, + { + "epoch": 28, + "train_loss": 2.621903458404541, + "train_acc": 0.33094, + "test_loss": 8.008352018737792, + "test_acc": 0.0635, + "lyapunov": null, + "grad_norm": 0.7411508249278186, + "grad_max_sv": 0.276602141186595, + "grad_min_sv": 1.3749510615473914e-08, + "grad_condition": 48846366.407403715, + "lr": 0.0009164606203550494, + "time_sec": 49.62464737892151 + }, + { + "epoch": 29, + "train_loss": 2.6009712726593017, + "train_acc": 0.33356, + "test_loss": 6.3420821472167965, + "test_acc": 0.0871, + "lyapunov": null, + "grad_norm": 0.7392237108014773, + "grad_max_sv": 0.2745568320155144, + "grad_min_sv": 1.3796570551283249e-08, + "grad_condition": 31273171.49927681, + "lr": 0.0009105746045668516, + "time_sec": 49.654367446899414 + }, + { + "epoch": 30, + "train_loss": 2.5890472722625733, + "train_acc": 0.33498, + "test_loss": 6.483042420959473, + "test_acc": 0.0746, + "lyapunov": null, + "grad_norm": 0.7254213710143503, + "grad_max_sv": 0.2663456965237856, + "grad_min_sv": 1.3537345176783955e-08, + "grad_condition": 33323808.90351194, + "lr": 0.0009045084971874733, + "time_sec": 49.62457275390625 + }, + { + "epoch": 31, + "train_loss": 2.5546424687194826, + "train_acc": 0.3411, + "test_loss": 5.880196138000488, + "test_acc": 0.0666, + "lyapunov": null, + "grad_norm": 0.7170650074645288, + "grad_max_sv": 0.2706871546804905, + "grad_min_sv": 1.3557976122346993e-08, + "grad_condition": 55625831.471463725, + "lr": 0.0008982649590120977, + "time_sec": 49.625417709350586 + }, + { + "epoch": 32, + "train_loss": 2.5356599130249022, + "train_acc": 0.3476, + "test_loss": 6.206172892761231, + "test_acc": 0.0935, + "lyapunov": null, + "grad_norm": 0.7148263297514528, + "grad_max_sv": 0.2631382804363966, + "grad_min_sv": 1.335368298993611e-08, + "grad_condition": 27919253.234171998, + "lr": 0.0008918467286629196, + "time_sec": 49.64267349243164 + }, + { + "epoch": 33, + "train_loss": 2.520495999908447, + "train_acc": 0.34764, + "test_loss": 6.414087007141113, + "test_acc": 0.0819, + "lyapunov": null, + "grad_norm": 0.7096693517368512, + "grad_max_sv": 0.2555254019796848, + "grad_min_sv": 1.326168482251866e-08, + "grad_condition": 30057889.81326326, + "lr": 0.0008852566213878943, + "time_sec": 49.633198976516724 + }, + { + "epoch": 34, + "train_loss": 2.4981268305206297, + "train_acc": 0.35368, + "test_loss": 7.161307034301758, + "test_acc": 0.0753, + "lyapunov": null, + "grad_norm": 0.6981273416861422, + "grad_max_sv": 0.25148845836520195, + "grad_min_sv": 1.3116743149965693e-08, + "grad_condition": 25097258.440184355, + "lr": 0.000878497527825878, + "time_sec": 49.629374980926514 + }, + { + "epoch": 35, + "train_loss": 2.4812187934875487, + "train_acc": 0.35656, + "test_loss": 6.375511972045898, + "test_acc": 0.0787, + "lyapunov": null, + "grad_norm": 0.693256631694674, + "grad_max_sv": 0.24989120960235595, + "grad_min_sv": 1.3051334765701306e-08, + "grad_condition": 22699406.58897232, + "lr": 0.000871572412738697, + "time_sec": 49.620848655700684 + }, + { + "epoch": 36, + "train_loss": 2.4649569733428955, + "train_acc": 0.3595, + "test_loss": 5.7549407691955565, + "test_acc": 0.1002, + "lyapunov": null, + "grad_norm": 0.6880223056040339, + "grad_max_sv": 0.2544675827026367, + "grad_min_sv": 1.2971388471672008e-08, + "grad_condition": 27090819.46416967, + "lr": 0.0008644843137107055, + "time_sec": 49.639307498931885 + }, + { + "epoch": 37, + "train_loss": 2.4404139349365233, + "train_acc": 0.36276, + "test_loss": 6.19379566192627, + "test_acc": 0.0843, + "lyapunov": null, + "grad_norm": 0.6915322266205055, + "grad_max_sv": 0.25557893700897694, + "grad_min_sv": 1.3099128221005785e-08, + "grad_condition": 22396412.415633548, + "lr": 0.0008572363398164014, + "time_sec": 49.65658497810364 + }, + { + "epoch": 38, + "train_loss": 2.4350104721832277, + "train_acc": 0.36944, + "test_loss": 6.483997691345214, + "test_acc": 0.0947, + "lyapunov": null, + "grad_norm": 0.6860817508888643, + "grad_max_sv": 0.24186794832348824, + "grad_min_sv": 1.2734190080188058e-08, + "grad_condition": 24245161.640245236, + "lr": 0.0008498316702566826, + "time_sec": 49.636590003967285 + }, + { + "epoch": 39, + "train_loss": 2.4035986038970947, + "train_acc": 0.37506, + "test_loss": 7.426128985595703, + "test_acc": 0.0633, + "lyapunov": null, + "grad_norm": 0.6768284631491337, + "grad_max_sv": 0.23978918939828872, + "grad_min_sv": 1.2544681339196617e-08, + "grad_condition": 58875883.49556484, + "lr": 0.0008422735529643442, + "time_sec": 49.6271595954895 + }, + { + "epoch": 40, + "train_loss": 2.396695173187256, + "train_acc": 0.37446, + "test_loss": 6.887982989501953, + "test_acc": 0.0659, + "lyapunov": null, + "grad_norm": 0.6758452994499082, + "grad_max_sv": 0.23218532651662827, + "grad_min_sv": 1.2284334864609559e-08, + "grad_condition": 27825244.741001748, + "lr": 0.0008345653031794289, + "time_sec": 49.6188850402832 + }, + { + "epoch": 41, + "train_loss": 2.3766202754211427, + "train_acc": 0.38084, + "test_loss": 7.051847720336914, + "test_acc": 0.061, + "lyapunov": null, + "grad_norm": 0.6727252530320494, + "grad_max_sv": 0.2428621307015419, + "grad_min_sv": 1.2773543862920622e-08, + "grad_condition": 27042190.577230137, + "lr": 0.0008267103019950526, + "time_sec": 49.63360857963562 + }, + { + "epoch": 42, + "train_loss": 2.3670169010925295, + "train_acc": 0.38192, + "test_loss": 6.82649090423584, + "test_acc": 0.0753, + "lyapunov": null, + "grad_norm": 0.6702600637325808, + "grad_max_sv": 0.23488462790846826, + "grad_min_sv": 1.2701740556564367e-08, + "grad_condition": 22978134.483096853, + "lr": 0.0008187119948743447, + "time_sec": 49.626428842544556 + }, + { + "epoch": 43, + "train_loss": 2.34640893951416, + "train_acc": 0.38418, + "test_loss": 7.456131955718994, + "test_acc": 0.0764, + "lyapunov": null, + "grad_norm": 0.6673821071425099, + "grad_max_sv": 0.2304955620318651, + "grad_min_sv": 1.2439765384453239e-08, + "grad_condition": 31820388.99010671, + "lr": 0.000810573890139155, + "time_sec": 49.62021851539612 + }, + { + "epoch": 44, + "train_loss": 2.3332527070617677, + "train_acc": 0.38834, + "test_loss": 6.233900453186036, + "test_acc": 0.0882, + "lyapunov": null, + "grad_norm": 0.6619434612787911, + "grad_max_sv": 0.23275020457804202, + "grad_min_sv": 1.2357255231576491e-08, + "grad_condition": 41092001.19472371, + "lr": 0.0008022995574311873, + "time_sec": 49.632553815841675 + }, + { + "epoch": 45, + "train_loss": 2.319253850402832, + "train_acc": 0.3902, + "test_loss": 7.539175698852539, + "test_acc": 0.0652, + "lyapunov": null, + "grad_norm": 0.6606380867238602, + "grad_max_sv": 0.2288034502416849, + "grad_min_sv": 1.234043749409608e-08, + "grad_condition": 23995474.740780547, + "lr": 0.0007938926261462363, + "time_sec": 49.638259410858154 + }, + { + "epoch": 46, + "train_loss": 2.308006600112915, + "train_acc": 0.39154, + "test_loss": 7.362489430999756, + "test_acc": 0.0558, + "lyapunov": null, + "grad_norm": 0.660045345704197, + "grad_max_sv": 0.2337587408721447, + "grad_min_sv": 1.2529785493875512e-08, + "grad_condition": 24243355.610875387, + "lr": 0.0007853567838422158, + "time_sec": 49.64337158203125 + }, + { + "epoch": 47, + "train_loss": 2.287512142944336, + "train_acc": 0.39698, + "test_loss": 7.659019016265869, + "test_acc": 0.0729, + "lyapunov": null, + "grad_norm": 0.6552491008893353, + "grad_max_sv": 0.2252129375934601, + "grad_min_sv": 1.2101228903660389e-08, + "grad_condition": 37944286.39668895, + "lr": 0.0007766957746216719, + "time_sec": 49.610002756118774 + }, + { + "epoch": 48, + "train_loss": 2.2750962590026855, + "train_acc": 0.39712, + "test_loss": 6.906008920288086, + "test_acc": 0.085, + "lyapunov": null, + "grad_norm": 0.6572787443040576, + "grad_max_sv": 0.23201882764697074, + "grad_min_sv": 1.233105519499178e-08, + "grad_condition": 27571588.322845332, + "lr": 0.0007679133974894982, + "time_sec": 49.65186142921448 + }, + { + "epoch": 49, + "train_loss": 2.2525532193756104, + "train_acc": 0.40456, + "test_loss": 7.617325218963623, + "test_acc": 0.074, + "lyapunov": null, + "grad_norm": 0.6492386918943517, + "grad_max_sv": 0.2307146478444338, + "grad_min_sv": 1.229703296403914e-08, + "grad_condition": 211540506.258676, + "lr": 0.000759013504686565, + "time_sec": 49.6446647644043 + }, + { + "epoch": 50, + "train_loss": 2.237634787826538, + "train_acc": 0.40684, + "test_loss": 6.678198162841797, + "test_acc": 0.0633, + "lyapunov": null, + "grad_norm": 0.6565102133805185, + "grad_max_sv": 0.2293539997190237, + "grad_min_sv": 1.2340318197856526e-08, + "grad_condition": 27740724.758145083, + "lr": 0.0007499999999999998, + "time_sec": 49.653481006622314 + }, + { + "epoch": 51, + "train_loss": 2.209577166748047, + "train_acc": 0.40976, + "test_loss": 6.840425001525879, + "test_acc": 0.0718, + "lyapunov": null, + "grad_norm": 0.6547461235382159, + "grad_max_sv": 0.22949806824326516, + "grad_min_sv": 1.2320622985728668e-08, + "grad_condition": 23307963.55905198, + "lr": 0.0007408768370508575, + "time_sec": 49.61805582046509 + }, + { + "epoch": 52, + "train_loss": 2.200788235549927, + "train_acc": 0.41432, + "test_loss": 7.2077490463256835, + "test_acc": 0.0756, + "lyapunov": null, + "grad_norm": 0.6510213685672233, + "grad_max_sv": 0.23402363583445548, + "grad_min_sv": 1.2258231881986937e-08, + "grad_condition": 75476519.13664213, + "lr": 0.0007316480175599307, + "time_sec": 49.646629095077515 + }, + { + "epoch": 53, + "train_loss": 2.184033504333496, + "train_acc": 0.41906, + "test_loss": 6.790815046691894, + "test_acc": 0.0761, + "lyapunov": null, + "grad_norm": 0.6498948423513097, + "grad_max_sv": 0.2297774288803339, + "grad_min_sv": 1.2289613515736875e-08, + "grad_condition": 25175002.986691862, + "lr": 0.0007223175895924635, + "time_sec": 49.616777181625366 + }, + { + "epoch": 54, + "train_loss": 2.1751246100616455, + "train_acc": 0.4209, + "test_loss": 7.843894770812988, + "test_acc": 0.0728, + "lyapunov": null, + "grad_norm": 0.6502026955560598, + "grad_max_sv": 0.22432956397533416, + "grad_min_sv": 1.2058743079079725e-08, + "grad_condition": 27210725.454316296, + "lr": 0.0007128896457825361, + "time_sec": 49.63462972640991 + }, + { + "epoch": 55, + "train_loss": 2.1508761085510253, + "train_acc": 0.42416, + "test_loss": 7.085880072784424, + "test_acc": 0.0952, + "lyapunov": null, + "grad_norm": 0.6487356152863625, + "grad_max_sv": 0.22850245125591756, + "grad_min_sv": 1.2312155951710312e-08, + "grad_condition": 41183718.923533805, + "lr": 0.0007033683215378998, + "time_sec": 49.64608693122864 + }, + { + "epoch": 56, + "train_loss": 2.141602848587036, + "train_acc": 0.42634, + "test_loss": 6.250551121520996, + "test_acc": 0.0971, + "lyapunov": null, + "grad_norm": 0.6410808562446506, + "grad_max_sv": 0.2151340998709202, + "grad_min_sv": 1.176430176191845e-08, + "grad_condition": 30604181.986327033, + "lr": 0.0006937577932260512, + "time_sec": 49.70740008354187 + }, + { + "epoch": 57, + "train_loss": 2.14431159286499, + "train_acc": 0.42548, + "test_loss": 6.846168923950195, + "test_acc": 0.0958, + "lyapunov": null, + "grad_norm": 0.6444720385859491, + "grad_max_sv": 0.2224727988243103, + "grad_min_sv": 1.2025717233132837e-08, + "grad_condition": 23924517.448539954, + "lr": 0.0006840622763423388, + "time_sec": 49.63225722312927 + }, + { + "epoch": 58, + "train_loss": 2.10916792388916, + "train_acc": 0.43432, + "test_loss": 6.8249847625732425, + "test_acc": 0.1066, + "lyapunov": null, + "grad_norm": 0.6502634467633226, + "grad_max_sv": 0.22863934263587, + "grad_min_sv": 1.218627998234023e-08, + "grad_condition": 28771962.702913057, + "lr": 0.0006742860236609073, + "time_sec": 49.63661074638367 + }, + { + "epoch": 59, + "train_loss": 2.100633440322876, + "train_acc": 0.43724, + "test_loss": 7.080769053649902, + "test_acc": 0.097, + "lyapunov": null, + "grad_norm": 0.6514345540301675, + "grad_max_sv": 0.23131897561252118, + "grad_min_sv": 1.2473222341102818e-08, + "grad_condition": 23428156.69088362, + "lr": 0.0006644333233692913, + "time_sec": 49.631585359573364 + }, + { + "epoch": 60, + "train_loss": 2.0753550579452513, + "train_acc": 0.44222, + "test_loss": 7.097881182861328, + "test_acc": 0.0782, + "lyapunov": null, + "grad_norm": 0.642048459758103, + "grad_max_sv": 0.21754480227828027, + "grad_min_sv": 1.2038245155582273e-08, + "grad_condition": 35173118.59205349, + "lr": 0.0006545084971874734, + "time_sec": 49.642804861068726 + }, + { + "epoch": 61, + "train_loss": 2.060260758514404, + "train_acc": 0.4465, + "test_loss": 6.766320790863037, + "test_acc": 0.0839, + "lyapunov": null, + "grad_norm": 0.6459643627424662, + "grad_max_sv": 0.223102143406868, + "grad_min_sv": 1.22261165164117e-08, + "grad_condition": 22073921.720915027, + "lr": 0.0006445158984722354, + "time_sec": 49.64657950401306 + }, + { + "epoch": 62, + "train_loss": 2.0472131072998048, + "train_acc": 0.4486, + "test_loss": 6.881848452758789, + "test_acc": 0.0976, + "lyapunov": null, + "grad_norm": 0.6461433133831308, + "grad_max_sv": 0.22962211742997168, + "grad_min_sv": 1.2113809159074174e-08, + "grad_condition": 324038818.4677658, + "lr": 0.0006344599103076324, + "time_sec": 49.627341747283936 + }, + { + "epoch": 63, + "train_loss": 2.035955301361084, + "train_acc": 0.44882, + "test_loss": 7.18960142211914, + "test_acc": 0.0878, + "lyapunov": null, + "grad_norm": 0.6422783690964438, + "grad_max_sv": 0.2209172960370779, + "grad_min_sv": 1.2127595816480152e-08, + "grad_condition": 21910433.389134284, + "lr": 0.0006243449435824269, + "time_sec": 49.64501976966858 + }, + { + "epoch": 64, + "train_loss": 2.036686828079224, + "train_acc": 0.45056, + "test_loss": 7.650535336303711, + "test_acc": 0.0924, + "lyapunov": null, + "grad_norm": 0.641718667248247, + "grad_max_sv": 0.22157798074185847, + "grad_min_sv": 1.1966991517176062e-08, + "grad_condition": 25321432.686805125, + "lr": 0.0006141754350553275, + "time_sec": 49.63518667221069 + }, + { + "epoch": 65, + "train_loss": 2.0039944877624514, + "train_acc": 0.45574, + "test_loss": 7.262261317443848, + "test_acc": 0.114, + "lyapunov": null, + "grad_norm": 0.6509729656164255, + "grad_max_sv": 0.2328164666891098, + "grad_min_sv": 1.2227686406116046e-08, + "grad_condition": 78588688.09864715, + "lr": 0.0006039558454088793, + "time_sec": 49.62892246246338 + }, + { + "epoch": 66, + "train_loss": 1.9934623148345947, + "train_acc": 0.4604, + "test_loss": 6.735845774841309, + "test_acc": 0.0988, + "lyapunov": null, + "grad_norm": 0.6428090636861153, + "grad_max_sv": 0.22018610946834088, + "grad_min_sv": 1.2050285417425366e-08, + "grad_condition": 33987345.003156364, + "lr": 0.000593690657292862, + "time_sec": 49.634801626205444 + }, + { + "epoch": 67, + "train_loss": 1.968681404800415, + "train_acc": 0.46364, + "test_loss": 7.602304705810547, + "test_acc": 0.0987, + "lyapunov": null, + "grad_norm": 0.6457740641454927, + "grad_max_sv": 0.2279145259410143, + "grad_min_sv": 1.2256968678903136e-08, + "grad_condition": 23591230.853540566, + "lr": 0.0005833843733580507, + "time_sec": 49.640379190444946 + }, + { + "epoch": 68, + "train_loss": 1.9723771545791626, + "train_acc": 0.46456, + "test_loss": 7.501553115844726, + "test_acc": 0.0743, + "lyapunov": null, + "grad_norm": 0.6345718818470338, + "grad_max_sv": 0.21636971682310105, + "grad_min_sv": 1.1871784413863828e-08, + "grad_condition": 21468624.440050583, + "lr": 0.0005730415142812054, + "time_sec": 49.618358850479126 + }, + { + "epoch": 69, + "train_loss": 1.950169172744751, + "train_acc": 0.46892, + "test_loss": 7.0990902679443355, + "test_acc": 0.0888, + "lyapunov": null, + "grad_norm": 0.6406229801466465, + "grad_max_sv": 0.2206659872084856, + "grad_min_sv": 1.1992476682196051e-08, + "grad_condition": 56593916.45522114, + "lr": 0.0005626666167821517, + "time_sec": 49.63790965080261 + }, + { + "epoch": 70, + "train_loss": 1.939907547531128, + "train_acc": 0.4716, + "test_loss": 7.282066575622559, + "test_acc": 0.0983, + "lyapunov": null, + "grad_norm": 0.6459981596212524, + "grad_max_sv": 0.23004377372562884, + "grad_min_sv": 1.2037511798457245e-08, + "grad_condition": 28235857.849722397, + "lr": 0.0005522642316338265, + "time_sec": 49.62828755378723 + }, + { + "epoch": 71, + "train_loss": 1.929073366470337, + "train_acc": 0.47462, + "test_loss": 6.812109463500977, + "test_acc": 0.1063, + "lyapunov": null, + "grad_norm": 0.6476540219610287, + "grad_max_sv": 0.22166885659098626, + "grad_min_sv": 1.2136537663048897e-08, + "grad_condition": 51677369.32839097, + "lr": 0.0005418389216661573, + "time_sec": 49.61943817138672 + }, + { + "epoch": 72, + "train_loss": 1.919623097305298, + "train_acc": 0.47576, + "test_loss": 6.68877933883667, + "test_acc": 0.0798, + "lyapunov": null, + "grad_norm": 0.638990192022336, + "grad_max_sv": 0.2177750900387764, + "grad_min_sv": 1.1837285757154703e-08, + "grad_condition": 30448032.105450857, + "lr": 0.0005313952597646563, + "time_sec": 49.63543653488159 + }, + { + "epoch": 73, + "train_loss": 1.8911805786514282, + "train_acc": 0.4813, + "test_loss": 7.259025004577636, + "test_acc": 0.1017, + "lyapunov": null, + "grad_norm": 0.6388927531170105, + "grad_max_sv": 0.2268439143896103, + "grad_min_sv": 1.2116396552741548e-08, + "grad_condition": 25828769.58088143, + "lr": 0.0005209378268645994, + "time_sec": 49.63246250152588 + }, + { + "epoch": 74, + "train_loss": 1.87730663772583, + "train_acc": 0.4856, + "test_loss": 6.621179290771485, + "test_acc": 0.1118, + "lyapunov": null, + "grad_norm": 0.6382424632105009, + "grad_max_sv": 0.22017028257250787, + "grad_min_sv": 1.1917627623647676e-08, + "grad_condition": 36459230.544282585, + "lr": 0.0005104712099416781, + "time_sec": 49.63705110549927 + }, + { + "epoch": 75, + "train_loss": 1.8676763352966308, + "train_acc": 0.4867, + "test_loss": 6.639352639770507, + "test_acc": 0.1035, + "lyapunov": null, + "grad_norm": 0.6471776484855016, + "grad_max_sv": 0.22313491702079774, + "grad_min_sv": 1.2076539387256834e-08, + "grad_condition": 168096640.34612545, + "lr": 0.0004999999999999996, + "time_sec": 49.62802839279175 + }, + { + "epoch": 76, + "train_loss": 1.8601240715026854, + "train_acc": 0.48752, + "test_loss": 7.69632975769043, + "test_acc": 0.093, + "lyapunov": null, + "grad_norm": 0.6373532537157988, + "grad_max_sv": 0.21818222440779209, + "grad_min_sv": 1.1897569247160123e-08, + "grad_condition": 49575276.624648556, + "lr": 0.0004895287900583212, + "time_sec": 49.61473488807678 + }, + { + "epoch": 77, + "train_loss": 1.844694657020569, + "train_acc": 0.49, + "test_loss": 7.673219400024414, + "test_acc": 0.0971, + "lyapunov": null, + "grad_norm": 0.6357429485708425, + "grad_max_sv": 0.21753050275146962, + "grad_min_sv": 1.1727277435258366e-08, + "grad_condition": 25108982.07055033, + "lr": 0.0004790621731353997, + "time_sec": 49.61942458152771 + }, + { + "epoch": 78, + "train_loss": 1.8382536688232423, + "train_acc": 0.49426, + "test_loss": 8.053473236083985, + "test_acc": 0.0877, + "lyapunov": null, + "grad_norm": 0.6413732546621618, + "grad_max_sv": 0.22126910798251628, + "grad_min_sv": 1.217776433408424e-08, + "grad_condition": 50630196.79387429, + "lr": 0.000468604740235343, + "time_sec": 49.620675802230835 + }, + { + "epoch": 79, + "train_loss": 1.8119768780899048, + "train_acc": 0.50004, + "test_loss": 7.10159133605957, + "test_acc": 0.103, + "lyapunov": null, + "grad_norm": 0.64075038803741, + "grad_max_sv": 0.22004345506429673, + "grad_min_sv": 1.179401228554311e-08, + "grad_condition": 39644724.18434289, + "lr": 0.00045816107833384175, + "time_sec": 49.65424633026123 + }, + { + "epoch": 80, + "train_loss": 1.805297444114685, + "train_acc": 0.50122, + "test_loss": 7.127357855224609, + "test_acc": 0.1076, + "lyapunov": null, + "grad_norm": 0.6452326753546996, + "grad_max_sv": 0.2212912131100893, + "grad_min_sv": 1.2059882024961777e-08, + "grad_condition": 29968320.229064513, + "lr": 0.0004477357683661729, + "time_sec": 49.62116003036499 + }, + { + "epoch": 81, + "train_loss": 1.792769065246582, + "train_acc": 0.50348, + "test_loss": 7.439458018493652, + "test_acc": 0.0985, + "lyapunov": null, + "grad_norm": 0.6408257507786687, + "grad_max_sv": 0.22126449905335904, + "grad_min_sv": 1.1952658901526191e-08, + "grad_condition": 23156470.62447612, + "lr": 0.00043733338321784746, + "time_sec": 49.64424705505371 + }, + { + "epoch": 82, + "train_loss": 1.770621812400818, + "train_acc": 0.51052, + "test_loss": 7.155345419311524, + "test_acc": 0.1127, + "lyapunov": null, + "grad_norm": 0.6446017522348026, + "grad_max_sv": 0.22318419590592384, + "grad_min_sv": 1.1969205995082665e-08, + "grad_condition": 88594611.75801164, + "lr": 0.0004269584857187939, + "time_sec": 49.622429847717285 + }, + { + "epoch": 83, + "train_loss": 1.769109418029785, + "train_acc": 0.50846, + "test_loss": 7.010694668579101, + "test_acc": 0.1057, + "lyapunov": null, + "grad_norm": 0.6502891030839932, + "grad_max_sv": 0.2263760395348072, + "grad_min_sv": 1.2018579030603772e-08, + "grad_condition": 29299643.5314746, + "lr": 0.0004166156266419484, + "time_sec": 49.614967584609985 + }, + { + "epoch": 84, + "train_loss": 1.7552229693222046, + "train_acc": 0.51318, + "test_loss": 7.019638833618164, + "test_acc": 0.1006, + "lyapunov": null, + "grad_norm": 0.6441122145546607, + "grad_max_sv": 0.21587914675474168, + "grad_min_sv": 1.1914460645509606e-08, + "grad_condition": 54331112.96990696, + "lr": 0.0004063093427071373, + "time_sec": 49.63624048233032 + }, + { + "epoch": 85, + "train_loss": 1.7453889175796509, + "train_acc": 0.5142, + "test_loss": 6.935272999572754, + "test_acc": 0.0772, + "lyapunov": null, + "grad_norm": 0.6354119534548792, + "grad_max_sv": 0.22349480539560318, + "grad_min_sv": 1.188125494724912e-08, + "grad_condition": 54450146.559093714, + "lr": 0.0003960441545911199, + "time_sec": 49.63727903366089 + }, + { + "epoch": 86, + "train_loss": 1.7361508292388916, + "train_acc": 0.51694, + "test_loss": 6.903331332397461, + "test_acc": 0.0874, + "lyapunov": null, + "grad_norm": 0.6433396686482765, + "grad_max_sv": 0.2229986496269703, + "grad_min_sv": 1.2302347957016124e-08, + "grad_condition": 20829684.95092944, + "lr": 0.0003858245649446718, + "time_sec": 49.620397329330444 + }, + { + "epoch": 87, + "train_loss": 1.7140229907989502, + "train_acc": 0.52362, + "test_loss": 6.144080555725098, + "test_acc": 0.0973, + "lyapunov": null, + "grad_norm": 0.6397281329733326, + "grad_max_sv": 0.2236575834453106, + "grad_min_sv": 1.2130321444536741e-08, + "grad_condition": 24582093.327500105, + "lr": 0.00037565505641757235, + "time_sec": 49.63749957084656 + }, + { + "epoch": 88, + "train_loss": 1.698942677230835, + "train_acc": 0.52702, + "test_loss": 6.329557989501953, + "test_acc": 0.1043, + "lyapunov": null, + "grad_norm": 0.6429735672215783, + "grad_max_sv": 0.22443199381232262, + "grad_min_sv": 1.2242971281217762e-08, + "grad_condition": 21997184.984676402, + "lr": 0.00036554008969236695, + "time_sec": 49.64341187477112 + }, + { + "epoch": 89, + "train_loss": 1.6915926089859008, + "train_acc": 0.52672, + "test_loss": 6.97091061706543, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 0.6396443107842517, + "grad_max_sv": 0.21398231349885463, + "grad_min_sv": 1.1860397219898289e-08, + "grad_condition": 25819116.390227333, + "lr": 0.0003554841015277638, + "time_sec": 49.61740279197693 + }, + { + "epoch": 90, + "train_loss": 1.6705048236846924, + "train_acc": 0.53226, + "test_loss": 6.474410656738281, + "test_acc": 0.1104, + "lyapunov": null, + "grad_norm": 0.6447874278631877, + "grad_max_sv": 0.22352466247975827, + "grad_min_sv": 1.1839073051078675e-08, + "grad_condition": 194632597.18194634, + "lr": 0.000345491502812526, + "time_sec": 49.63944673538208 + }, + { + "epoch": 91, + "train_loss": 1.6604324224090576, + "train_acc": 0.53478, + "test_loss": 7.210493100738526, + "test_acc": 0.1186, + "lyapunov": null, + "grad_norm": 0.6483901695782636, + "grad_max_sv": 0.23147397823631763, + "grad_min_sv": 1.2240159032281435e-08, + "grad_condition": 833122995.4080375, + "lr": 0.0003355666766307081, + "time_sec": 49.65723490715027 + }, + { + "epoch": 92, + "train_loss": 1.655436181564331, + "train_acc": 0.53562, + "test_loss": 6.41819879989624, + "test_acc": 0.1099, + "lyapunov": null, + "grad_norm": 0.6422800867205569, + "grad_max_sv": 0.22188753299415112, + "grad_min_sv": 1.1910704758588687e-08, + "grad_condition": 31454971.248209517, + "lr": 0.00032571397633909225, + "time_sec": 49.62359666824341 + }, + { + "epoch": 93, + "train_loss": 1.6418727423477173, + "train_acc": 0.53886, + "test_loss": 6.5647822364807125, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 0.6425002000385331, + "grad_max_sv": 0.22996555864810944, + "grad_min_sv": 1.214085261491693e-08, + "grad_condition": 23136414.278494585, + "lr": 0.00031593772365766094, + "time_sec": 49.648432970047 + }, + { + "epoch": 94, + "train_loss": 1.6380917670822144, + "train_acc": 0.54016, + "test_loss": 6.60304995880127, + "test_acc": 0.1013, + "lyapunov": null, + "grad_norm": 0.6435715746993702, + "grad_max_sv": 0.22394425868988038, + "grad_min_sv": 1.1969105850884176e-08, + "grad_condition": 22813937.74993243, + "lr": 0.0003062422067739483, + "time_sec": 49.62917709350586 + }, + { + "epoch": 95, + "train_loss": 1.6159375607681274, + "train_acc": 0.54468, + "test_loss": 7.4295039352417, + "test_acc": 0.1043, + "lyapunov": null, + "grad_norm": 0.6459265748151144, + "grad_max_sv": 0.2222417715936899, + "grad_min_sv": 1.2084532810541226e-08, + "grad_condition": 23228929.65699155, + "lr": 0.00029663167846209965, + "time_sec": 49.633803606033325 + }, + { + "epoch": 96, + "train_loss": 1.6130770600128175, + "train_acc": 0.54918, + "test_loss": 7.755695833587646, + "test_acc": 0.103, + "lyapunov": null, + "grad_norm": 0.6373845581356181, + "grad_max_sv": 0.2166528631001711, + "grad_min_sv": 1.1723080543812881e-08, + "grad_condition": 61573060.408652686, + "lr": 0.00028711035421746345, + "time_sec": 49.63398790359497 + }, + { + "epoch": 97, + "train_loss": 1.5942238623046876, + "train_acc": 0.55338, + "test_loss": 7.366734781646729, + "test_acc": 0.0942, + "lyapunov": null, + "grad_norm": 0.645954709653033, + "grad_max_sv": 0.23344604782760142, + "grad_min_sv": 1.211216281021832e-08, + "grad_condition": 28920253.40686954, + "lr": 0.00027768241040753615, + "time_sec": 49.63687562942505 + }, + { + "epoch": 98, + "train_loss": 1.5829193838119506, + "train_acc": 0.55468, + "test_loss": 7.60546820526123, + "test_acc": 0.0996, + "lyapunov": null, + "grad_norm": 0.6414940955031293, + "grad_max_sv": 0.22326541543006898, + "grad_min_sv": 1.18154431003048e-08, + "grad_condition": 27850671.690087616, + "lr": 0.00026835198244006903, + "time_sec": 49.60518288612366 + }, + { + "epoch": 99, + "train_loss": 1.5702915887451172, + "train_acc": 0.55388, + "test_loss": 7.25171710357666, + "test_acc": 0.0857, + "lyapunov": null, + "grad_norm": 0.6448707164382114, + "grad_max_sv": 0.22703963220119477, + "grad_min_sv": 1.2078747084476315e-08, + "grad_condition": 30695848.89590156, + "lr": 0.0002591231629491421, + "time_sec": 49.6348443031311 + }, + { + "epoch": 100, + "train_loss": 1.563120531387329, + "train_acc": 0.5575, + "test_loss": 7.321073220062256, + "test_acc": 0.0975, + "lyapunov": null, + "grad_norm": 0.6501432324709732, + "grad_max_sv": 0.22466112971305846, + "grad_min_sv": 1.1973627836447952e-08, + "grad_condition": 23144250.2743996, + "lr": 0.0002499999999999997, + "time_sec": 49.639625549316406 + }, + { + "epoch": 101, + "train_loss": 1.5544149493026733, + "train_acc": 0.562, + "test_loss": 8.2606175201416, + "test_acc": 0.0986, + "lyapunov": null, + "grad_norm": 0.6383634384668164, + "grad_max_sv": 0.22597188949584962, + "grad_min_sv": 1.1897128555232727e-08, + "grad_condition": 42860913.99555977, + "lr": 0.00024098649531343477, + "time_sec": 49.64992117881775 + }, + { + "epoch": 102, + "train_loss": 1.547795528869629, + "train_acc": 0.5621, + "test_loss": 7.994213732910156, + "test_acc": 0.1009, + "lyapunov": null, + "grad_norm": 0.6440457566084322, + "grad_max_sv": 0.22605536915361882, + "grad_min_sv": 1.21044593875963e-08, + "grad_condition": 23222249.12666279, + "lr": 0.0002320866025105016, + "time_sec": 49.638099670410156 + }, + { + "epoch": 103, + "train_loss": 1.5383813903045653, + "train_acc": 0.56598, + "test_loss": 8.507730350494384, + "test_acc": 0.0971, + "lyapunov": null, + "grad_norm": 0.6412277700079685, + "grad_max_sv": 0.2286630392074585, + "grad_min_sv": 1.1935943896451695e-08, + "grad_condition": 61496117.17851217, + "lr": 0.0002233042253783278, + "time_sec": 49.624167919158936 + }, + { + "epoch": 104, + "train_loss": 1.5296855780792236, + "train_acc": 0.56802, + "test_loss": 7.766149099731446, + "test_acc": 0.1005, + "lyapunov": null, + "grad_norm": 0.6402323929530521, + "grad_max_sv": 0.2234394859522581, + "grad_min_sv": 1.1708301472790339e-08, + "grad_condition": 51957414.29232074, + "lr": 0.000214643216157784, + "time_sec": 49.62683367729187 + }, + { + "epoch": 105, + "train_loss": 1.515010786781311, + "train_acc": 0.5704, + "test_loss": 7.568338539123535, + "test_acc": 0.1172, + "lyapunov": null, + "grad_norm": 0.6478082803296404, + "grad_max_sv": 0.23342282325029373, + "grad_min_sv": 1.216084826727304e-08, + "grad_condition": 26048714.73020513, + "lr": 0.00020610737385376332, + "time_sec": 49.63592481613159 + }, + { + "epoch": 106, + "train_loss": 1.512930496749878, + "train_acc": 0.56978, + "test_loss": 7.760108979797363, + "test_acc": 0.1047, + "lyapunov": null, + "grad_norm": 0.6453652740846443, + "grad_max_sv": 0.22414597682654858, + "grad_min_sv": 1.1973005337173603e-08, + "grad_condition": 26272467.73653502, + "lr": 0.00019770044256881242, + "time_sec": 49.61698055267334 + }, + { + "epoch": 107, + "train_loss": 1.4956118043899536, + "train_acc": 0.57444, + "test_loss": 8.33652488708496, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 0.6438260578925417, + "grad_max_sv": 0.2238406077027321, + "grad_min_sv": 1.1764498750177488e-08, + "grad_condition": 28981818.37375744, + "lr": 0.0001894261098608447, + "time_sec": 49.63762021064758 + }, + { + "epoch": 108, + "train_loss": 1.491361379776001, + "train_acc": 0.57876, + "test_loss": 8.52306475906372, + "test_acc": 0.1029, + "lyapunov": null, + "grad_norm": 0.6413105894442734, + "grad_max_sv": 0.22412343323230743, + "grad_min_sv": 1.2146300558402157e-08, + "grad_condition": 34732320.931619205, + "lr": 0.000181288005125655, + "time_sec": 49.6246235370636 + }, + { + "epoch": 109, + "train_loss": 1.4785979221343994, + "train_acc": 0.5778, + "test_loss": 7.686713803100586, + "test_acc": 0.0994, + "lyapunov": null, + "grad_norm": 0.6419467845001164, + "grad_max_sv": 0.22575648352503777, + "grad_min_sv": 1.1847785963414737e-08, + "grad_condition": 32480603.86279717, + "lr": 0.0001732896980049473, + "time_sec": 49.628063678741455 + }, + { + "epoch": 110, + "train_loss": 1.4723126147842407, + "train_acc": 0.57888, + "test_loss": 8.482755671691894, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 0.6427405399098718, + "grad_max_sv": 0.2258045580238104, + "grad_min_sv": 1.177179903347203e-08, + "grad_condition": 55737890.93326217, + "lr": 0.00016543469682057076, + "time_sec": 49.82239508628845 + }, + { + "epoch": 111, + "train_loss": 1.4714193873977661, + "train_acc": 0.5821, + "test_loss": 8.059153175354004, + "test_acc": 0.1095, + "lyapunov": null, + "grad_norm": 0.643358384906005, + "grad_max_sv": 0.2271666146814823, + "grad_min_sv": 1.1828724497814358e-08, + "grad_condition": 53541240.65537085, + "lr": 0.00015772644703565552, + "time_sec": 49.64692163467407 + }, + { + "epoch": 112, + "train_loss": 1.4565179361724854, + "train_acc": 0.58618, + "test_loss": 8.070704318237304, + "test_acc": 0.0989, + "lyapunov": null, + "grad_norm": 0.6414562113271406, + "grad_max_sv": 0.22715382017195224, + "grad_min_sv": 1.2078682694316445e-08, + "grad_condition": 27450211.87146064, + "lr": 0.00015016832974331713, + "time_sec": 49.634828329086304 + }, + { + "epoch": 113, + "train_loss": 1.445754097442627, + "train_acc": 0.58848, + "test_loss": 8.390233863830566, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 0.6411801061752302, + "grad_max_sv": 0.2343009330332279, + "grad_min_sv": 1.2054243894374373e-08, + "grad_condition": 73622071.21411385, + "lr": 0.00014276366018359834, + "time_sec": 49.62168598175049 + }, + { + "epoch": 114, + "train_loss": 1.4396562029647828, + "train_acc": 0.59112, + "test_loss": 7.990397840881347, + "test_acc": 0.1207, + "lyapunov": null, + "grad_norm": 0.6446675700592518, + "grad_max_sv": 0.22858907766640185, + "grad_min_sv": 1.2150255043752444e-08, + "grad_condition": 23031763.367673956, + "lr": 0.00013551568628929425, + "time_sec": 49.621737480163574 + }, + { + "epoch": 115, + "train_loss": 1.4295790006256104, + "train_acc": 0.5919, + "test_loss": 7.907929286956787, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 0.6414787996170513, + "grad_max_sv": 0.22259003035724162, + "grad_min_sv": 1.1937235663839196e-08, + "grad_condition": 26925988.130458646, + "lr": 0.00012842758726130276, + "time_sec": 49.702799558639526 + }, + { + "epoch": 116, + "train_loss": 1.419941686477661, + "train_acc": 0.59402, + "test_loss": 7.794718334197998, + "test_acc": 0.118, + "lyapunov": null, + "grad_norm": 0.6403562503796186, + "grad_max_sv": 0.23044625744223596, + "grad_min_sv": 1.1990111638271461e-08, + "grad_condition": 86324103.75912428, + "lr": 0.0001215024721741218, + "time_sec": 49.6519889831543 + }, + { + "epoch": 117, + "train_loss": 1.4125151259613038, + "train_acc": 0.59724, + "test_loss": 8.082193556976318, + "test_acc": 0.1093, + "lyapunov": null, + "grad_norm": 0.6390276536629967, + "grad_max_sv": 0.22913259454071522, + "grad_min_sv": 1.1846856870501021e-08, + "grad_condition": 38051050.155520104, + "lr": 0.00011474337861210538, + "time_sec": 49.67843008041382 + }, + { + "epoch": 118, + "train_loss": 1.4061624579238892, + "train_acc": 0.59848, + "test_loss": 7.994955434417725, + "test_acc": 0.1217, + "lyapunov": null, + "grad_norm": 0.6431427525608711, + "grad_max_sv": 0.22681293152272702, + "grad_min_sv": 1.2012494199353796e-08, + "grad_condition": 22440692.932778567, + "lr": 0.00010815327133708009, + "time_sec": 49.65889072418213 + }, + { + "epoch": 119, + "train_loss": 1.4033130680847168, + "train_acc": 0.59806, + "test_loss": 7.7351758087158204, + "test_acc": 0.1159, + "lyapunov": null, + "grad_norm": 0.6393512801434791, + "grad_max_sv": 0.22470695674419403, + "grad_min_sv": 1.173807711446484e-08, + "grad_condition": 33523113.628067147, + "lr": 0.00010173504098790182, + "time_sec": 49.65284276008606 + }, + { + "epoch": 120, + "train_loss": 1.3988560864257813, + "train_acc": 0.59928, + "test_loss": 8.596598931121827, + "test_acc": 0.104, + "lyapunov": null, + "grad_norm": 0.6430512338238313, + "grad_max_sv": 0.23124604262411594, + "grad_min_sv": 1.2035057309067731e-08, + "grad_condition": 27263284.07382477, + "lr": 9.549150281252629e-05, + "time_sec": 49.64090633392334 + }, + { + "epoch": 121, + "train_loss": 1.3857270031356812, + "train_acc": 0.60484, + "test_loss": 7.9892033752441405, + "test_acc": 0.1183, + "lyapunov": null, + "grad_norm": 0.6395461283787793, + "grad_max_sv": 0.22570451460778712, + "grad_min_sv": 1.2030840006518884e-08, + "grad_condition": 53181043.26539834, + "lr": 8.942539543314794e-05, + "time_sec": 49.60771918296814 + }, + { + "epoch": 122, + "train_loss": 1.3880330154037475, + "train_acc": 0.60376, + "test_loss": 8.22642307357788, + "test_acc": 0.115, + "lyapunov": null, + "grad_norm": 0.6427946655580464, + "grad_max_sv": 0.22782764062285424, + "grad_min_sv": 1.1785313203116487e-08, + "grad_condition": 24787267.408791415, + "lr": 8.353937964495024e-05, + "time_sec": 49.64048886299133 + }, + { + "epoch": 123, + "train_loss": 1.377012547569275, + "train_acc": 0.60464, + "test_loss": 7.7657553009033204, + "test_acc": 0.114, + "lyapunov": null, + "grad_norm": 0.6396634441881897, + "grad_max_sv": 0.23086622469127177, + "grad_min_sv": 1.198922548739656e-08, + "grad_condition": 23123320.372294467, + "lr": 7.783603724899243e-05, + "time_sec": 49.63312888145447 + }, + { + "epoch": 124, + "train_loss": 1.376011091003418, + "train_acc": 0.60928, + "test_loss": 7.944722248840332, + "test_acc": 0.1039, + "lyapunov": null, + "grad_norm": 0.6321494808563242, + "grad_max_sv": 0.22378434427082539, + "grad_min_sv": 1.1604401764855887e-08, + "grad_condition": 58244211.34800786, + "lr": 7.231786991974666e-05, + "time_sec": 49.64424800872803 + }, + { + "epoch": 125, + "train_loss": 1.368886891708374, + "train_acc": 0.60824, + "test_loss": 8.258360435485839, + "test_acc": 0.1147, + "lyapunov": null, + "grad_norm": 0.6400148651728099, + "grad_max_sv": 0.22423702478408813, + "grad_min_sv": 1.175346897655527e-08, + "grad_condition": 47951723.35743973, + "lr": 6.698729810778072e-05, + "time_sec": 49.635197162628174 + }, + { + "epoch": 126, + "train_loss": 1.368887268447876, + "train_acc": 0.60784, + "test_loss": 8.00912710647583, + "test_acc": 0.1098, + "lyapunov": null, + "grad_norm": 0.6414620945866057, + "grad_max_sv": 0.22984928116202355, + "grad_min_sv": 1.1862470802870284e-08, + "grad_condition": 27488218.9085432, + "lr": 6.184665997806817e-05, + "time_sec": 49.63115334510803 + }, + { + "epoch": 127, + "train_loss": 1.3691972059631348, + "train_acc": 0.60894, + "test_loss": 8.099956825256347, + "test_acc": 0.1137, + "lyapunov": null, + "grad_norm": 0.6379342286587659, + "grad_max_sv": 0.22721209563314915, + "grad_min_sv": 1.1842124452571268e-08, + "grad_condition": 66054597.76675473, + "lr": 5.6898210384392595e-05, + "time_sec": 49.64264273643494 + }, + { + "epoch": 128, + "train_loss": 1.3585320538711547, + "train_acc": 0.61176, + "test_loss": 8.168904312896728, + "test_acc": 0.1178, + "lyapunov": null, + "grad_norm": 0.6384779111033096, + "grad_max_sv": 0.2258748199790716, + "grad_min_sv": 1.1702591148909925e-08, + "grad_condition": 121211424.44652918, + "lr": 5.214411988029363e-05, + "time_sec": 49.62958645820618 + }, + { + "epoch": 129, + "train_loss": 1.3585711254501343, + "train_acc": 0.6101, + "test_loss": 7.90961298828125, + "test_acc": 0.1095, + "lyapunov": null, + "grad_norm": 0.6412738082737135, + "grad_max_sv": 0.22799600511789322, + "grad_min_sv": 1.2047476663501478e-08, + "grad_condition": 44984170.42448841, + "lr": 4.7586473766990294e-05, + "time_sec": 49.62019920349121 + }, + { + "epoch": 130, + "train_loss": 1.3606473222351074, + "train_acc": 0.60866, + "test_loss": 7.8885728500366215, + "test_acc": 0.1165, + "lyapunov": null, + "grad_norm": 0.6429377341506345, + "grad_max_sv": 0.22763566635549068, + "grad_min_sv": 1.1949406383826578e-08, + "grad_condition": 23238593.216242827, + "lr": 4.32272711786996e-05, + "time_sec": 49.60610270500183 + }, + { + "epoch": 131, + "train_loss": 1.340769683189392, + "train_acc": 0.61422, + "test_loss": 7.97282382888794, + "test_acc": 0.1176, + "lyapunov": null, + "grad_norm": 0.6365898965081005, + "grad_max_sv": 0.22698684968054295, + "grad_min_sv": 1.1841301903944835e-08, + "grad_condition": 57050057.91630666, + "lr": 3.906842420574966e-05, + "time_sec": 49.639729738235474 + }, + { + "epoch": 132, + "train_loss": 1.3506625385284423, + "train_acc": 0.61254, + "test_loss": 8.237340574645996, + "test_acc": 0.1112, + "lyapunov": null, + "grad_norm": 0.6405822016126281, + "grad_max_sv": 0.2313113920390606, + "grad_min_sv": 1.1943680751358432e-08, + "grad_condition": 32855860.000038534, + "lr": 3.5111757055874305e-05, + "time_sec": 49.62140464782715 + }, + { + "epoch": 133, + "train_loss": 1.3537355774307251, + "train_acc": 0.60946, + "test_loss": 8.220967332458496, + "test_acc": 0.1107, + "lyapunov": null, + "grad_norm": 0.6424071935223469, + "grad_max_sv": 0.2330889504402876, + "grad_min_sv": 1.1997084857148787e-08, + "grad_condition": 44613447.03937371, + "lr": 3.1359005254054254e-05, + "time_sec": 49.62578868865967 + }, + { + "epoch": 134, + "train_loss": 1.33552843044281, + "train_acc": 0.61362, + "test_loss": 8.059291929626465, + "test_acc": 0.1019, + "lyapunov": null, + "grad_norm": 0.6408761914883747, + "grad_max_sv": 0.2316820841282606, + "grad_min_sv": 1.1778968132813982e-08, + "grad_condition": 105523171.68805893, + "lr": 2.7811814881259484e-05, + "time_sec": 49.62417006492615 + }, + { + "epoch": 135, + "train_loss": 1.3386833112335206, + "train_acc": 0.61374, + "test_loss": 7.973577444458008, + "test_acc": 0.1097, + "lyapunov": null, + "grad_norm": 0.6388300432658766, + "grad_max_sv": 0.22841673195362092, + "grad_min_sv": 1.1936609616361448e-08, + "grad_condition": 69324765.09964362, + "lr": 2.4471741852423218e-05, + "time_sec": 49.65416145324707 + }, + { + "epoch": 136, + "train_loss": 1.3311992990112305, + "train_acc": 0.618, + "test_loss": 8.200102568817139, + "test_acc": 0.1214, + "lyapunov": null, + "grad_norm": 0.638950694855791, + "grad_max_sv": 0.2365179505199194, + "grad_min_sv": 1.1939427453644402e-08, + "grad_condition": 27475716.41514334, + "lr": 2.1340251233966362e-05, + "time_sec": 49.64095640182495 + }, + { + "epoch": 137, + "train_loss": 1.3340746058273316, + "train_acc": 0.61812, + "test_loss": 7.946666102600098, + "test_acc": 0.1106, + "lyapunov": null, + "grad_norm": 0.6352812169452327, + "grad_max_sv": 0.22020692974328995, + "grad_min_sv": 1.1623311241271139e-08, + "grad_condition": 29930613.060724013, + "lr": 1.8418716601170932e-05, + "time_sec": 49.633143186569214 + }, + { + "epoch": 138, + "train_loss": 1.336420276031494, + "train_acc": 0.61512, + "test_loss": 8.25653330230713, + "test_acc": 0.112, + "lyapunov": null, + "grad_norm": 0.6397251204580275, + "grad_max_sv": 0.23347726799547672, + "grad_min_sv": 1.1918404803357152e-08, + "grad_condition": 81456104.36957063, + "lr": 1.570841943568445e-05, + "time_sec": 49.639748334884644 + }, + { + "epoch": 139, + "train_loss": 1.3220760538482665, + "train_acc": 0.61838, + "test_loss": 8.026485778808594, + "test_acc": 0.1138, + "lyapunov": null, + "grad_norm": 0.6398193491025633, + "grad_max_sv": 0.2238193929195404, + "grad_min_sv": 1.1681687835801702e-08, + "grad_condition": 38144371.645152286, + "lr": 1.3210548563419845e-05, + "time_sec": 49.63212180137634 + }, + { + "epoch": 140, + "train_loss": 1.3198553924942016, + "train_acc": 0.61854, + "test_loss": 8.029016185760499, + "test_acc": 0.1179, + "lyapunov": null, + "grad_norm": 0.639466602267434, + "grad_max_sv": 0.22324420213699342, + "grad_min_sv": 1.1702349164699477e-08, + "grad_condition": 28474783.149248235, + "lr": 1.0926199633097203e-05, + "time_sec": 49.65198302268982 + }, + { + "epoch": 141, + "train_loss": 1.3253049739837646, + "train_acc": 0.62014, + "test_loss": 8.258732906341553, + "test_acc": 0.1086, + "lyapunov": null, + "grad_norm": 0.6377969869493302, + "grad_max_sv": 0.23066396303474904, + "grad_min_sv": 1.1955105984340354e-08, + "grad_condition": 28290681.03527581, + "lr": 8.856374635655688e-06, + "time_sec": 49.712565183639526 + }, + { + "epoch": 142, + "train_loss": 1.3294593518066407, + "train_acc": 0.6165, + "test_loss": 8.097643237304688, + "test_acc": 0.1079, + "lyapunov": null, + "grad_norm": 0.6416721044495594, + "grad_max_sv": 0.22946001626551152, + "grad_min_sv": 1.1918349693273988e-08, + "grad_condition": 33830275.99348913, + "lr": 7.001981464747503e-06, + "time_sec": 49.62647032737732 + }, + { + "epoch": 143, + "train_loss": 1.3246013949203492, + "train_acc": 0.619, + "test_loss": 8.003326276397704, + "test_acc": 0.1093, + "lyapunov": null, + "grad_norm": 0.6406658358506779, + "grad_max_sv": 0.22979442439973355, + "grad_min_sv": 1.1885957310075503e-08, + "grad_condition": 1265929967.3983974, + "lr": 5.3638335185058295e-06, + "time_sec": 49.64323043823242 + }, + { + "epoch": 144, + "train_loss": 1.3237170028686522, + "train_acc": 0.61912, + "test_loss": 8.245773946380615, + "test_acc": 0.1116, + "lyapunov": null, + "grad_norm": 0.640154182788332, + "grad_max_sv": 0.22960694395005704, + "grad_min_sv": 1.1789325913159205e-08, + "grad_condition": 220785020.05461937, + "lr": 3.942649342761114e-06, + "time_sec": 49.62677884101868 + }, + { + "epoch": 145, + "train_loss": 1.323034522781372, + "train_acc": 0.61748, + "test_loss": 8.367132460784912, + "test_acc": 0.1101, + "lyapunov": null, + "grad_norm": 0.6399875505077857, + "grad_max_sv": 0.2292648758739233, + "grad_min_sv": 1.1756407276852787e-08, + "grad_condition": 46749240.33218758, + "lr": 2.7390523158633524e-06, + "time_sec": 49.61358666419983 + }, + { + "epoch": 146, + "train_loss": 1.3221456618118286, + "train_acc": 0.61958, + "test_loss": 8.256616510772705, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 0.6401843350865242, + "grad_max_sv": 0.23075628280639648, + "grad_min_sv": 1.1929567545268527e-08, + "grad_condition": 56821403.658394314, + "lr": 1.7535703752478133e-06, + "time_sec": 49.62871527671814 + }, + { + "epoch": 147, + "train_loss": 1.32188304227829, + "train_acc": 0.62262, + "test_loss": 7.983602857208252, + "test_acc": 0.115, + "lyapunov": null, + "grad_norm": 0.6377455957871468, + "grad_max_sv": 0.2265624139457941, + "grad_min_sv": 1.1661963828825395e-08, + "grad_condition": 178436067.44761798, + "lr": 9.866357858642196e-07, + "time_sec": 49.63710594177246 + }, + { + "epoch": 148, + "train_loss": 1.3234341220855712, + "train_acc": 0.61708, + "test_loss": 8.329111752319337, + "test_acc": 0.1046, + "lyapunov": null, + "grad_norm": 0.6428801038701755, + "grad_max_sv": 0.2313603863120079, + "grad_min_sv": 1.1845945344264585e-08, + "grad_condition": 144408842.21709472, + "lr": 4.38584950570808e-07, + "time_sec": 49.63905072212219 + }, + { + "epoch": 149, + "train_loss": 1.3202154207611083, + "train_acc": 0.61986, + "test_loss": 8.021684009552002, + "test_acc": 0.1127, + "lyapunov": null, + "grad_norm": 0.6406912156142667, + "grad_max_sv": 0.2288107428699732, + "grad_min_sv": 1.181119294590971e-08, + "grad_condition": 65688308.80478315, + "lr": 1.096582625772501e-07, + "time_sec": 49.61029553413391 + }, + { + "epoch": 150, + "train_loss": 1.3158636585235595, + "train_acc": 0.62006, + "test_loss": 8.094485763549805, + "test_acc": 0.1123, + "lyapunov": null, + "grad_norm": 0.6406489877650078, + "grad_max_sv": 0.23017469234764576, + "grad_min_sv": 1.1906818318807578e-08, + "grad_condition": 37789807.4961655, + "lr": 0.0, + "time_sec": 49.65584897994995 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.089254416656495, + "train_acc": 0.01344, + "test_loss": 4.870831555175781, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 5.582063459208639, + "grad_max_sv": 5.0306542873382565, + "grad_min_sv": 8.441757832766683e-08, + "grad_condition": 74707534.78681344, + "lr": 0.0009998903417374227, + "time_sec": 66.70097637176514 + }, + { + "epoch": 2, + "train_loss": 4.736304296569824, + "train_acc": 0.02172, + "test_loss": 4.92340059890747, + "test_acc": 0.01, + "lyapunov": null, + "grad_norm": 4.087296772772229, + "grad_max_sv": 3.672157108783722, + "grad_min_sv": 6.109624839933935e-08, + "grad_condition": 230714811.36310124, + "lr": 0.0009995614150494292, + "time_sec": 66.83215641975403 + }, + { + "epoch": 3, + "train_loss": 4.52685978515625, + "train_acc": 0.03204, + "test_loss": 5.045831031799317, + "test_acc": 0.0094, + "lyapunov": null, + "grad_norm": 3.1470044543912175, + "grad_max_sv": 2.6447540044784548, + "grad_min_sv": 4.639755384339139e-08, + "grad_condition": 65625701.84585605, + "lr": 0.0009990133642141358, + "time_sec": 66.70765495300293 + }, + { + "epoch": 4, + "train_loss": 4.371717319641113, + "train_acc": 0.04112, + "test_loss": 4.993129699707032, + "test_acc": 0.0115, + "lyapunov": null, + "grad_norm": 2.5123688948843395, + "grad_max_sv": 2.1027904629707335, + "grad_min_sv": 3.615837387664633e-08, + "grad_condition": 418817692.03399765, + "lr": 0.0009982464296247522, + "time_sec": 66.70319509506226 + }, + { + "epoch": 5, + "train_loss": 4.27407361251831, + "train_acc": 0.0488, + "test_loss": 5.161634465789795, + "test_acc": 0.0119, + "lyapunov": null, + "grad_norm": 1.9573801826064445, + "grad_max_sv": 1.613087645173073, + "grad_min_sv": 2.8529539808364034e-08, + "grad_condition": 62747668.20627429, + "lr": 0.0009972609476841367, + "time_sec": 66.74726390838623 + }, + { + "epoch": 6, + "train_loss": 4.183251854553222, + "train_acc": 0.05812, + "test_loss": 5.447854755401611, + "test_acc": 0.0093, + "lyapunov": null, + "grad_norm": 1.436449079599314, + "grad_max_sv": 1.0459295481443405, + "grad_min_sv": 2.0654144772258576e-08, + "grad_condition": 94732574.16372415, + "lr": 0.000996057350657239, + "time_sec": 66.68073081970215 + }, + { + "epoch": 7, + "train_loss": 4.103355536193848, + "train_acc": 0.06872, + "test_loss": 5.544150679016114, + "test_acc": 0.0124, + "lyapunov": null, + "grad_norm": 1.082624040556548, + "grad_max_sv": 0.678101472556591, + "grad_min_sv": 1.6660088839048904e-08, + "grad_condition": 49338508.46283151, + "lr": 0.000994636166481494, + "time_sec": 66.77410340309143 + }, + { + "epoch": 8, + "train_loss": 4.040529095458984, + "train_acc": 0.07876, + "test_loss": 5.577163777160645, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.963869121683512, + "grad_max_sv": 0.5578698106110096, + "grad_min_sv": 1.4817374840991882e-08, + "grad_condition": 46172185.25999212, + "lr": 0.0009929980185352525, + "time_sec": 66.7442455291748 + }, + { + "epoch": 9, + "train_loss": 3.999490645446777, + "train_acc": 0.0856, + "test_loss": 5.472281336975097, + "test_acc": 0.0116, + "lyapunov": null, + "grad_norm": 0.9198022107734598, + "grad_max_sv": 0.5003849364817142, + "grad_min_sv": 1.3862486752946878e-08, + "grad_condition": 137028895.09887612, + "lr": 0.0009911436253643444, + "time_sec": 66.71199488639832 + }, + { + "epoch": 10, + "train_loss": 3.9641557629394533, + "train_acc": 0.09124, + "test_loss": 5.43024553604126, + "test_acc": 0.0112, + "lyapunov": null, + "grad_norm": 0.8539816540258655, + "grad_max_sv": 0.4397390566766262, + "grad_min_sv": 1.3177782898221579e-08, + "grad_condition": 50953468.3517745, + "lr": 0.0009890738003669028, + "time_sec": 66.71694684028625 + }, + { + "epoch": 11, + "train_loss": 3.9142907052612306, + "train_acc": 0.09788, + "test_loss": 5.24972756652832, + "test_acc": 0.0174, + "lyapunov": null, + "grad_norm": 0.8303589651826888, + "grad_max_sv": 0.4246540553867817, + "grad_min_sv": 1.288730961390705e-08, + "grad_condition": 88294678.08247125, + "lr": 0.00098678945143658, + "time_sec": 66.70689487457275 + }, + { + "epoch": 12, + "train_loss": 3.881778168411255, + "train_acc": 0.1037, + "test_loss": 5.765969756317139, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.7855031029198277, + "grad_max_sv": 0.3756070680916309, + "grad_min_sv": 1.2611303298881715e-08, + "grad_condition": 36786532.210794725, + "lr": 0.0009842915805643154, + "time_sec": 66.73540306091309 + }, + { + "epoch": 13, + "train_loss": 3.8490214154815674, + "train_acc": 0.1068, + "test_loss": 5.832162282562256, + "test_acc": 0.0138, + "lyapunov": null, + "grad_norm": 0.7681061932199776, + "grad_max_sv": 0.3604050487279892, + "grad_min_sv": 1.2243067453593382e-08, + "grad_condition": 131143000.26933214, + "lr": 0.000981581283398829, + "time_sec": 66.73431468009949 + }, + { + "epoch": 14, + "train_loss": 3.828877674636841, + "train_acc": 0.11234, + "test_loss": 6.293205305480957, + "test_acc": 0.0134, + "lyapunov": null, + "grad_norm": 0.7460407539013362, + "grad_max_sv": 0.34510768875479697, + "grad_min_sv": 1.1813573212726692e-08, + "grad_condition": 49629148.15911349, + "lr": 0.0009786597487660333, + "time_sec": 66.77479386329651 + }, + { + "epoch": 15, + "train_loss": 3.803487832107544, + "train_acc": 0.1159, + "test_loss": 6.4087516273498535, + "test_acc": 0.013, + "lyapunov": null, + "grad_norm": 0.716379034773642, + "grad_max_sv": 0.3261814657598734, + "grad_min_sv": 1.1572917107960378e-08, + "grad_condition": 31644703.4401185, + "lr": 0.0009755282581475766, + "time_sec": 66.73083448410034 + }, + { + "epoch": 16, + "train_loss": 3.7821172668457033, + "train_acc": 0.11904, + "test_loss": 6.406122239685058, + "test_acc": 0.0123, + "lyapunov": null, + "grad_norm": 0.697749546532161, + "grad_max_sv": 0.31582852490246294, + "grad_min_sv": 1.1393312793206434e-08, + "grad_condition": 39132519.74005551, + "lr": 0.0009721881851187403, + "time_sec": 66.74327826499939 + }, + { + "epoch": 17, + "train_loss": 3.7480180199432374, + "train_acc": 0.12526, + "test_loss": 6.8633532814025875, + "test_acc": 0.0132, + "lyapunov": null, + "grad_norm": 0.6758633251362415, + "grad_max_sv": 0.2994280070066452, + "grad_min_sv": 1.1069095015581176e-08, + "grad_condition": 36563832.03358241, + "lr": 0.0009686409947459456, + "time_sec": 66.76521873474121 + }, + { + "epoch": 18, + "train_loss": 3.730831000213623, + "train_acc": 0.12792, + "test_loss": 6.246407075500488, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.664831990265232, + "grad_max_sv": 0.2994547080248594, + "grad_min_sv": 1.0997234457625626e-08, + "grad_condition": 122736750.78260681, + "lr": 0.0009648882429441254, + "time_sec": 66.71729445457458 + }, + { + "epoch": 19, + "train_loss": 3.716553072052002, + "train_acc": 0.12942, + "test_loss": 5.873876965332031, + "test_acc": 0.0149, + "lyapunov": null, + "grad_norm": 0.6518241757841252, + "grad_max_sv": 0.29539270177483556, + "grad_min_sv": 1.0741561572852331e-08, + "grad_condition": 49669322.25294405, + "lr": 0.00096093157579425, + "time_sec": 66.81875944137573 + }, + { + "epoch": 20, + "train_loss": 3.6975706172180174, + "train_acc": 0.13298, + "test_loss": 6.400744886779785, + "test_acc": 0.0155, + "lyapunov": null, + "grad_norm": 0.6347864002121714, + "grad_max_sv": 0.28284979946911337, + "grad_min_sv": 1.0701284272607303e-08, + "grad_condition": 30013146.4819826, + "lr": 0.0009567727288213001, + "time_sec": 66.8477098941803 + }, + { + "epoch": 21, + "train_loss": 3.673498316040039, + "train_acc": 0.13564, + "test_loss": 6.160238801574707, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.6252581472584972, + "grad_max_sv": 0.27260397262871267, + "grad_min_sv": 1.0594542484282377e-08, + "grad_condition": 46350413.24314589, + "lr": 0.0009524135262330095, + "time_sec": 66.72814178466797 + }, + { + "epoch": 22, + "train_loss": 3.654527678833008, + "train_acc": 0.1393, + "test_loss": 6.9474281982421875, + "test_acc": 0.0176, + "lyapunov": null, + "grad_norm": 0.6149063083720292, + "grad_max_sv": 0.26224171184003353, + "grad_min_sv": 1.035294387718988e-08, + "grad_condition": 32282705.350815333, + "lr": 0.0009478558801197061, + "time_sec": 66.82811260223389 + }, + { + "epoch": 23, + "train_loss": 3.6450364729309084, + "train_acc": 0.14028, + "test_loss": 7.2393467880249025, + "test_acc": 0.0127, + "lyapunov": null, + "grad_norm": 0.6067467053692205, + "grad_max_sv": 0.26614573895931243, + "grad_min_sv": 1.0267544686692886e-08, + "grad_condition": 28213061.075003404, + "lr": 0.000943101789615607, + "time_sec": 66.74721336364746 + }, + { + "epoch": 24, + "train_loss": 3.623104200592041, + "train_acc": 0.14594, + "test_loss": 6.526107063293457, + "test_acc": 0.0187, + "lyapunov": null, + "grad_norm": 0.5980858749774747, + "grad_max_sv": 0.25203392654657364, + "grad_min_sv": 1.0098680717357534e-08, + "grad_condition": 50563247.00258337, + "lr": 0.0009381533400219313, + "time_sec": 66.77076554298401 + }, + { + "epoch": 25, + "train_loss": 3.6136645338439943, + "train_acc": 0.14728, + "test_loss": 7.030907647705078, + "test_acc": 0.0182, + "lyapunov": null, + "grad_norm": 0.594016587561951, + "grad_max_sv": 0.25378315448760985, + "grad_min_sv": 9.976338428627219e-09, + "grad_condition": 72065195.62747766, + "lr": 0.0009330127018922189, + "time_sec": 66.78083634376526 + }, + { + "epoch": 26, + "train_loss": 3.5951533477020265, + "train_acc": 0.15, + "test_loss": 6.8098891067504885, + "test_acc": 0.0193, + "lyapunov": null, + "grad_norm": 0.5888833643522708, + "grad_max_sv": 0.24365438856184482, + "grad_min_sv": 9.933017187935267e-09, + "grad_condition": 44149369.91233202, + "lr": 0.000927682130080253, + "time_sec": 66.72774887084961 + }, + { + "epoch": 27, + "train_loss": 3.5870719739532473, + "train_acc": 0.15012, + "test_loss": 6.188968405151368, + "test_acc": 0.0198, + "lyapunov": null, + "grad_norm": 0.5778870286561091, + "grad_max_sv": 0.23904258161783218, + "grad_min_sv": 9.864321945385335e-09, + "grad_condition": 29413784.94482057, + "lr": 0.0009221639627510072, + "time_sec": 66.7466390132904 + }, + { + "epoch": 28, + "train_loss": 3.5677108099365236, + "train_acc": 0.15438, + "test_loss": 7.111977198028565, + "test_acc": 0.0186, + "lyapunov": null, + "grad_norm": 0.565332521044754, + "grad_max_sv": 0.22653766870498657, + "grad_min_sv": 9.587734812674387e-09, + "grad_condition": 61781100.03898337, + "lr": 0.0009164606203550494, + "time_sec": 66.74424004554749 + }, + { + "epoch": 29, + "train_loss": 3.5525446216583254, + "train_acc": 0.1561, + "test_loss": 6.844758932495117, + "test_acc": 0.0209, + "lyapunov": null, + "grad_norm": 0.5709459777275144, + "grad_max_sv": 0.22716681994497775, + "grad_min_sv": 9.63618568827762e-09, + "grad_condition": 26044218.51829529, + "lr": 0.0009105746045668516, + "time_sec": 66.73790216445923 + }, + { + "epoch": 30, + "train_loss": 3.5511199297332765, + "train_acc": 0.15632, + "test_loss": 6.829617092895508, + "test_acc": 0.0179, + "lyapunov": null, + "grad_norm": 0.5599177583176913, + "grad_max_sv": 0.22315906584262848, + "grad_min_sv": 9.481845958392298e-09, + "grad_condition": 31696446.039096247, + "lr": 0.0009045084971874733, + "time_sec": 66.74309277534485 + }, + { + "epoch": 31, + "train_loss": 3.5346223778533936, + "train_acc": 0.15964, + "test_loss": 7.171929656982422, + "test_acc": 0.0181, + "lyapunov": null, + "grad_norm": 0.5560980115082016, + "grad_max_sv": 0.22190811820328235, + "grad_min_sv": 9.472099816998369e-09, + "grad_condition": 65999783.19253375, + "lr": 0.0008982649590120977, + "time_sec": 66.72736811637878 + }, + { + "epoch": 32, + "train_loss": 3.523619603424072, + "train_acc": 0.16298, + "test_loss": 7.11264291381836, + "test_acc": 0.0196, + "lyapunov": null, + "grad_norm": 0.5484008571230936, + "grad_max_sv": 0.21031202785670758, + "grad_min_sv": 9.324677128358382e-09, + "grad_condition": 59831756.702754, + "lr": 0.0008918467286629196, + "time_sec": 66.70681715011597 + }, + { + "epoch": 33, + "train_loss": 3.503953924026489, + "train_acc": 0.1662, + "test_loss": 6.848249008178711, + "test_acc": 0.0242, + "lyapunov": null, + "grad_norm": 0.5416204323895276, + "grad_max_sv": 0.2181798741221428, + "grad_min_sv": 9.399793365156769e-09, + "grad_condition": 389136802.1825175, + "lr": 0.0008852566213878943, + "time_sec": 66.73786091804504 + }, + { + "epoch": 34, + "train_loss": 3.505652629928589, + "train_acc": 0.16502, + "test_loss": 6.877189469909668, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.5355113980631458, + "grad_max_sv": 0.20969012342393398, + "grad_min_sv": 9.270577998321538e-09, + "grad_condition": 31525454.84069126, + "lr": 0.000878497527825878, + "time_sec": 66.72686457633972 + }, + { + "epoch": 35, + "train_loss": 3.486978895339966, + "train_acc": 0.16714, + "test_loss": 7.1552359481811525, + "test_acc": 0.0172, + "lyapunov": null, + "grad_norm": 0.5346080374847578, + "grad_max_sv": 0.20298720821738242, + "grad_min_sv": 9.306896420202548e-09, + "grad_condition": 25441508.50613912, + "lr": 0.000871572412738697, + "time_sec": 66.75551271438599 + }, + { + "epoch": 36, + "train_loss": 3.479604592208862, + "train_acc": 0.16902, + "test_loss": 6.844674809265137, + "test_acc": 0.0223, + "lyapunov": null, + "grad_norm": 0.5311517334543933, + "grad_max_sv": 0.20205551721155643, + "grad_min_sv": 9.200601613218452e-09, + "grad_condition": 45450108.39040236, + "lr": 0.0008644843137107055, + "time_sec": 66.7082417011261 + }, + { + "epoch": 37, + "train_loss": 3.4750630870819093, + "train_acc": 0.16898, + "test_loss": 7.165343771362305, + "test_acc": 0.0171, + "lyapunov": null, + "grad_norm": 0.5255800840531358, + "grad_max_sv": 0.19590781554579734, + "grad_min_sv": 9.155419039910683e-09, + "grad_condition": 108339245.17679186, + "lr": 0.0008572363398164014, + "time_sec": 66.71217584609985 + }, + { + "epoch": 38, + "train_loss": 3.461921478424072, + "train_acc": 0.17176, + "test_loss": 7.6983903167724606, + "test_acc": 0.0204, + "lyapunov": null, + "grad_norm": 0.5291599359124736, + "grad_max_sv": 0.19806304536759853, + "grad_min_sv": 9.252919158653227e-09, + "grad_condition": 26129114.857841287, + "lr": 0.0008498316702566826, + "time_sec": 66.83607125282288 + }, + { + "epoch": 39, + "train_loss": 3.4502412219238283, + "train_acc": 0.1729, + "test_loss": 6.8047522277832035, + "test_acc": 0.0213, + "lyapunov": null, + "grad_norm": 0.5281639901017625, + "grad_max_sv": 0.20096433460712432, + "grad_min_sv": 9.085016680621116e-09, + "grad_condition": 33958186.51443162, + "lr": 0.0008422735529643442, + "time_sec": 66.73851490020752 + }, + { + "epoch": 40, + "train_loss": 3.4376924714660646, + "train_acc": 0.17616, + "test_loss": 7.263092966461182, + "test_acc": 0.0182, + "lyapunov": null, + "grad_norm": 0.5216932066323713, + "grad_max_sv": 0.19504240863025188, + "grad_min_sv": 9.154586153026223e-09, + "grad_condition": 25458573.387380652, + "lr": 0.0008345653031794289, + "time_sec": 66.7052755355835 + }, + { + "epoch": 41, + "train_loss": 3.4279933405303957, + "train_acc": 0.17836, + "test_loss": 6.396369320678711, + "test_acc": 0.0195, + "lyapunov": null, + "grad_norm": 0.5194410647845549, + "grad_max_sv": 0.19078941717743875, + "grad_min_sv": 9.012956635884306e-09, + "grad_condition": 42363604.716461524, + "lr": 0.0008267103019950526, + "time_sec": 66.72479486465454 + }, + { + "epoch": 42, + "train_loss": 3.4256856929016113, + "train_acc": 0.17732, + "test_loss": 6.679870991516113, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.5198265520764738, + "grad_max_sv": 0.19169757179915906, + "grad_min_sv": 9.036233127035497e-09, + "grad_condition": 51260505.579239644, + "lr": 0.0008187119948743447, + "time_sec": 66.75225281715393 + }, + { + "epoch": 43, + "train_loss": 3.411117221832275, + "train_acc": 0.18158, + "test_loss": 7.357481904602051, + "test_acc": 0.0185, + "lyapunov": null, + "grad_norm": 0.5156740849780826, + "grad_max_sv": 0.19417562745511532, + "grad_min_sv": 9.037307471815303e-09, + "grad_condition": 35283510.30299447, + "lr": 0.000810573890139155, + "time_sec": 66.72709918022156 + }, + { + "epoch": 44, + "train_loss": 3.4085953338623045, + "train_acc": 0.18096, + "test_loss": 7.635249890899658, + "test_acc": 0.0161, + "lyapunov": null, + "grad_norm": 0.5119612982206426, + "grad_max_sv": 0.18738919235765933, + "grad_min_sv": 8.878314214366689e-09, + "grad_condition": 31365951.59678828, + "lr": 0.0008022995574311873, + "time_sec": 66.72823333740234 + }, + { + "epoch": 45, + "train_loss": 3.391282188873291, + "train_acc": 0.18358, + "test_loss": 7.057773623657226, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.512636753960722, + "grad_max_sv": 0.18591308295726777, + "grad_min_sv": 8.905265155845221e-09, + "grad_condition": 34037092.10974729, + "lr": 0.0007938926261462363, + "time_sec": 66.75207853317261 + }, + { + "epoch": 46, + "train_loss": 3.385137359466553, + "train_acc": 0.18694, + "test_loss": 7.400888244628907, + "test_acc": 0.0212, + "lyapunov": null, + "grad_norm": 0.5082656505289807, + "grad_max_sv": 0.18733446709811688, + "grad_min_sv": 8.893193696474926e-09, + "grad_condition": 125851280.80010274, + "lr": 0.0007853567838422158, + "time_sec": 66.7163679599762 + }, + { + "epoch": 47, + "train_loss": 3.376342626800537, + "train_acc": 0.18838, + "test_loss": 7.475112818908691, + "test_acc": 0.0175, + "lyapunov": null, + "grad_norm": 0.5045706953392911, + "grad_max_sv": 0.18063193671405314, + "grad_min_sv": 8.950101182403359e-09, + "grad_condition": 22625503.611506984, + "lr": 0.0007766957746216719, + "time_sec": 66.7100522518158 + }, + { + "epoch": 48, + "train_loss": 3.3649324946594237, + "train_acc": 0.18694, + "test_loss": 8.045938752746583, + "test_acc": 0.0189, + "lyapunov": null, + "grad_norm": 0.5007866825544302, + "grad_max_sv": 0.1830794021487236, + "grad_min_sv": 8.805358707453248e-09, + "grad_condition": 27558131.426934887, + "lr": 0.0007679133974894982, + "time_sec": 66.70468735694885 + }, + { + "epoch": 49, + "train_loss": 3.3610028453063965, + "train_acc": 0.1888, + "test_loss": 7.112044483947754, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 0.5007184914478864, + "grad_max_sv": 0.18336209803819656, + "grad_min_sv": 9.024269038288013e-09, + "grad_condition": 33518235.006607275, + "lr": 0.000759013504686565, + "time_sec": 66.7611026763916 + }, + { + "epoch": 50, + "train_loss": 3.3484571326446533, + "train_acc": 0.1906, + "test_loss": 7.519181715393066, + "test_acc": 0.0209, + "lyapunov": null, + "grad_norm": 0.5018491559425493, + "grad_max_sv": 0.18028105311095716, + "grad_min_sv": 8.925991949043643e-09, + "grad_condition": 33524852.83647134, + "lr": 0.0007499999999999998, + "time_sec": 66.76505136489868 + }, + { + "epoch": 51, + "train_loss": 3.3410891053009033, + "train_acc": 0.1921, + "test_loss": 7.056560147094727, + "test_acc": 0.0249, + "lyapunov": null, + "grad_norm": 0.4996656726107064, + "grad_max_sv": 0.17895969636738301, + "grad_min_sv": 8.92833956489536e-09, + "grad_condition": 30339744.194165338, + "lr": 0.0007408768370508575, + "time_sec": 66.76679730415344 + }, + { + "epoch": 52, + "train_loss": 3.329959710845947, + "train_acc": 0.19464, + "test_loss": 7.733986283874512, + "test_acc": 0.02, + "lyapunov": null, + "grad_norm": 0.49662871046839857, + "grad_max_sv": 0.17035150155425072, + "grad_min_sv": 8.920055267341853e-09, + "grad_condition": 39560292.40680326, + "lr": 0.0007316480175599307, + "time_sec": 66.73509478569031 + }, + { + "epoch": 53, + "train_loss": 3.328139169998169, + "train_acc": 0.1964, + "test_loss": 8.010476211547852, + "test_acc": 0.0211, + "lyapunov": null, + "grad_norm": 0.4958475219811756, + "grad_max_sv": 0.17490845173597336, + "grad_min_sv": 8.784460091802727e-09, + "grad_condition": 71860322.54887062, + "lr": 0.0007223175895924635, + "time_sec": 66.72841596603394 + }, + { + "epoch": 54, + "train_loss": 3.3162127281188964, + "train_acc": 0.19728, + "test_loss": 7.010640211486816, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.4961833449463003, + "grad_max_sv": 0.17223588079214097, + "grad_min_sv": 8.753281316442596e-09, + "grad_condition": 22715187.33107339, + "lr": 0.0007128896457825361, + "time_sec": 66.72108912467957 + }, + { + "epoch": 55, + "train_loss": 3.3105887175750732, + "train_acc": 0.1977, + "test_loss": 8.294336575317383, + "test_acc": 0.0177, + "lyapunov": null, + "grad_norm": 0.4959871213831781, + "grad_max_sv": 0.17211879640817643, + "grad_min_sv": 8.85512002890554e-09, + "grad_condition": 22832904.69554911, + "lr": 0.0007033683215378998, + "time_sec": 66.77683353424072 + }, + { + "epoch": 56, + "train_loss": 3.3091206261444093, + "train_acc": 0.19822, + "test_loss": 6.872190827941894, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 0.4968424527269832, + "grad_max_sv": 0.16929374635219574, + "grad_min_sv": 8.852659438840504e-09, + "grad_condition": 21482011.311691545, + "lr": 0.0006937577932260512, + "time_sec": 66.7394802570343 + }, + { + "epoch": 57, + "train_loss": 3.2911807606506347, + "train_acc": 0.20104, + "test_loss": 6.781019482421875, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.49806961864225907, + "grad_max_sv": 0.17269197143614293, + "grad_min_sv": 9.028358619045385e-09, + "grad_condition": 21860182.81813491, + "lr": 0.0006840622763423388, + "time_sec": 66.74213409423828 + }, + { + "epoch": 58, + "train_loss": 3.28923882019043, + "train_acc": 0.2009, + "test_loss": 7.48718016204834, + "test_acc": 0.0233, + "lyapunov": null, + "grad_norm": 0.497037583502488, + "grad_max_sv": 0.17720941305160523, + "grad_min_sv": 8.923951845540844e-09, + "grad_condition": 25638959.340645056, + "lr": 0.0006742860236609073, + "time_sec": 66.70864987373352 + }, + { + "epoch": 59, + "train_loss": 3.288974278411865, + "train_acc": 0.2022, + "test_loss": 6.711775099182129, + "test_acc": 0.0288, + "lyapunov": null, + "grad_norm": 0.5006739014854031, + "grad_max_sv": 0.1799727737903595, + "grad_min_sv": 8.922615390982714e-09, + "grad_condition": 22962596.945499133, + "lr": 0.0006644333233692913, + "time_sec": 66.72898769378662 + }, + { + "epoch": 60, + "train_loss": 3.283515991897583, + "train_acc": 0.20374, + "test_loss": 7.436810195922852, + "test_acc": 0.0217, + "lyapunov": null, + "grad_norm": 0.4970314759637393, + "grad_max_sv": 0.1713873755186796, + "grad_min_sv": 8.852956717708694e-09, + "grad_condition": 21460924.515540235, + "lr": 0.0006545084971874734, + "time_sec": 66.77793312072754 + }, + { + "epoch": 61, + "train_loss": 3.2660218312072753, + "train_acc": 0.2052, + "test_loss": 7.1023060356140135, + "test_acc": 0.0237, + "lyapunov": null, + "grad_norm": 0.49642283106124174, + "grad_max_sv": 0.17171172685921193, + "grad_min_sv": 9.03237155625014e-09, + "grad_condition": 23554914.711565603, + "lr": 0.0006445158984722354, + "time_sec": 66.71418523788452 + }, + { + "epoch": 62, + "train_loss": 3.254552359466553, + "train_acc": 0.2084, + "test_loss": 7.483150309753418, + "test_acc": 0.0225, + "lyapunov": null, + "grad_norm": 0.4960786681631791, + "grad_max_sv": 0.1668458305299282, + "grad_min_sv": 8.818685695577421e-09, + "grad_condition": 74094011.9951904, + "lr": 0.0006344599103076324, + "time_sec": 66.70579290390015 + }, + { + "epoch": 63, + "train_loss": 3.2479764625549317, + "train_acc": 0.20702, + "test_loss": 7.495381002807617, + "test_acc": 0.0243, + "lyapunov": null, + "grad_norm": 0.4917077399114027, + "grad_max_sv": 0.16495948433876037, + "grad_min_sv": 8.864074795694732e-09, + "grad_condition": 30857102.41845674, + "lr": 0.0006243449435824269, + "time_sec": 66.72497200965881 + }, + { + "epoch": 64, + "train_loss": 3.245808661117554, + "train_acc": 0.20704, + "test_loss": 6.5149994140625, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.4942308484852371, + "grad_max_sv": 0.16808778569102287, + "grad_min_sv": 8.905879750331636e-09, + "grad_condition": 21297665.020826895, + "lr": 0.0006141754350553275, + "time_sec": 66.71531987190247 + }, + { + "epoch": 65, + "train_loss": 3.2359812786102293, + "train_acc": 0.20964, + "test_loss": 6.7083621681213375, + "test_acc": 0.0257, + "lyapunov": null, + "grad_norm": 0.4924300564127143, + "grad_max_sv": 0.1668924294412136, + "grad_min_sv": 8.814785660855167e-09, + "grad_condition": 387068362.7974197, + "lr": 0.0006039558454088793, + "time_sec": 66.739919424057 + }, + { + "epoch": 66, + "train_loss": 3.2231747630310057, + "train_acc": 0.21288, + "test_loss": 6.6462861267089846, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.49278283649554394, + "grad_max_sv": 0.16672560423612595, + "grad_min_sv": 8.910612160628607e-09, + "grad_condition": 23460863.699399397, + "lr": 0.000593690657292862, + "time_sec": 66.73168134689331 + }, + { + "epoch": 67, + "train_loss": 3.2156623792266847, + "train_acc": 0.21342, + "test_loss": 7.029375877380371, + "test_acc": 0.0223, + "lyapunov": null, + "grad_norm": 0.4909443834963243, + "grad_max_sv": 0.16597550213336945, + "grad_min_sv": 8.912085689566362e-09, + "grad_condition": 31291994.15683285, + "lr": 0.0005833843733580507, + "time_sec": 66.72268962860107 + }, + { + "epoch": 68, + "train_loss": 3.2102099297332765, + "train_acc": 0.21536, + "test_loss": 6.8582941429138184, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.49321037808878027, + "grad_max_sv": 0.16992229372262954, + "grad_min_sv": 8.80631389199582e-09, + "grad_condition": 129842817.14263825, + "lr": 0.0005730415142812054, + "time_sec": 66.73015308380127 + }, + { + "epoch": 69, + "train_loss": 3.2087192346191404, + "train_acc": 0.21692, + "test_loss": 6.703964881134033, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.4884522648005531, + "grad_max_sv": 0.16176489181816578, + "grad_min_sv": 8.772693779746099e-09, + "grad_condition": 26469955.870484192, + "lr": 0.0005626666167821517, + "time_sec": 66.71746468544006 + }, + { + "epoch": 70, + "train_loss": 3.195241547088623, + "train_acc": 0.21844, + "test_loss": 6.542587074279785, + "test_acc": 0.0284, + "lyapunov": null, + "grad_norm": 0.49091657002079947, + "grad_max_sv": 0.16242207810282708, + "grad_min_sv": 9.02578579792257e-09, + "grad_condition": 23591537.371170804, + "lr": 0.0005522642316338265, + "time_sec": 66.72597932815552 + }, + { + "epoch": 71, + "train_loss": 3.1896180830383303, + "train_acc": 0.21886, + "test_loss": 6.82057219543457, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.4892216781222015, + "grad_max_sv": 0.1621775720268488, + "grad_min_sv": 8.926039651857565e-09, + "grad_condition": 20890687.882442366, + "lr": 0.0005418389216661573, + "time_sec": 66.7145037651062 + }, + { + "epoch": 72, + "train_loss": 3.18413442276001, + "train_acc": 0.21908, + "test_loss": 7.1544591903686525, + "test_acc": 0.0243, + "lyapunov": null, + "grad_norm": 0.48870515357132727, + "grad_max_sv": 0.16475776992738247, + "grad_min_sv": 8.91442188816205e-09, + "grad_condition": 35365218.5794013, + "lr": 0.0005313952597646563, + "time_sec": 66.72212243080139 + }, + { + "epoch": 73, + "train_loss": 3.1829597901153566, + "train_acc": 0.21974, + "test_loss": 7.2174785011291505, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4892142900976219, + "grad_max_sv": 0.16382574513554574, + "grad_min_sv": 8.810792702352264e-09, + "grad_condition": 2088135479.3673325, + "lr": 0.0005209378268645994, + "time_sec": 66.73431754112244 + }, + { + "epoch": 74, + "train_loss": 3.172711128463745, + "train_acc": 0.22268, + "test_loss": 7.406581823730469, + "test_acc": 0.0232, + "lyapunov": null, + "grad_norm": 0.48885933422631656, + "grad_max_sv": 0.1622017789632082, + "grad_min_sv": 8.900176362569568e-09, + "grad_condition": 22065867.848713316, + "lr": 0.0005104712099416781, + "time_sec": 66.76118803024292 + }, + { + "epoch": 75, + "train_loss": 3.1605979063415526, + "train_acc": 0.22268, + "test_loss": 7.909864106750488, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.4864315646638775, + "grad_max_sv": 0.16106058210134505, + "grad_min_sv": 8.83298489941231e-09, + "grad_condition": 46212562.907684386, + "lr": 0.0004999999999999996, + "time_sec": 66.70442318916321 + }, + { + "epoch": 76, + "train_loss": 3.1487682283020018, + "train_acc": 0.22692, + "test_loss": 7.801919015502929, + "test_acc": 0.0215, + "lyapunov": null, + "grad_norm": 0.49432790922941905, + "grad_max_sv": 0.1653361301869154, + "grad_min_sv": 9.004006756851979e-09, + "grad_condition": 21481137.43510855, + "lr": 0.0004895287900583212, + "time_sec": 66.72583270072937 + }, + { + "epoch": 77, + "train_loss": 3.150441154251099, + "train_acc": 0.22298, + "test_loss": 7.5658083923339845, + "test_acc": 0.0206, + "lyapunov": null, + "grad_norm": 0.4905609551233629, + "grad_max_sv": 0.16559089235961438, + "grad_min_sv": 9.02131503666137e-09, + "grad_condition": 20767700.255871035, + "lr": 0.0004790621731353997, + "time_sec": 66.69700527191162 + }, + { + "epoch": 78, + "train_loss": 3.1500933878326416, + "train_acc": 0.22786, + "test_loss": 7.626110935974121, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.4905443897236645, + "grad_max_sv": 0.16319101713597775, + "grad_min_sv": 8.856467318546501e-09, + "grad_condition": 30384641.86177106, + "lr": 0.000468604740235343, + "time_sec": 66.70938420295715 + }, + { + "epoch": 79, + "train_loss": 3.1403994177246095, + "train_acc": 0.22896, + "test_loss": 7.712996089172363, + "test_acc": 0.0224, + "lyapunov": null, + "grad_norm": 0.4915245764953966, + "grad_max_sv": 0.16383215487003328, + "grad_min_sv": 9.000386157198559e-09, + "grad_condition": 24292562.845880195, + "lr": 0.00045816107833384175, + "time_sec": 66.70869493484497 + }, + { + "epoch": 80, + "train_loss": 3.135038282623291, + "train_acc": 0.22664, + "test_loss": 7.267129122161865, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.49111047918715733, + "grad_max_sv": 0.1639216773211956, + "grad_min_sv": 8.921349751783367e-09, + "grad_condition": 420151306.09404176, + "lr": 0.0004477357683661729, + "time_sec": 66.7166097164154 + }, + { + "epoch": 81, + "train_loss": 3.1244947747802736, + "train_acc": 0.22956, + "test_loss": 7.662328411865234, + "test_acc": 0.0247, + "lyapunov": null, + "grad_norm": 0.49289166159918185, + "grad_max_sv": 0.16057575568556787, + "grad_min_sv": 9.007528779803043e-09, + "grad_condition": 25322164.642992593, + "lr": 0.00043733338321784746, + "time_sec": 66.70411825180054 + }, + { + "epoch": 82, + "train_loss": 3.1161900270080567, + "train_acc": 0.23102, + "test_loss": 6.92779616394043, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.49270870414948964, + "grad_max_sv": 0.1599017258733511, + "grad_min_sv": 9.11951086590701e-09, + "grad_condition": 20698906.206454754, + "lr": 0.0004269584857187939, + "time_sec": 66.70752501487732 + }, + { + "epoch": 83, + "train_loss": 3.117374754104614, + "train_acc": 0.23338, + "test_loss": 7.148474893188476, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.4925974195490984, + "grad_max_sv": 0.16150497682392598, + "grad_min_sv": 8.971566273219267e-09, + "grad_condition": 20007661.368726093, + "lr": 0.0004166156266419484, + "time_sec": 66.70796918869019 + }, + { + "epoch": 84, + "train_loss": 3.1047154219055177, + "train_acc": 0.23342, + "test_loss": 7.627574306488037, + "test_acc": 0.0234, + "lyapunov": null, + "grad_norm": 0.4921892080867045, + "grad_max_sv": 0.16364577710628508, + "grad_min_sv": 8.967278117277822e-09, + "grad_condition": 20465428.39487014, + "lr": 0.0004063093427071373, + "time_sec": 66.70926451683044 + }, + { + "epoch": 85, + "train_loss": 3.0953226109313965, + "train_acc": 0.23356, + "test_loss": 7.637861351776123, + "test_acc": 0.0254, + "lyapunov": null, + "grad_norm": 0.49401889904765806, + "grad_max_sv": 0.16418364495038987, + "grad_min_sv": 8.915860015990679e-09, + "grad_condition": 203043858.99741915, + "lr": 0.0003960441545911199, + "time_sec": 66.6929943561554 + }, + { + "epoch": 86, + "train_loss": 3.0932106770324705, + "train_acc": 0.23452, + "test_loss": 7.435467148590088, + "test_acc": 0.0248, + "lyapunov": null, + "grad_norm": 0.4934388084197917, + "grad_max_sv": 0.16211238466203212, + "grad_min_sv": 9.0381108895643e-09, + "grad_condition": 38210459.14289879, + "lr": 0.0003858245649446718, + "time_sec": 66.71461033821106 + }, + { + "epoch": 87, + "train_loss": 3.091542336883545, + "train_acc": 0.23574, + "test_loss": 7.27965379486084, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.49327307505927953, + "grad_max_sv": 0.1624306257814169, + "grad_min_sv": 9.051206378840603e-09, + "grad_condition": 19977131.887911893, + "lr": 0.00037565505641757235, + "time_sec": 66.7017343044281 + }, + { + "epoch": 88, + "train_loss": 3.0846370722961427, + "train_acc": 0.2367, + "test_loss": 7.714011827087402, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.49521950469943726, + "grad_max_sv": 0.16350008510053157, + "grad_min_sv": 9.132233064201855e-09, + "grad_condition": 20496153.697574906, + "lr": 0.00036554008969236695, + "time_sec": 66.80735445022583 + }, + { + "epoch": 89, + "train_loss": 3.067184111480713, + "train_acc": 0.23956, + "test_loss": 7.469543979644776, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.49450885750587337, + "grad_max_sv": 0.16215350292623043, + "grad_min_sv": 9.075074243122815e-09, + "grad_condition": 63145499.63971396, + "lr": 0.0003554841015277638, + "time_sec": 66.7019522190094 + }, + { + "epoch": 90, + "train_loss": 3.0696119786071776, + "train_acc": 0.23776, + "test_loss": 7.227960666656494, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.49496033151417024, + "grad_max_sv": 0.15985839106142521, + "grad_min_sv": 9.114914140302688e-09, + "grad_condition": 88232236.67419389, + "lr": 0.000345491502812526, + "time_sec": 66.71336770057678 + }, + { + "epoch": 91, + "train_loss": 3.0570466086578367, + "train_acc": 0.24112, + "test_loss": 7.087581924438476, + "test_acc": 0.0285, + "lyapunov": null, + "grad_norm": 0.49532470616490887, + "grad_max_sv": 0.16271125935018063, + "grad_min_sv": 9.14848334726548e-09, + "grad_condition": 28858228.725753903, + "lr": 0.0003355666766307081, + "time_sec": 66.71155142784119 + }, + { + "epoch": 92, + "train_loss": 3.060674235687256, + "train_acc": 0.24284, + "test_loss": 7.354493684387207, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.49422169257384346, + "grad_max_sv": 0.16212479658424855, + "grad_min_sv": 9.094859150515777e-09, + "grad_condition": 27013716.07646851, + "lr": 0.00032571397633909225, + "time_sec": 66.73360872268677 + }, + { + "epoch": 93, + "train_loss": 3.045851851577759, + "train_acc": 0.24666, + "test_loss": 6.961697528839111, + "test_acc": 0.0257, + "lyapunov": null, + "grad_norm": 0.4943781413484412, + "grad_max_sv": 0.15829392597079278, + "grad_min_sv": 9.1174124181026e-09, + "grad_condition": 24719922.26471028, + "lr": 0.00031593772365766094, + "time_sec": 66.72647047042847 + }, + { + "epoch": 94, + "train_loss": 3.0384512644958495, + "train_acc": 0.24492, + "test_loss": 7.376283264160156, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.49582915049730736, + "grad_max_sv": 0.1624866124242544, + "grad_min_sv": 9.118276048341972e-09, + "grad_condition": 727643917.2657491, + "lr": 0.0003062422067739483, + "time_sec": 66.70089149475098 + }, + { + "epoch": 95, + "train_loss": 3.039133260345459, + "train_acc": 0.24476, + "test_loss": 7.406265617370606, + "test_acc": 0.0298, + "lyapunov": null, + "grad_norm": 0.4964727526376002, + "grad_max_sv": 0.15984426029026508, + "grad_min_sv": 9.0936182872009e-09, + "grad_condition": 53822276.22529755, + "lr": 0.00029663167846209965, + "time_sec": 66.71791744232178 + }, + { + "epoch": 96, + "train_loss": 3.0375169485473634, + "train_acc": 0.24388, + "test_loss": 7.3450915855407715, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.4980105941759735, + "grad_max_sv": 0.1639113176614046, + "grad_min_sv": 9.174823172204694e-09, + "grad_condition": 75847501.33547327, + "lr": 0.00028711035421746345, + "time_sec": 66.74349761009216 + }, + { + "epoch": 97, + "train_loss": 3.036133956604004, + "train_acc": 0.2481, + "test_loss": 7.577465545654297, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.4958252185119339, + "grad_max_sv": 0.16029710061848162, + "grad_min_sv": 8.978423951533366e-09, + "grad_condition": 19961795.980553128, + "lr": 0.00027768241040753615, + "time_sec": 66.72821807861328 + }, + { + "epoch": 98, + "train_loss": 3.021324711227417, + "train_acc": 0.25076, + "test_loss": 7.219669580841065, + "test_acc": 0.0303, + "lyapunov": null, + "grad_norm": 0.4970296963841891, + "grad_max_sv": 0.16001575216650962, + "grad_min_sv": 9.067042531715752e-09, + "grad_condition": 41223693.265652105, + "lr": 0.00026835198244006903, + "time_sec": 66.74218535423279 + }, + { + "epoch": 99, + "train_loss": 3.0151924266815184, + "train_acc": 0.25042, + "test_loss": 7.808471519470215, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.497912540335549, + "grad_max_sv": 0.1632791668176651, + "grad_min_sv": 9.184349171464934e-09, + "grad_condition": 23400737.365473915, + "lr": 0.0002591231629491421, + "time_sec": 66.70754623413086 + }, + { + "epoch": 100, + "train_loss": 3.0173143773651123, + "train_acc": 0.24922, + "test_loss": 7.265430112457276, + "test_acc": 0.028, + "lyapunov": null, + "grad_norm": 0.49818870466542803, + "grad_max_sv": 0.16289953589439393, + "grad_min_sv": 9.281307221387091e-09, + "grad_condition": 23108793.760435097, + "lr": 0.0002499999999999997, + "time_sec": 66.74620199203491 + }, + { + "epoch": 101, + "train_loss": 3.0063516328430175, + "train_acc": 0.25068, + "test_loss": 7.405182618713379, + "test_acc": 0.0321, + "lyapunov": null, + "grad_norm": 0.4980158759477165, + "grad_max_sv": 0.16276963874697686, + "grad_min_sv": 9.112035989633505e-09, + "grad_condition": 21414811.754604597, + "lr": 0.00024098649531343477, + "time_sec": 66.74015522003174 + }, + { + "epoch": 102, + "train_loss": 3.004280758743286, + "train_acc": 0.25098, + "test_loss": 7.399062448120117, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.500738337792044, + "grad_max_sv": 0.1635062240064144, + "grad_min_sv": 9.288643754157277e-09, + "grad_condition": 21845553.2838238, + "lr": 0.0002320866025105016, + "time_sec": 66.69196605682373 + }, + { + "epoch": 103, + "train_loss": 2.9984512678527833, + "train_acc": 0.2512, + "test_loss": 7.320097260284424, + "test_acc": 0.0284, + "lyapunov": null, + "grad_norm": 0.4980454163272628, + "grad_max_sv": 0.1580117117613554, + "grad_min_sv": 9.07426482149587e-09, + "grad_condition": 30985957.899948187, + "lr": 0.0002233042253783278, + "time_sec": 66.74033546447754 + }, + { + "epoch": 104, + "train_loss": 2.99728506942749, + "train_acc": 0.25086, + "test_loss": 7.463210521697998, + "test_acc": 0.0329, + "lyapunov": null, + "grad_norm": 0.5009998323620124, + "grad_max_sv": 0.16469128727912902, + "grad_min_sv": 9.2030743081839e-09, + "grad_condition": 22045083.846339237, + "lr": 0.000214643216157784, + "time_sec": 66.72671890258789 + }, + { + "epoch": 105, + "train_loss": 2.9898451292419432, + "train_acc": 0.25504, + "test_loss": 7.531641695404053, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.5022636847492568, + "grad_max_sv": 0.16528656147420406, + "grad_min_sv": 9.158518983476415e-09, + "grad_condition": 24732730.3300323, + "lr": 0.00020610737385376332, + "time_sec": 66.72895193099976 + }, + { + "epoch": 106, + "train_loss": 2.984173779754639, + "train_acc": 0.25438, + "test_loss": 7.581431744384766, + "test_acc": 0.0273, + "lyapunov": null, + "grad_norm": 0.5028431980176926, + "grad_max_sv": 0.1630011171102524, + "grad_min_sv": 9.238039688774791e-09, + "grad_condition": 20675234.791328143, + "lr": 0.00019770044256881242, + "time_sec": 66.73670959472656 + }, + { + "epoch": 107, + "train_loss": 2.974853392868042, + "train_acc": 0.25748, + "test_loss": 7.1432702926635745, + "test_acc": 0.0313, + "lyapunov": null, + "grad_norm": 0.49959385619284613, + "grad_max_sv": 0.16204869262874128, + "grad_min_sv": 9.195193381716926e-09, + "grad_condition": 21149671.894155927, + "lr": 0.0001894261098608447, + "time_sec": 66.74563598632812 + }, + { + "epoch": 108, + "train_loss": 2.9721791679382323, + "train_acc": 0.25728, + "test_loss": 7.795809649658203, + "test_acc": 0.0298, + "lyapunov": null, + "grad_norm": 0.4995722502777866, + "grad_max_sv": 0.15964266508817673, + "grad_min_sv": 9.203898770904218e-09, + "grad_condition": 20323974.743836712, + "lr": 0.000181288005125655, + "time_sec": 66.73793625831604 + }, + { + "epoch": 109, + "train_loss": 2.970719254760742, + "train_acc": 0.25944, + "test_loss": 7.365542489624024, + "test_acc": 0.0299, + "lyapunov": null, + "grad_norm": 0.500757198933526, + "grad_max_sv": 0.16609507314860822, + "grad_min_sv": 9.356035884922065e-09, + "grad_condition": 20439457.080971286, + "lr": 0.0001732896980049473, + "time_sec": 66.7298583984375 + }, + { + "epoch": 110, + "train_loss": 2.972525007095337, + "train_acc": 0.25712, + "test_loss": 7.133980830383301, + "test_acc": 0.0312, + "lyapunov": null, + "grad_norm": 0.5042334021436244, + "grad_max_sv": 0.15981336012482644, + "grad_min_sv": 9.288604266299849e-09, + "grad_condition": 21280953.98530178, + "lr": 0.00016543469682057076, + "time_sec": 66.76267719268799 + }, + { + "epoch": 111, + "train_loss": 2.9631910160827637, + "train_acc": 0.25998, + "test_loss": 7.417809590148925, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.5014056320574171, + "grad_max_sv": 0.16821228563785554, + "grad_min_sv": 9.333871581716779e-09, + "grad_condition": 101661462.28679642, + "lr": 0.00015772644703565552, + "time_sec": 66.72111940383911 + }, + { + "epoch": 112, + "train_loss": 2.9575250452423094, + "train_acc": 0.26008, + "test_loss": 7.389129028320313, + "test_acc": 0.0277, + "lyapunov": null, + "grad_norm": 0.5007918938537274, + "grad_max_sv": 0.16079586669802665, + "grad_min_sv": 9.307818968351534e-09, + "grad_condition": 20753238.25422468, + "lr": 0.00015016832974331713, + "time_sec": 66.72973942756653 + }, + { + "epoch": 113, + "train_loss": 2.952999960632324, + "train_acc": 0.26198, + "test_loss": 7.37722262878418, + "test_acc": 0.0287, + "lyapunov": null, + "grad_norm": 0.5013173930748581, + "grad_max_sv": 0.16444203816354275, + "grad_min_sv": 9.318139330971587e-09, + "grad_condition": 26788166.113831718, + "lr": 0.00014276366018359834, + "time_sec": 66.83487486839294 + }, + { + "epoch": 114, + "train_loss": 2.948192635574341, + "train_acc": 0.26038, + "test_loss": 7.436811110687255, + "test_acc": 0.0279, + "lyapunov": null, + "grad_norm": 0.5032371113955786, + "grad_max_sv": 0.1634738527238369, + "grad_min_sv": 9.2874662635219e-09, + "grad_condition": 319138381.19418097, + "lr": 0.00013551568628929425, + "time_sec": 66.70622992515564 + }, + { + "epoch": 115, + "train_loss": 2.9517051191711428, + "train_acc": 0.26036, + "test_loss": 7.19214797668457, + "test_acc": 0.03, + "lyapunov": null, + "grad_norm": 0.5054472421665304, + "grad_max_sv": 0.16728437952697278, + "grad_min_sv": 9.324679213496e-09, + "grad_condition": 26191438.542866766, + "lr": 0.00012842758726130276, + "time_sec": 66.71952223777771 + }, + { + "epoch": 116, + "train_loss": 2.9479563136291502, + "train_acc": 0.25988, + "test_loss": 7.865117324829102, + "test_acc": 0.0272, + "lyapunov": null, + "grad_norm": 0.501425656974135, + "grad_max_sv": 0.16254092417657376, + "grad_min_sv": 9.171186369366646e-09, + "grad_condition": 43416689.99828492, + "lr": 0.0001215024721741218, + "time_sec": 66.74095702171326 + }, + { + "epoch": 117, + "train_loss": 2.9373822256469726, + "train_acc": 0.26326, + "test_loss": 7.544526052856446, + "test_acc": 0.0288, + "lyapunov": null, + "grad_norm": 0.5031467536307935, + "grad_max_sv": 0.16549900099635123, + "grad_min_sv": 9.4188400051598e-09, + "grad_condition": 19833315.44179687, + "lr": 0.00011474337861210538, + "time_sec": 66.72034072875977 + }, + { + "epoch": 118, + "train_loss": 2.9374622593688966, + "train_acc": 0.26362, + "test_loss": 7.940575238037109, + "test_acc": 0.0276, + "lyapunov": null, + "grad_norm": 0.502189701036258, + "grad_max_sv": 0.1663150992244482, + "grad_min_sv": 9.337868267511595e-09, + "grad_condition": 22055002.57718137, + "lr": 0.00010815327133708009, + "time_sec": 66.71819615364075 + }, + { + "epoch": 119, + "train_loss": 2.9290069982910154, + "train_acc": 0.26682, + "test_loss": 8.381109976196289, + "test_acc": 0.0245, + "lyapunov": null, + "grad_norm": 0.5022580399945052, + "grad_max_sv": 0.16189948543906213, + "grad_min_sv": 9.334797540505591e-09, + "grad_condition": 53795996.97598307, + "lr": 0.00010173504098790182, + "time_sec": 66.73639011383057 + }, + { + "epoch": 120, + "train_loss": 2.927497018890381, + "train_acc": 0.26494, + "test_loss": 8.134235343933106, + "test_acc": 0.0268, + "lyapunov": null, + "grad_norm": 0.5044191934677914, + "grad_max_sv": 0.1647841826081276, + "grad_min_sv": 9.31749464250231e-09, + "grad_condition": 21075801.592136864, + "lr": 9.549150281252629e-05, + "time_sec": 66.71619915962219 + }, + { + "epoch": 121, + "train_loss": 2.9210917962646485, + "train_acc": 0.2676, + "test_loss": 7.665898156738281, + "test_acc": 0.0284, + "lyapunov": null, + "grad_norm": 0.505046124945648, + "grad_max_sv": 0.16069133542478084, + "grad_min_sv": 9.383237816254498e-09, + "grad_condition": 53773449.70699586, + "lr": 8.942539543314794e-05, + "time_sec": 66.7949550151825 + }, + { + "epoch": 122, + "train_loss": 2.9300759950256348, + "train_acc": 0.26686, + "test_loss": 7.947439320373535, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5039924043792687, + "grad_max_sv": 0.16329768523573876, + "grad_min_sv": 9.309516596847645e-09, + "grad_condition": 105483269.53547074, + "lr": 8.353937964495024e-05, + "time_sec": 66.70848250389099 + }, + { + "epoch": 123, + "train_loss": 2.91971375289917, + "train_acc": 0.26734, + "test_loss": 7.80317967376709, + "test_acc": 0.0286, + "lyapunov": null, + "grad_norm": 0.5061715705620777, + "grad_max_sv": 0.16143706440925598, + "grad_min_sv": 9.3223205665377e-09, + "grad_condition": 44714095.26064149, + "lr": 7.783603724899243e-05, + "time_sec": 66.75235438346863 + }, + { + "epoch": 124, + "train_loss": 2.920988783569336, + "train_acc": 0.2672, + "test_loss": 7.688530905151367, + "test_acc": 0.0267, + "lyapunov": null, + "grad_norm": 0.5036561383144873, + "grad_max_sv": 0.16541591919958593, + "grad_min_sv": 9.339689868714807e-09, + "grad_condition": 21082674.48603835, + "lr": 7.231786991974666e-05, + "time_sec": 66.7428572177887 + }, + { + "epoch": 125, + "train_loss": 2.9158429930877685, + "train_acc": 0.26972, + "test_loss": 7.870475231933594, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.5050163715028828, + "grad_max_sv": 0.16450283974409102, + "grad_min_sv": 9.300618648844239e-09, + "grad_condition": 22745467.54728716, + "lr": 6.698729810778072e-05, + "time_sec": 66.70153951644897 + }, + { + "epoch": 126, + "train_loss": 2.9174345250701905, + "train_acc": 0.26804, + "test_loss": 7.7597047775268555, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5054786147107485, + "grad_max_sv": 0.16298311799764634, + "grad_min_sv": 9.272562198105183e-09, + "grad_condition": 355815933.8318427, + "lr": 6.184665997806817e-05, + "time_sec": 66.70234727859497 + }, + { + "epoch": 127, + "train_loss": 2.9025824697875975, + "train_acc": 0.26988, + "test_loss": 7.446964788818359, + "test_acc": 0.0276, + "lyapunov": null, + "grad_norm": 0.5066198768830174, + "grad_max_sv": 0.1645387414842844, + "grad_min_sv": 9.428870359484698e-09, + "grad_condition": 20208395.537682876, + "lr": 5.6898210384392595e-05, + "time_sec": 66.714515209198 + }, + { + "epoch": 128, + "train_loss": 2.915607092437744, + "train_acc": 0.26734, + "test_loss": 7.931312725830078, + "test_acc": 0.0244, + "lyapunov": null, + "grad_norm": 0.5071889354627791, + "grad_max_sv": 0.16293769851326942, + "grad_min_sv": 9.389047653241001e-09, + "grad_condition": 19442274.807418514, + "lr": 5.214411988029363e-05, + "time_sec": 66.77645683288574 + }, + { + "epoch": 129, + "train_loss": 2.9043918053436277, + "train_acc": 0.27058, + "test_loss": 7.705898820495605, + "test_acc": 0.0294, + "lyapunov": null, + "grad_norm": 0.5061548650342338, + "grad_max_sv": 0.1668264877051115, + "grad_min_sv": 9.293020419853803e-09, + "grad_condition": 22634656.7147369, + "lr": 4.7586473766990294e-05, + "time_sec": 66.68853044509888 + }, + { + "epoch": 130, + "train_loss": 2.9112479612731934, + "train_acc": 0.2704, + "test_loss": 7.656457232666016, + "test_acc": 0.0278, + "lyapunov": null, + "grad_norm": 0.5055330426804672, + "grad_max_sv": 0.162294964119792, + "grad_min_sv": 9.291567426572556e-09, + "grad_condition": 22558154.425069276, + "lr": 4.32272711786996e-05, + "time_sec": 66.69644737243652 + }, + { + "epoch": 131, + "train_loss": 2.9026712393951417, + "train_acc": 0.26934, + "test_loss": 7.7139065521240235, + "test_acc": 0.0274, + "lyapunov": null, + "grad_norm": 0.5078534676699445, + "grad_max_sv": 0.16336566992104054, + "grad_min_sv": 9.403588141498886e-09, + "grad_condition": 20579658.983666856, + "lr": 3.906842420574966e-05, + "time_sec": 66.69969606399536 + }, + { + "epoch": 132, + "train_loss": 2.8976589154815673, + "train_acc": 0.27122, + "test_loss": 7.718105026245118, + "test_acc": 0.026, + "lyapunov": null, + "grad_norm": 0.5077215533015317, + "grad_max_sv": 0.16301583163440228, + "grad_min_sv": 9.312006112038862e-09, + "grad_condition": 27087738.24954634, + "lr": 3.5111757055874305e-05, + "time_sec": 66.74734258651733 + }, + { + "epoch": 133, + "train_loss": 2.9053258415222167, + "train_acc": 0.26974, + "test_loss": 7.773404074859619, + "test_acc": 0.029, + "lyapunov": null, + "grad_norm": 0.5077078460971154, + "grad_max_sv": 0.16176522485911846, + "grad_min_sv": 9.38179235271397e-09, + "grad_condition": 22801102.593637146, + "lr": 3.1359005254054254e-05, + "time_sec": 66.71020007133484 + }, + { + "epoch": 134, + "train_loss": 2.90214939994812, + "train_acc": 0.2685, + "test_loss": 7.735068745422363, + "test_acc": 0.0283, + "lyapunov": null, + "grad_norm": 0.5056827916750407, + "grad_max_sv": 0.16394426934421064, + "grad_min_sv": 9.382484492375525e-09, + "grad_condition": 273849135.71961355, + "lr": 2.7811814881259484e-05, + "time_sec": 66.72329211235046 + }, + { + "epoch": 135, + "train_loss": 2.8955694792175293, + "train_acc": 0.27204, + "test_loss": 8.074042736816406, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.5072891279476816, + "grad_max_sv": 0.1647134818136692, + "grad_min_sv": 9.274373982681716e-09, + "grad_condition": 20878941.234711803, + "lr": 2.4471741852423218e-05, + "time_sec": 66.69911003112793 + }, + { + "epoch": 136, + "train_loss": 2.901527007369995, + "train_acc": 0.272, + "test_loss": 7.88837564239502, + "test_acc": 0.0256, + "lyapunov": null, + "grad_norm": 0.5069997382716037, + "grad_max_sv": 0.16248776540160179, + "grad_min_sv": 9.28558460677742e-09, + "grad_condition": 26142069.423716225, + "lr": 2.1340251233966362e-05, + "time_sec": 66.73573279380798 + }, + { + "epoch": 137, + "train_loss": 2.8907382415008547, + "train_acc": 0.2728, + "test_loss": 8.04134146270752, + "test_acc": 0.0266, + "lyapunov": null, + "grad_norm": 0.506922138474151, + "grad_max_sv": 0.16456650160253047, + "grad_min_sv": 9.394744830693025e-09, + "grad_condition": 22952282.106423754, + "lr": 1.8418716601170932e-05, + "time_sec": 66.72893476486206 + }, + { + "epoch": 138, + "train_loss": 2.8925764886474608, + "train_acc": 0.27096, + "test_loss": 7.848298292541504, + "test_acc": 0.0281, + "lyapunov": null, + "grad_norm": 0.5070877996969257, + "grad_max_sv": 0.16335688717663288, + "grad_min_sv": 9.458600758183167e-09, + "grad_condition": 21212816.652376812, + "lr": 1.570841943568445e-05, + "time_sec": 66.69498014450073 + }, + { + "epoch": 139, + "train_loss": 2.8905470305633547, + "train_acc": 0.2723, + "test_loss": 7.805370147705078, + "test_acc": 0.0276, + "lyapunov": null, + "grad_norm": 0.5091697345599102, + "grad_max_sv": 0.16748546734452247, + "grad_min_sv": 9.554275959278158e-09, + "grad_condition": 21817543.256782603, + "lr": 1.3210548563419845e-05, + "time_sec": 66.69882249832153 + }, + { + "epoch": 140, + "train_loss": 2.8900568451690676, + "train_acc": 0.2725, + "test_loss": 8.150068646240234, + "test_acc": 0.0263, + "lyapunov": null, + "grad_norm": 0.5094580986389692, + "grad_max_sv": 0.16614943966269494, + "grad_min_sv": 9.441066034510115e-09, + "grad_condition": 25708375.318254933, + "lr": 1.0926199633097203e-05, + "time_sec": 66.72957038879395 + }, + { + "epoch": 141, + "train_loss": 2.8928156049346923, + "train_acc": 0.27302, + "test_loss": 7.946534848022461, + "test_acc": 0.0271, + "lyapunov": null, + "grad_norm": 0.5089732688724395, + "grad_max_sv": 0.1660338044166565, + "grad_min_sv": 9.440311787671519e-09, + "grad_condition": 79734166.44560626, + "lr": 8.856374635655688e-06, + "time_sec": 66.7075400352478 + }, + { + "epoch": 142, + "train_loss": 2.88548219871521, + "train_acc": 0.27172, + "test_loss": 8.169772109985352, + "test_acc": 0.0265, + "lyapunov": null, + "grad_norm": 0.5086553359451463, + "grad_max_sv": 0.16840459816157818, + "grad_min_sv": 9.377848261826749e-09, + "grad_condition": 22023976.535071947, + "lr": 7.001981464747503e-06, + "time_sec": 66.71758651733398 + }, + { + "epoch": 143, + "train_loss": 2.89183920753479, + "train_acc": 0.27372, + "test_loss": 7.852110308837891, + "test_acc": 0.0275, + "lyapunov": null, + "grad_norm": 0.5094733139547303, + "grad_max_sv": 0.16687579974532127, + "grad_min_sv": 9.444928218693693e-09, + "grad_condition": 24477411.004352577, + "lr": 5.3638335185058295e-06, + "time_sec": 66.72722506523132 + }, + { + "epoch": 144, + "train_loss": 2.8904072105407717, + "train_acc": 0.27378, + "test_loss": 8.066141241455078, + "test_acc": 0.0255, + "lyapunov": null, + "grad_norm": 0.5089427679493953, + "grad_max_sv": 0.1690099250525236, + "grad_min_sv": 9.382681727398978e-09, + "grad_condition": 24070995.123834018, + "lr": 3.942649342761114e-06, + "time_sec": 66.73601293563843 + }, + { + "epoch": 145, + "train_loss": 2.8936181242370607, + "train_acc": 0.27214, + "test_loss": 8.10545317993164, + "test_acc": 0.0258, + "lyapunov": null, + "grad_norm": 0.507865092838002, + "grad_max_sv": 0.1655246399343014, + "grad_min_sv": 9.371320355833212e-09, + "grad_condition": 20893591.384689607, + "lr": 2.7390523158633524e-06, + "time_sec": 66.70678782463074 + }, + { + "epoch": 146, + "train_loss": 2.894159292755127, + "train_acc": 0.27236, + "test_loss": 7.739997250366211, + "test_acc": 0.0282, + "lyapunov": null, + "grad_norm": 0.5079666742519956, + "grad_max_sv": 0.16401765793561934, + "grad_min_sv": 9.365164058139363e-09, + "grad_condition": 30379279.137967873, + "lr": 1.7535703752478133e-06, + "time_sec": 66.73851418495178 + }, + { + "epoch": 147, + "train_loss": 2.892810397796631, + "train_acc": 0.27236, + "test_loss": 8.097870037841798, + "test_acc": 0.0261, + "lyapunov": null, + "grad_norm": 0.5083955380496783, + "grad_max_sv": 0.16239417865872383, + "grad_min_sv": 9.437153494773476e-09, + "grad_condition": 22581567.79918761, + "lr": 9.866357858642196e-07, + "time_sec": 66.69952964782715 + }, + { + "epoch": 148, + "train_loss": 2.8858398888397216, + "train_acc": 0.27292, + "test_loss": 7.955520216369629, + "test_acc": 0.0253, + "lyapunov": null, + "grad_norm": 0.5081646285749641, + "grad_max_sv": 0.1665601458400488, + "grad_min_sv": 9.4039764724082e-09, + "grad_condition": 2788122152.665894, + "lr": 4.38584950570808e-07, + "time_sec": 66.72941470146179 + }, + { + "epoch": 149, + "train_loss": 2.8937516955566407, + "train_acc": 0.27344, + "test_loss": 8.195967932128907, + "test_acc": 0.0259, + "lyapunov": null, + "grad_norm": 0.5088598826502255, + "grad_max_sv": 0.16467942893505097, + "grad_min_sv": 9.292379346548252e-09, + "grad_condition": 20098211.57433509, + "lr": 1.096582625772501e-07, + "time_sec": 66.7379686832428 + }, + { + "epoch": 150, + "train_loss": 2.8891425512695315, + "train_acc": 0.27354, + "test_loss": 8.199688424682618, + "test_acc": 0.0264, + "lyapunov": null, + "grad_norm": 0.5085081625178647, + "grad_max_sv": 0.17037647701799868, + "grad_min_sv": 9.396511368997551e-09, + "grad_condition": 30341616.600583784, + "lr": 0.0, + "time_sec": 66.7265522480011 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 4.600389208526611, + "train_acc": 0.07146, + "test_loss": 4.086850812530518, + "test_acc": 0.089, + "lyapunov": 2.088574398813955, + "grad_norm": 5.951641147060766, + "grad_max_sv": 4.604718941450119, + "grad_min_sv": 1.0862287848634189e-07, + "grad_condition": 102934308.40827194, + "lr": 0.0009998903417374227, + "time_sec": 41.90148162841797 + }, + { + "epoch": 2, + "train_loss": 4.154245112686157, + "train_acc": 0.09378, + "test_loss": 4.727289266204834, + "test_acc": 0.049, + "lyapunov": 1.675386021509195, + "grad_norm": 3.9336812922654714, + "grad_max_sv": 2.925524663925171, + "grad_min_sv": 7.262743817529338e-08, + "grad_condition": 424809238.9666936, + "lr": 0.0009995614150494292, + "time_sec": 41.78368663787842 + }, + { + "epoch": 3, + "train_loss": 4.027823886566162, + "train_acc": 0.1086, + "test_loss": 5.036119989776611, + "test_acc": 0.0347, + "lyapunov": 1.6001547501825006, + "grad_norm": 3.0745862198210694, + "grad_max_sv": 2.1295204132795336, + "grad_min_sv": 5.70765142704488e-08, + "grad_condition": 40571486.668118164, + "lr": 0.0009990133642141358, + "time_sec": 41.703768253326416 + }, + { + "epoch": 4, + "train_loss": 3.9490097280883787, + "train_acc": 0.1205, + "test_loss": 6.33214266204834, + "test_acc": 0.0188, + "lyapunov": 1.5750604392317555, + "grad_norm": 2.373335141934517, + "grad_max_sv": 1.5385636299848557, + "grad_min_sv": 4.3810931549259635e-08, + "grad_condition": 41690835.43861919, + "lr": 0.0009982464296247522, + "time_sec": 41.732722997665405 + }, + { + "epoch": 5, + "train_loss": 3.9766585917663573, + "train_acc": 0.11954, + "test_loss": 8.71332287902832, + "test_acc": 0.0188, + "lyapunov": 1.565549552593085, + "grad_norm": 2.0246690982621796, + "grad_max_sv": 1.2804439306259154, + "grad_min_sv": 3.6991484700377165e-08, + "grad_condition": 85372782.32745245, + "lr": 0.0009972609476841367, + "time_sec": 41.76529860496521 + }, + { + "epoch": 6, + "train_loss": 4.073858399047851, + "train_acc": 0.11056, + "test_loss": 9.466819995117188, + "test_acc": 0.0223, + "lyapunov": 1.5455034062685564, + "grad_norm": 1.7934086339665274, + "grad_max_sv": 1.104438428580761, + "grad_min_sv": 3.247254408700328e-08, + "grad_condition": 45291989.58759006, + "lr": 0.000996057350657239, + "time_sec": 41.74420213699341 + }, + { + "epoch": 7, + "train_loss": 4.1445047888183595, + "train_acc": 0.10608, + "test_loss": 10.480993731689454, + "test_acc": 0.0156, + "lyapunov": 1.5415380177900309, + "grad_norm": 1.5679408505934445, + "grad_max_sv": 0.9464981764554977, + "grad_min_sv": 2.8262019316493968e-08, + "grad_condition": 54295754.70226411, + "lr": 0.000994636166481494, + "time_sec": 41.73182463645935 + }, + { + "epoch": 8, + "train_loss": 4.26063258026123, + "train_acc": 0.09112, + "test_loss": 7.7578563934326175, + "test_acc": 0.0186, + "lyapunov": 1.5429353631670824, + "grad_norm": 1.3464117763442929, + "grad_max_sv": 0.7779564633965492, + "grad_min_sv": 2.375586672376251e-08, + "grad_condition": 62692972.26952485, + "lr": 0.0009929980185352525, + "time_sec": 41.739473819732666 + }, + { + "epoch": 9, + "train_loss": 4.513377053375244, + "train_acc": 0.05922, + "test_loss": 7.138281170654297, + "test_acc": 0.011, + "lyapunov": 1.5319068190996603, + "grad_norm": 1.139364674598679, + "grad_max_sv": 0.6511225394904614, + "grad_min_sv": 1.8816128205534354e-08, + "grad_condition": 44484041.03115648, + "lr": 0.0009911436253643444, + "time_sec": 41.73070311546326 + }, + { + "epoch": 10, + "train_loss": 4.696486204833985, + "train_acc": 0.03644, + "test_loss": 8.94805923461914, + "test_acc": 0.01, + "lyapunov": 1.4879300298593234, + "grad_norm": 0.9658719057515597, + "grad_max_sv": 0.6352818965911865, + "grad_min_sv": 1.4476460679876436e-08, + "grad_condition": 2057995491.241798, + "lr": 0.0009890738003669028, + "time_sec": 41.76564049720764 + }, + { + "epoch": 11, + "train_loss": 4.811119628295899, + "train_acc": 0.03002, + "test_loss": 8.594207092285156, + "test_acc": 0.01, + "lyapunov": 1.545145396381388, + "grad_norm": 0.9564458204494278, + "grad_max_sv": 0.6685591802001, + "grad_min_sv": 1.3870340914018398e-08, + "grad_condition": 146809154.0196677, + "lr": 0.00098678945143658, + "time_sec": 41.74543738365173 + }, + { + "epoch": 12, + "train_loss": 4.975349290466308, + "train_acc": 0.01658, + "test_loss": 8.6747091796875, + "test_acc": 0.0114, + "lyapunov": 1.4708023967645358, + "grad_norm": 0.7817948112887597, + "grad_max_sv": 0.603185323625803, + "grad_min_sv": 9.743947088081129e-09, + "grad_condition": 67868723.94202444, + "lr": 0.0009842915805643154, + "time_sec": 41.7559871673584 + }, + { + "epoch": 13, + "train_loss": 5.0296261746215825, + "train_acc": 0.01604, + "test_loss": 11.79697481994629, + "test_acc": 0.01, + "lyapunov": 1.5253148819784375, + "grad_norm": 0.5736780904158933, + "grad_max_sv": 0.42879281714558604, + "grad_min_sv": 6.762437510681764e-09, + "grad_condition": 1079134295.4881654, + "lr": 0.000981581283398829, + "time_sec": 41.76394009590149 + }, + { + "epoch": 14, + "train_loss": 5.057629988555909, + "train_acc": 0.00992, + "test_loss": 8.410659944152831, + "test_acc": 0.01, + "lyapunov": 1.4446861634169088, + "grad_norm": 0.39926683732439516, + "grad_max_sv": 0.33072102442383766, + "grad_min_sv": 4.070671115463664e-09, + "grad_condition": 171229170.03266063, + "lr": 0.0009786597487660333, + "time_sec": 41.78986120223999 + }, + { + "epoch": 15, + "train_loss": 5.068990168609619, + "train_acc": 0.01004, + "test_loss": 8.000550273132324, + "test_acc": 0.01, + "lyapunov": 1.4198117143357807, + "grad_norm": 0.31403539953973636, + "grad_max_sv": 0.261398883163929, + "grad_min_sv": 2.518455900589597e-09, + "grad_condition": 1889483827.2041466, + "lr": 0.0009755282581475766, + "time_sec": 41.803417682647705 + }, + { + "epoch": 16, + "train_loss": 5.098585692901612, + "train_acc": 0.00948, + "test_loss": 8.965616151428222, + "test_acc": 0.01, + "lyapunov": 1.4220252604130894, + "grad_norm": 0.2674000226215519, + "grad_max_sv": 0.2171985387802124, + "grad_min_sv": 6.561514876139448e-10, + "grad_condition": 51847368847.70773, + "lr": 0.0009721881851187403, + "time_sec": 41.763081789016724 + }, + { + "epoch": 17, + "train_loss": 5.128935182189942, + "train_acc": 0.0104, + "test_loss": 7.713327481842041, + "test_acc": 0.01, + "lyapunov": 1.4243087640503789, + "grad_norm": 0.2268635753508302, + "grad_max_sv": 0.17724891044199467, + "grad_min_sv": 1.1410712791450972e-12, + "grad_condition": 106447262687.9498, + "lr": 0.0009686409947459456, + "time_sec": 41.777748823165894 + }, + { + "epoch": 18, + "train_loss": 5.169684513702393, + "train_acc": 0.00924, + "test_loss": 9.309846389770508, + "test_acc": 0.01, + "lyapunov": 1.4357064035542482, + "grad_norm": 0.2142537464973637, + "grad_max_sv": 0.1502558846026659, + "grad_min_sv": 4.244580750085834e-13, + "grad_condition": 128309590371.45757, + "lr": 0.0009648882429441254, + "time_sec": 41.78967308998108 + }, + { + "epoch": 19, + "train_loss": 5.18758517288208, + "train_acc": 0.01042, + "test_loss": 9.819900524902344, + "test_acc": 0.01, + "lyapunov": 1.4233030394824875, + "grad_norm": 0.1952009554667118, + "grad_max_sv": 0.14073190968483687, + "grad_min_sv": 2.6230090465217223e-13, + "grad_condition": 123371153139.15, + "lr": 0.00096093157579425, + "time_sec": 41.77319002151489 + }, + { + "epoch": 20, + "train_loss": 5.217939367370605, + "train_acc": 0.00912, + "test_loss": 9.18544906463623, + "test_acc": 0.01, + "lyapunov": 1.4247246755053624, + "grad_norm": 0.15876002882735193, + "grad_max_sv": 0.10825764928013086, + "grad_min_sv": 3.338896381884262e-15, + "grad_condition": 107875834900.70416, + "lr": 0.0009567727288213001, + "time_sec": 41.805402517318726 + }, + { + "epoch": 21, + "train_loss": 5.2237202166748045, + "train_acc": 0.00884, + "test_loss": 7.853615603637695, + "test_acc": 0.01, + "lyapunov": 1.4316062283942768, + "grad_norm": 0.16150401588518373, + "grad_max_sv": 0.09900619480758906, + "grad_min_sv": 6.6800742534662695e-15, + "grad_condition": 98362933683.42502, + "lr": 0.0009524135262330095, + "time_sec": 41.81541037559509 + }, + { + "epoch": 22, + "train_loss": 5.223462156219482, + "train_acc": 0.00896, + "test_loss": 7.39350982055664, + "test_acc": 0.01, + "lyapunov": 1.4326209281106739, + "grad_norm": 0.1473213530853359, + "grad_max_sv": 0.07929724231362342, + "grad_min_sv": 1.359730040562078e-16, + "grad_condition": 79286860137.91084, + "lr": 0.0009478558801197061, + "time_sec": 41.77298974990845 + }, + { + "epoch": 23, + "train_loss": 5.2433684585571285, + "train_acc": 0.0104, + "test_loss": 7.137277140808106, + "test_acc": 0.01, + "lyapunov": 1.4520324453368516, + "grad_norm": 0.1808576226701931, + "grad_max_sv": 0.0958871865645051, + "grad_min_sv": 8.016626722354409e-12, + "grad_condition": 91441708516.60077, + "lr": 0.000943101789615607, + "time_sec": 41.78183579444885 + }, + { + "epoch": 24, + "train_loss": 5.227817250061035, + "train_acc": 0.01018, + "test_loss": 6.776467510986328, + "test_acc": 0.01, + "lyapunov": 1.4379125001180508, + "grad_norm": 0.12771270098590454, + "grad_max_sv": 0.06905819587409497, + "grad_min_sv": 2.599435841374051e-17, + "grad_condition": 69055853998.34868, + "lr": 0.0009381533400219313, + "time_sec": 41.771769285202026 + }, + { + "epoch": 25, + "train_loss": 5.245168194122314, + "train_acc": 0.0099, + "test_loss": 6.430454106140137, + "test_acc": 0.01, + "lyapunov": 1.4564172242913405, + "grad_norm": 0.12472749302013317, + "grad_max_sv": 0.05845061130821705, + "grad_min_sv": 1.194259418817754e-40, + "grad_condition": 58450611308.21704, + "lr": 0.0009330127018922189, + "time_sec": 41.770474433898926 + }, + { + "epoch": 26, + "train_loss": 5.246722939758301, + "train_acc": 0.00928, + "test_loss": 6.331733448791504, + "test_acc": 0.01, + "lyapunov": 1.4580842101055642, + "grad_norm": 0.1662077239803915, + "grad_max_sv": 0.06711247004568577, + "grad_min_sv": 3.516773949087515e-14, + "grad_condition": 65770012096.831566, + "lr": 0.000927682130080253, + "time_sec": 41.73953866958618 + }, + { + "epoch": 27, + "train_loss": 5.241074298706055, + "train_acc": 0.00908, + "test_loss": 5.877811084747314, + "test_acc": 0.01, + "lyapunov": 1.4511035900286702, + "grad_norm": 0.11653593515355255, + "grad_max_sv": 0.057695817202329636, + "grad_min_sv": 2.245335846475005e-19, + "grad_condition": 57695796508.56338, + "lr": 0.0009221639627510072, + "time_sec": 41.77058434486389 + }, + { + "epoch": 28, + "train_loss": 5.231804114685058, + "train_acc": 0.00918, + "test_loss": 5.65352537612915, + "test_acc": 0.01, + "lyapunov": 1.4424795046486818, + "grad_norm": 0.11846210716711081, + "grad_max_sv": 0.05332653652876616, + "grad_min_sv": 1.997381835377637e-16, + "grad_condition": 53305647188.1228, + "lr": 0.0009164606203550494, + "time_sec": 41.764750957489014 + }, + { + "epoch": 29, + "train_loss": 5.262847916870117, + "train_acc": 0.01024, + "test_loss": 6.106614427185058, + "test_acc": 0.01, + "lyapunov": 1.4771753000786236, + "grad_norm": 0.12029871369481651, + "grad_max_sv": 0.04656773656606674, + "grad_min_sv": 3.853570776893247e-46, + "grad_condition": 46567736566.06674, + "lr": 0.0009105746045668516, + "time_sec": 41.72984552383423 + }, + { + "epoch": 30, + "train_loss": 5.23929132598877, + "train_acc": 0.00934, + "test_loss": 5.9899550048828125, + "test_acc": 0.01, + "lyapunov": 1.4511136694637405, + "grad_norm": 0.11304905556902457, + "grad_max_sv": 0.047783416556194426, + "grad_min_sv": 9.917357230877788e-21, + "grad_condition": 47783415656.63218, + "lr": 0.0009045084971874733, + "time_sec": 41.7406222820282 + }, + { + "epoch": 31, + "train_loss": 5.248380351104736, + "train_acc": 0.01028, + "test_loss": 5.734669494628906, + "test_acc": 0.01, + "lyapunov": 1.461517483986857, + "grad_norm": 0.10074340116724037, + "grad_max_sv": 0.034037844324484465, + "grad_min_sv": 0.0, + "grad_condition": 34037844324.484474, + "lr": 0.0008982649590120977, + "time_sec": 41.74093008041382 + }, + { + "epoch": 32, + "train_loss": 5.236619085388184, + "train_acc": 0.00984, + "test_loss": 5.793693973541259, + "test_acc": 0.01, + "lyapunov": 1.4490889871821684, + "grad_norm": 0.10695665831734988, + "grad_max_sv": 0.04561040163971484, + "grad_min_sv": 0.0, + "grad_condition": 45610401639.71483, + "lr": 0.0008918467286629196, + "time_sec": 41.984901666641235 + }, + { + "epoch": 33, + "train_loss": 5.23296120513916, + "train_acc": 0.00958, + "test_loss": 5.439259308624267, + "test_acc": 0.01, + "lyapunov": 1.444964089661913, + "grad_norm": 0.10554551126822227, + "grad_max_sv": 0.042046601651236415, + "grad_min_sv": 0.0, + "grad_condition": 42046601651.23641, + "lr": 0.0008852566213878943, + "time_sec": 41.770121335983276 + }, + { + "epoch": 34, + "train_loss": 5.236159170837403, + "train_acc": 0.00974, + "test_loss": 5.683465595245361, + "test_acc": 0.01, + "lyapunov": 1.44912754269817, + "grad_norm": 0.10158597595404413, + "grad_max_sv": 0.0364499366376549, + "grad_min_sv": 0.0, + "grad_condition": 36449936637.6549, + "lr": 0.000878497527825878, + "time_sec": 41.73541307449341 + }, + { + "epoch": 35, + "train_loss": 5.244431438751221, + "train_acc": 0.00982, + "test_loss": 5.822091407775879, + "test_acc": 0.01, + "lyapunov": 1.4579007311550247, + "grad_norm": 0.10227185751901953, + "grad_max_sv": 0.04079357534646988, + "grad_min_sv": 0.0, + "grad_condition": 40793575346.46987, + "lr": 0.000871572412738697, + "time_sec": 41.72771143913269 + }, + { + "epoch": 36, + "train_loss": 5.242595237579346, + "train_acc": 0.00948, + "test_loss": 5.712351992797852, + "test_acc": 0.01, + "lyapunov": 1.4565396217433997, + "grad_norm": 0.09594442137602498, + "grad_max_sv": 0.023863840941339733, + "grad_min_sv": 0.0, + "grad_condition": 23863840941.33973, + "lr": 0.0008644843137107055, + "time_sec": 41.679956674575806 + }, + { + "epoch": 37, + "train_loss": 5.25272214477539, + "train_acc": 0.00774, + "test_loss": 5.519532617950439, + "test_acc": 0.01, + "lyapunov": 1.4673221968019101, + "grad_norm": 0.09989553017175994, + "grad_max_sv": 0.01326487297192216, + "grad_min_sv": 0.0, + "grad_condition": 13264872971.922161, + "lr": 0.0008572363398164014, + "time_sec": 41.665099143981934 + }, + { + "epoch": 38, + "train_loss": 5.239593379211426, + "train_acc": 0.00894, + "test_loss": 5.685215021514892, + "test_acc": 0.01, + "lyapunov": 1.4529655787646008, + "grad_norm": 0.09888602041808069, + "grad_max_sv": 0.03386777136474848, + "grad_min_sv": 0.0, + "grad_condition": 33867771364.748474, + "lr": 0.0008498316702566826, + "time_sec": 41.71084642410278 + }, + { + "epoch": 39, + "train_loss": 5.24351258758545, + "train_acc": 0.00926, + "test_loss": 5.718768641662598, + "test_acc": 0.01, + "lyapunov": 1.4566386227717485, + "grad_norm": 0.10344101016289994, + "grad_max_sv": 0.04082807558588684, + "grad_min_sv": 0.0, + "grad_condition": 40828075585.886826, + "lr": 0.0008422735529643442, + "time_sec": 41.73838138580322 + }, + { + "epoch": 40, + "train_loss": 5.241183159027099, + "train_acc": 0.00956, + "test_loss": 5.497510899353028, + "test_acc": 0.01, + "lyapunov": 1.4553583491488795, + "grad_norm": 0.09390993405990472, + "grad_max_sv": 0.015733347134664656, + "grad_min_sv": 0.0, + "grad_condition": 15733347134.664654, + "lr": 0.0008345653031794289, + "time_sec": 41.734697580337524 + }, + { + "epoch": 41, + "train_loss": 5.242352604675293, + "train_acc": 0.00974, + "test_loss": 5.167651419830322, + "test_acc": 0.01, + "lyapunov": 1.454840253076285, + "grad_norm": 0.11429776991375327, + "grad_max_sv": 0.05544604551978409, + "grad_min_sv": 2.0339863136307694e-16, + "grad_condition": 55425910698.75984, + "lr": 0.0008267103019950526, + "time_sec": 41.75088906288147 + }, + { + "epoch": 42, + "train_loss": 5.242215647735596, + "train_acc": 0.00988, + "test_loss": 5.260814582824707, + "test_acc": 0.01, + "lyapunov": 1.4554345080309816, + "grad_norm": 0.10783002802519942, + "grad_max_sv": 0.04959035101346672, + "grad_min_sv": 4.912822630335892e-20, + "grad_condition": 49590347491.3975, + "lr": 0.0008187119948743447, + "time_sec": 41.73639273643494 + }, + { + "epoch": 43, + "train_loss": 5.244567107543945, + "train_acc": 0.01008, + "test_loss": 4.993986747741699, + "test_acc": 0.01, + "lyapunov": 1.4585875352020459, + "grad_norm": 0.10047934695930735, + "grad_max_sv": 0.03824934270232916, + "grad_min_sv": 3.853570776893247e-46, + "grad_condition": 38249342702.329155, + "lr": 0.000810573890139155, + "time_sec": 41.74794268608093 + }, + { + "epoch": 44, + "train_loss": 5.244575652618408, + "train_acc": 0.0093, + "test_loss": 4.9594275024414065, + "test_acc": 0.01, + "lyapunov": 1.4588656959021489, + "grad_norm": 0.09576972429911833, + "grad_max_sv": 0.031089681945741177, + "grad_min_sv": 0.0, + "grad_condition": 31089681945.741173, + "lr": 0.0008022995574311873, + "time_sec": 41.72138214111328 + }, + { + "epoch": 45, + "train_loss": 5.2458512478637696, + "train_acc": 0.00958, + "test_loss": 4.983256524658203, + "test_acc": 0.01, + "lyapunov": 1.460322377017087, + "grad_norm": 0.09632514814173115, + "grad_max_sv": 0.02758595086634159, + "grad_min_sv": 0.0, + "grad_condition": 27585950866.34159, + "lr": 0.0007938926261462363, + "time_sec": 41.73388934135437 + }, + { + "epoch": 46, + "train_loss": 5.245156242980957, + "train_acc": 0.00914, + "test_loss": 5.5051834045410155, + "test_acc": 0.01, + "lyapunov": 1.459906402451303, + "grad_norm": 0.09376667391500292, + "grad_max_sv": 0.017312733735889197, + "grad_min_sv": 0.0, + "grad_condition": 17312733735.8892, + "lr": 0.0007853567838422158, + "time_sec": 41.682612657547 + }, + { + "epoch": 47, + "train_loss": 5.24946335647583, + "train_acc": 0.0092, + "test_loss": 5.037567407989502, + "test_acc": 0.01, + "lyapunov": 1.464009671260024, + "grad_norm": 0.09467776161020446, + "grad_max_sv": 0.01866090311668813, + "grad_min_sv": 0.0, + "grad_condition": 18660903116.688133, + "lr": 0.0007766957746216719, + "time_sec": 41.71859622001648 + }, + { + "epoch": 48, + "train_loss": 5.2716734535217284, + "train_acc": 0.00954, + "test_loss": 4.725313116455078, + "test_acc": 0.01, + "lyapunov": 1.4846527972794554, + "grad_norm": 0.12086822830734321, + "grad_max_sv": 0.020449956133961677, + "grad_min_sv": 0.0, + "grad_condition": 20449956133.961678, + "lr": 0.0007679133974894982, + "time_sec": 41.662288427352905 + }, + { + "epoch": 49, + "train_loss": 5.264281662597656, + "train_acc": 0.0094, + "test_loss": 4.704328326416015, + "test_acc": 0.01, + "lyapunov": 1.4808302587255493, + "grad_norm": 0.1006442361474557, + "grad_max_sv": 0.003648173250257969, + "grad_min_sv": 0.0, + "grad_condition": 3648173250.257969, + "lr": 0.000759013504686565, + "time_sec": 41.659945011138916 + }, + { + "epoch": 50, + "train_loss": 5.260963584136963, + "train_acc": 0.00864, + "test_loss": 4.687705662536621, + "test_acc": 0.01, + "lyapunov": 1.4764524859845485, + "grad_norm": 0.08983274926440024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007499999999999998, + "time_sec": 41.73585891723633 + }, + { + "epoch": 51, + "train_loss": 5.254029862213135, + "train_acc": 0.00892, + "test_loss": 4.650592637634277, + "test_acc": 0.01, + "lyapunov": 1.4702172300699727, + "grad_norm": 0.08943196133143812, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508575, + "time_sec": 41.63914966583252 + }, + { + "epoch": 52, + "train_loss": 5.253371743927002, + "train_acc": 0.00914, + "test_loss": 4.651584497070313, + "test_acc": 0.01, + "lyapunov": 1.469337931984221, + "grad_norm": 0.09050035162045282, + "grad_max_sv": 0.00823306110687554, + "grad_min_sv": 0.0, + "grad_condition": 8233061106.875539, + "lr": 0.0007316480175599307, + "time_sec": 41.676894187927246 + }, + { + "epoch": 53, + "train_loss": 5.25479355255127, + "train_acc": 0.00884, + "test_loss": 4.6638921875, + "test_acc": 0.01, + "lyapunov": 1.4709156809560477, + "grad_norm": 0.0923409314747527, + "grad_max_sv": 0.01720760380849242, + "grad_min_sv": 0.0, + "grad_condition": 17207603808.492424, + "lr": 0.0007223175895924635, + "time_sec": 41.68897199630737 + }, + { + "epoch": 54, + "train_loss": 5.255663233642578, + "train_acc": 0.0087, + "test_loss": 4.690281636047363, + "test_acc": 0.01, + "lyapunov": 1.4720432532717809, + "grad_norm": 0.09116086408440177, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825361, + "time_sec": 41.65702509880066 + }, + { + "epoch": 55, + "train_loss": 5.255450089111328, + "train_acc": 0.0089, + "test_loss": 4.664666540527343, + "test_acc": 0.01, + "lyapunov": 1.4717262035135723, + "grad_norm": 0.08960989934748306, + "grad_max_sv": 0.0027584049850702284, + "grad_min_sv": 0.0, + "grad_condition": 2758404985.0702286, + "lr": 0.0007033683215378998, + "time_sec": 41.68492293357849 + }, + { + "epoch": 56, + "train_loss": 5.25642558013916, + "train_acc": 0.00918, + "test_loss": 4.672654594421386, + "test_acc": 0.01, + "lyapunov": 1.4729856798411025, + "grad_norm": 0.08842004194228453, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006937577932260512, + "time_sec": 41.66422128677368 + }, + { + "epoch": 57, + "train_loss": 5.256343665313721, + "train_acc": 0.00928, + "test_loss": 4.675612693786621, + "test_acc": 0.01, + "lyapunov": 1.4728102668776841, + "grad_norm": 0.0894492177832343, + "grad_max_sv": 0.003824355313554406, + "grad_min_sv": 0.0, + "grad_condition": 3824355313.554406, + "lr": 0.0006840622763423388, + "time_sec": 41.66166043281555 + }, + { + "epoch": 58, + "train_loss": 5.256470738372803, + "train_acc": 0.00846, + "test_loss": 4.673555949401855, + "test_acc": 0.01, + "lyapunov": 1.473022796918669, + "grad_norm": 0.09415093095699927, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006742860236609073, + "time_sec": 41.72664546966553 + }, + { + "epoch": 59, + "train_loss": 5.257105118560791, + "train_acc": 0.0089, + "test_loss": 4.662265467834473, + "test_acc": 0.01, + "lyapunov": 1.4737855485638085, + "grad_norm": 0.08933320536804817, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006644333233692913, + "time_sec": 41.683704137802124 + }, + { + "epoch": 60, + "train_loss": 5.2567843800354, + "train_acc": 0.00894, + "test_loss": 4.67973249130249, + "test_acc": 0.01, + "lyapunov": 1.4734186650542043, + "grad_norm": 0.08845010319296705, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874734, + "time_sec": 41.65764546394348 + }, + { + "epoch": 61, + "train_loss": 5.2586814794921874, + "train_acc": 0.00832, + "test_loss": 4.66929153137207, + "test_acc": 0.01, + "lyapunov": 1.4755458350071822, + "grad_norm": 0.08796570828809193, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006445158984722354, + "time_sec": 41.66641640663147 + }, + { + "epoch": 62, + "train_loss": 5.257138239135743, + "train_acc": 0.00822, + "test_loss": 4.672049102783203, + "test_acc": 0.01, + "lyapunov": 1.4738077528946234, + "grad_norm": 0.08897000656850247, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006344599103076324, + "time_sec": 41.66154670715332 + }, + { + "epoch": 63, + "train_loss": 5.25840109664917, + "train_acc": 0.00872, + "test_loss": 4.668118723297119, + "test_acc": 0.01, + "lyapunov": 1.4752026089012165, + "grad_norm": 0.08994871774610383, + "grad_max_sv": 0.0018751383759081364, + "grad_min_sv": 0.0, + "grad_condition": 1875138375.9081364, + "lr": 0.0006243449435824269, + "time_sec": 41.65010213851929 + }, + { + "epoch": 64, + "train_loss": 5.259331801910401, + "train_acc": 0.009, + "test_loss": 4.6509183990478515, + "test_acc": 0.01, + "lyapunov": 1.4761373133915465, + "grad_norm": 0.09230518416704733, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006141754350553275, + "time_sec": 41.68602395057678 + }, + { + "epoch": 65, + "train_loss": 5.259325382080078, + "train_acc": 0.00842, + "test_loss": 4.649483604431152, + "test_acc": 0.01, + "lyapunov": 1.4762441697327986, + "grad_norm": 0.09181035955304583, + "grad_max_sv": 0.002657032757997513, + "grad_min_sv": 0.0, + "grad_condition": 2657032757.997513, + "lr": 0.0006039558454088793, + "time_sec": 41.649319648742676 + }, + { + "epoch": 66, + "train_loss": 5.258703485870361, + "train_acc": 0.0089, + "test_loss": 4.659050286865234, + "test_acc": 0.01, + "lyapunov": 1.475566557911046, + "grad_norm": 0.08911107124283034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000593690657292862, + "time_sec": 41.66279911994934 + }, + { + "epoch": 67, + "train_loss": 5.258656344146728, + "train_acc": 0.00868, + "test_loss": 4.652145028686523, + "test_acc": 0.01, + "lyapunov": 1.4755408843155102, + "grad_norm": 0.08984660357930904, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005833843733580507, + "time_sec": 41.65086126327515 + }, + { + "epoch": 68, + "train_loss": 5.259207654724121, + "train_acc": 0.00934, + "test_loss": 4.644708920288086, + "test_acc": 0.01, + "lyapunov": 1.476156848470878, + "grad_norm": 0.08930414014303266, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005730415142812054, + "time_sec": 41.6753249168396 + }, + { + "epoch": 69, + "train_loss": 5.259739582061767, + "train_acc": 0.00962, + "test_loss": 4.635655142974853, + "test_acc": 0.01, + "lyapunov": 1.4767807136716136, + "grad_norm": 0.08868883564267036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821517, + "time_sec": 41.6395525932312 + }, + { + "epoch": 70, + "train_loss": 5.258972863311768, + "train_acc": 0.0098, + "test_loss": 4.630142547607422, + "test_acc": 0.01, + "lyapunov": 1.4758698986009564, + "grad_norm": 0.08847186803439672, + "grad_max_sv": 0.0013374987989664077, + "grad_min_sv": 0.0, + "grad_condition": 1337498798.9664078, + "lr": 0.0005522642316338265, + "time_sec": 41.64910697937012 + }, + { + "epoch": 71, + "train_loss": 5.259250410003662, + "train_acc": 0.00816, + "test_loss": 4.623734491729737, + "test_acc": 0.01, + "lyapunov": 1.4762009812133086, + "grad_norm": 0.0884158256705388, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005418389216661573, + "time_sec": 41.65673208236694 + }, + { + "epoch": 72, + "train_loss": 5.260035207519532, + "train_acc": 0.00856, + "test_loss": 4.622923696899414, + "test_acc": 0.01, + "lyapunov": 1.4770802146638446, + "grad_norm": 0.08974113871672654, + "grad_max_sv": 0.00768307838588953, + "grad_min_sv": 0.0, + "grad_condition": 7683078385.889531, + "lr": 0.0005313952597646563, + "time_sec": 41.65725779533386 + }, + { + "epoch": 73, + "train_loss": 5.258972092895508, + "train_acc": 0.0089, + "test_loss": 4.627894605255127, + "test_acc": 0.01, + "lyapunov": 1.4759459010780316, + "grad_norm": 0.08863002112233408, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005209378268645994, + "time_sec": 41.67947006225586 + }, + { + "epoch": 74, + "train_loss": 5.260160232849121, + "train_acc": 0.00854, + "test_loss": 4.623137206268311, + "test_acc": 0.01, + "lyapunov": 1.4772573081428741, + "grad_norm": 0.09051043005437374, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005104712099416781, + "time_sec": 41.64360570907593 + }, + { + "epoch": 75, + "train_loss": 5.261452306213379, + "train_acc": 0.0086, + "test_loss": 4.62108766708374, + "test_acc": 0.01, + "lyapunov": 1.478764491617832, + "grad_norm": 0.08870478754258258, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004999999999999996, + "time_sec": 41.64626455307007 + }, + { + "epoch": 76, + "train_loss": 5.2611726042175295, + "train_acc": 0.00886, + "test_loss": 4.623955220794678, + "test_acc": 0.01, + "lyapunov": 1.4784429673953434, + "grad_norm": 0.08878094000275963, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004895287900583212, + "time_sec": 41.656346797943115 + }, + { + "epoch": 77, + "train_loss": 5.261820520782471, + "train_acc": 0.00874, + "test_loss": 4.61466668548584, + "test_acc": 0.01, + "lyapunov": 1.479163033273214, + "grad_norm": 0.088273880644991, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004790621731353997, + "time_sec": 41.629544734954834 + }, + { + "epoch": 78, + "train_loss": 5.262518656311035, + "train_acc": 0.00864, + "test_loss": 4.618248620605469, + "test_acc": 0.01, + "lyapunov": 1.4799401089358513, + "grad_norm": 0.08861130102060333, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000468604740235343, + "time_sec": 41.636940240859985 + }, + { + "epoch": 79, + "train_loss": 5.262553581237793, + "train_acc": 0.009, + "test_loss": 4.612181239318848, + "test_acc": 0.01, + "lyapunov": 1.4799358280723358, + "grad_norm": 0.0903783960157925, + "grad_max_sv": 0.01033918051980436, + "grad_min_sv": 0.0, + "grad_condition": 10339180519.80436, + "lr": 0.00045816107833384175, + "time_sec": 41.68020677566528 + }, + { + "epoch": 80, + "train_loss": 5.261878743896484, + "train_acc": 0.00886, + "test_loss": 4.612385320281982, + "test_acc": 0.01, + "lyapunov": 1.4792317411173945, + "grad_norm": 0.08815903777083657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 41.65713667869568 + }, + { + "epoch": 81, + "train_loss": 5.270162540740967, + "train_acc": 0.00948, + "test_loss": 4.61169965209961, + "test_acc": 0.01, + "lyapunov": 1.4845762399151503, + "grad_norm": 0.08933321451984454, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784746, + "time_sec": 41.67780160903931 + }, + { + "epoch": 82, + "train_loss": 5.261875872955322, + "train_acc": 0.00904, + "test_loss": 4.612089576721192, + "test_acc": 0.01, + "lyapunov": 1.47926344438587, + "grad_norm": 0.08839554451712253, + "grad_max_sv": 0.0006388438399881124, + "grad_min_sv": 0.0, + "grad_condition": 638843839.9881124, + "lr": 0.0004269584857187939, + "time_sec": 41.646398305892944 + }, + { + "epoch": 83, + "train_loss": 5.260851752319336, + "train_acc": 0.00926, + "test_loss": 4.605935791778564, + "test_acc": 0.01, + "lyapunov": 1.4780823766727886, + "grad_norm": 0.08881372923156301, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004166156266419484, + "time_sec": 41.64280557632446 + }, + { + "epoch": 84, + "train_loss": 5.261813834838867, + "train_acc": 0.0087, + "test_loss": 4.608912050628662, + "test_acc": 0.01, + "lyapunov": 1.4791915989897746, + "grad_norm": 0.08828411260554986, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004063093427071373, + "time_sec": 41.650211811065674 + }, + { + "epoch": 85, + "train_loss": 5.26105229888916, + "train_acc": 0.00876, + "test_loss": 4.607143463134766, + "test_acc": 0.01, + "lyapunov": 1.4783552308826495, + "grad_norm": 0.08801037770330913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003960441545911199, + "time_sec": 41.64579463005066 + }, + { + "epoch": 86, + "train_loss": 5.262948518676758, + "train_acc": 0.0089, + "test_loss": 4.605761601257324, + "test_acc": 0.01, + "lyapunov": 1.4804744302769146, + "grad_norm": 0.08824824639135734, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003858245649446718, + "time_sec": 41.694432497024536 + }, + { + "epoch": 87, + "train_loss": 5.261626904449463, + "train_acc": 0.00888, + "test_loss": 4.605769618988037, + "test_acc": 0.01, + "lyapunov": 1.4789858986349667, + "grad_norm": 0.08846494510980996, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00037565505641757235, + "time_sec": 41.681015491485596 + }, + { + "epoch": 88, + "train_loss": 5.262741643371582, + "train_acc": 0.00854, + "test_loss": 4.60517066192627, + "test_acc": 0.01, + "lyapunov": 1.4802151354377533, + "grad_norm": 0.08805740561566744, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036554008969236695, + "time_sec": 41.71163582801819 + }, + { + "epoch": 89, + "train_loss": 5.263213445281982, + "train_acc": 0.00854, + "test_loss": 4.605359262847901, + "test_acc": 0.01, + "lyapunov": 1.480777892005413, + "grad_norm": 0.08816151399502117, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003554841015277638, + "time_sec": 41.67105174064636 + }, + { + "epoch": 90, + "train_loss": 5.262189238433838, + "train_acc": 0.00928, + "test_loss": 4.605318756103515, + "test_acc": 0.01, + "lyapunov": 1.4796337014269036, + "grad_norm": 0.08930367772167215, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000345491502812526, + "time_sec": 41.640591859817505 + }, + { + "epoch": 91, + "train_loss": 5.261863013916016, + "train_acc": 0.00846, + "test_loss": 4.605316780853271, + "test_acc": 0.01, + "lyapunov": 1.4792772080282421, + "grad_norm": 0.08825121039889311, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003355666766307081, + "time_sec": 41.705339193344116 + }, + { + "epoch": 92, + "train_loss": 5.263724805908203, + "train_acc": 0.0084, + "test_loss": 4.605317385101318, + "test_acc": 0.01, + "lyapunov": 1.4813950381925345, + "grad_norm": 0.0876042035379079, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00032571397633909225, + "time_sec": 41.64047455787659 + }, + { + "epoch": 93, + "train_loss": 5.263348481750488, + "train_acc": 0.00826, + "test_loss": 4.605170777893067, + "test_acc": 0.01, + "lyapunov": 1.480857576250725, + "grad_norm": 0.09205208782948476, + "grad_max_sv": 0.007683574734255671, + "grad_min_sv": 0.0, + "grad_condition": 7683574734.2556715, + "lr": 0.00031593772365766094, + "time_sec": 41.66976022720337 + }, + { + "epoch": 94, + "train_loss": 5.263678814697266, + "train_acc": 0.0087, + "test_loss": 4.605170695495605, + "test_acc": 0.01, + "lyapunov": 1.481314537775181, + "grad_norm": 0.09018876116473232, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003062422067739483, + "time_sec": 41.65629434585571 + }, + { + "epoch": 95, + "train_loss": 5.262105151977539, + "train_acc": 0.00832, + "test_loss": 4.605170751190186, + "test_acc": 0.01, + "lyapunov": 1.479619727110314, + "grad_norm": 0.08829391493330081, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00029663167846209965, + "time_sec": 41.637601375579834 + }, + { + "epoch": 96, + "train_loss": 5.261454503326416, + "train_acc": 0.00892, + "test_loss": 4.605170954895019, + "test_acc": 0.01, + "lyapunov": 1.4788271173491807, + "grad_norm": 0.08829025030553274, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00028711035421746345, + "time_sec": 41.64588212966919 + }, + { + "epoch": 97, + "train_loss": 5.2617424992370605, + "train_acc": 0.00796, + "test_loss": 4.605170453643799, + "test_acc": 0.01, + "lyapunov": 1.4791636610275034, + "grad_norm": 0.08832466346515266, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 41.67742967605591 + }, + { + "epoch": 98, + "train_loss": 5.263716314086914, + "train_acc": 0.00858, + "test_loss": 4.605170697784424, + "test_acc": 0.01, + "lyapunov": 1.4813884213147566, + "grad_norm": 0.08840081765609732, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00026835198244006903, + "time_sec": 41.668766260147095 + }, + { + "epoch": 99, + "train_loss": 5.263833166656494, + "train_acc": 0.0087, + "test_loss": 4.605170695495605, + "test_acc": 0.01, + "lyapunov": 1.4815085251313036, + "grad_norm": 0.08792820202741711, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 41.66829442977905 + }, + { + "epoch": 100, + "train_loss": 5.262581251525879, + "train_acc": 0.00938, + "test_loss": 4.605170309448242, + "test_acc": 0.01, + "lyapunov": 1.480138891188385, + "grad_norm": 0.08832421824906611, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 41.68127655982971 + }, + { + "epoch": 101, + "train_loss": 5.263155633087158, + "train_acc": 0.00926, + "test_loss": 4.605170729064941, + "test_acc": 0.01, + "lyapunov": 1.480774727928669, + "grad_norm": 0.08869235909302142, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00024098649531343477, + "time_sec": 41.64776301383972 + }, + { + "epoch": 102, + "train_loss": 5.263860197906494, + "train_acc": 0.00848, + "test_loss": 4.6051703002929685, + "test_acc": 0.01, + "lyapunov": 1.4815483535342204, + "grad_norm": 0.08903961910912474, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 41.674145460128784 + }, + { + "epoch": 103, + "train_loss": 5.262970734710693, + "train_acc": 0.00884, + "test_loss": 4.605170517730713, + "test_acc": 0.01, + "lyapunov": 1.4805596624798787, + "grad_norm": 0.08876501131615566, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 41.65722608566284 + }, + { + "epoch": 104, + "train_loss": 5.26228626159668, + "train_acc": 0.00864, + "test_loss": 4.6051704086303715, + "test_acc": 0.01, + "lyapunov": 1.4798069201466981, + "grad_norm": 0.08768680006785402, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 41.67565131187439 + }, + { + "epoch": 105, + "train_loss": 5.262674415435791, + "train_acc": 0.00838, + "test_loss": 4.6051702949523925, + "test_acc": 0.01, + "lyapunov": 1.480235590654261, + "grad_norm": 0.08782166200414132, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 41.69558024406433 + }, + { + "epoch": 106, + "train_loss": 5.261244326171875, + "train_acc": 0.00838, + "test_loss": 4.605170240020752, + "test_acc": 0.01, + "lyapunov": 1.4786384803864656, + "grad_norm": 0.08788578987148214, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 41.650753021240234 + }, + { + "epoch": 107, + "train_loss": 5.261433357849121, + "train_acc": 0.00904, + "test_loss": 4.605170213317871, + "test_acc": 0.01, + "lyapunov": 1.47886505273297, + "grad_norm": 0.08770929414544659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 41.68164348602295 + }, + { + "epoch": 108, + "train_loss": 5.263026925201416, + "train_acc": 0.009, + "test_loss": 4.60517043762207, + "test_acc": 0.01, + "lyapunov": 1.480643398621503, + "grad_norm": 0.08785423875011682, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000181288005125655, + "time_sec": 41.660765647888184 + }, + { + "epoch": 109, + "train_loss": 5.263078652801513, + "train_acc": 0.00816, + "test_loss": 4.605601066589355, + "test_acc": 0.01, + "lyapunov": 1.4807295979136397, + "grad_norm": 0.08803442353918925, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001732896980049473, + "time_sec": 41.66913390159607 + }, + { + "epoch": 110, + "train_loss": 5.263812705535889, + "train_acc": 0.00886, + "test_loss": 4.605602632141113, + "test_acc": 0.01, + "lyapunov": 1.4815696554110789, + "grad_norm": 0.08891727786082522, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 41.659369230270386 + }, + { + "epoch": 111, + "train_loss": 5.262115261535644, + "train_acc": 0.0078, + "test_loss": 4.605170052337646, + "test_acc": 0.01, + "lyapunov": 1.479651604771919, + "grad_norm": 0.08875181240277763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 41.70141959190369 + }, + { + "epoch": 112, + "train_loss": 5.261109837646484, + "train_acc": 0.00874, + "test_loss": 4.605170468139648, + "test_acc": 0.01, + "lyapunov": 1.4785008156086172, + "grad_norm": 0.08816074014970703, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 41.72004580497742 + }, + { + "epoch": 113, + "train_loss": 5.262560579681397, + "train_acc": 0.0086, + "test_loss": 4.6051704193115235, + "test_acc": 0.01, + "lyapunov": 1.4801284751623793, + "grad_norm": 0.08840941179148938, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 41.699143409729004 + }, + { + "epoch": 114, + "train_loss": 5.263074327697754, + "train_acc": 0.00886, + "test_loss": 4.605170431518554, + "test_acc": 0.01, + "lyapunov": 1.4807007001793904, + "grad_norm": 0.08821068724217689, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 41.67876648902893 + }, + { + "epoch": 115, + "train_loss": 5.262186526947022, + "train_acc": 0.0086, + "test_loss": 4.60517013092041, + "test_acc": 0.01, + "lyapunov": 1.4797226050320793, + "grad_norm": 0.0883831455880719, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 41.696322202682495 + }, + { + "epoch": 116, + "train_loss": 5.263145412445068, + "train_acc": 0.00836, + "test_loss": 4.605170120239258, + "test_acc": 0.01, + "lyapunov": 1.480826344026629, + "grad_norm": 0.08792566727039719, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 41.70669603347778 + }, + { + "epoch": 117, + "train_loss": 5.263297129516602, + "train_acc": 0.00834, + "test_loss": 4.60517033996582, + "test_acc": 0.01, + "lyapunov": 1.4809697009718326, + "grad_norm": 0.0880297462141732, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 41.66155934333801 + }, + { + "epoch": 118, + "train_loss": 5.263041806030273, + "train_acc": 0.00838, + "test_loss": 4.605170127868653, + "test_acc": 0.01, + "lyapunov": 1.4806942784267922, + "grad_norm": 0.0885706870416634, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 41.6468141078949 + }, + { + "epoch": 119, + "train_loss": 5.2626050819396974, + "train_acc": 0.00882, + "test_loss": 4.6051702911376955, + "test_acc": 0.01, + "lyapunov": 1.4802038822027728, + "grad_norm": 0.08805401420662645, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 41.67359256744385 + }, + { + "epoch": 120, + "train_loss": 5.262915015411377, + "train_acc": 0.00904, + "test_loss": 4.605170024108887, + "test_acc": 0.01, + "lyapunov": 1.4805879507528241, + "grad_norm": 0.08796658508917193, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 41.736050844192505 + }, + { + "epoch": 121, + "train_loss": 5.263114930877686, + "train_acc": 0.0083, + "test_loss": 4.605170388031006, + "test_acc": 0.01, + "lyapunov": 1.4807836167952593, + "grad_norm": 0.08806195734422055, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 41.839574337005615 + }, + { + "epoch": 122, + "train_loss": 5.262788164825439, + "train_acc": 0.00866, + "test_loss": 4.605170208740234, + "test_acc": 0.01, + "lyapunov": 1.4804405013618567, + "grad_norm": 0.08816097534558247, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 41.688995599746704 + }, + { + "epoch": 123, + "train_loss": 5.26315210357666, + "train_acc": 0.00874, + "test_loss": 4.60517013168335, + "test_acc": 0.01, + "lyapunov": 1.480828346498787, + "grad_norm": 0.08865951427268862, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 41.67227745056152 + }, + { + "epoch": 124, + "train_loss": 5.261944111022949, + "train_acc": 0.00914, + "test_loss": 4.605170402526856, + "test_acc": 0.01, + "lyapunov": 1.4794809848756132, + "grad_norm": 0.08788803702349164, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 41.66115140914917 + }, + { + "epoch": 125, + "train_loss": 5.262568561401367, + "train_acc": 0.0084, + "test_loss": 4.60517010345459, + "test_acc": 0.01, + "lyapunov": 1.4801926018331972, + "grad_norm": 0.08788675914126909, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 41.66165113449097 + }, + { + "epoch": 126, + "train_loss": 5.262280065460205, + "train_acc": 0.00902, + "test_loss": 4.605170187377929, + "test_acc": 0.01, + "lyapunov": 1.479902151295596, + "grad_norm": 0.08819775554912056, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 41.69537806510925 + }, + { + "epoch": 127, + "train_loss": 5.263674239196777, + "train_acc": 0.00884, + "test_loss": 4.605170446777343, + "test_acc": 0.01, + "lyapunov": 1.48142600425369, + "grad_norm": 0.08796249954554257, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 41.79696488380432 + }, + { + "epoch": 128, + "train_loss": 5.270508392181396, + "train_acc": 0.00774, + "test_loss": 4.6051702003479, + "test_acc": 0.01, + "lyapunov": 1.4854568767425653, + "grad_norm": 0.0903277044807366, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 41.78498363494873 + }, + { + "epoch": 129, + "train_loss": 5.264521000213623, + "train_acc": 0.00884, + "test_loss": 4.60517049331665, + "test_acc": 0.01, + "lyapunov": 1.4823556894536518, + "grad_norm": 0.08791573530006377, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 41.75825619697571 + }, + { + "epoch": 130, + "train_loss": 5.263497207641602, + "train_acc": 0.00856, + "test_loss": 4.605170115661621, + "test_acc": 0.01, + "lyapunov": 1.4812386575562264, + "grad_norm": 0.08821103937271832, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 41.753769874572754 + }, + { + "epoch": 131, + "train_loss": 5.262869830932617, + "train_acc": 0.00886, + "test_loss": 4.605170347595215, + "test_acc": 0.01, + "lyapunov": 1.4805735938079523, + "grad_norm": 0.08785954608269858, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 41.688891649246216 + }, + { + "epoch": 132, + "train_loss": 5.261720856323242, + "train_acc": 0.0092, + "test_loss": 4.605170230865479, + "test_acc": 0.01, + "lyapunov": 1.4792467572195145, + "grad_norm": 0.087651258765062, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 41.77381873130798 + }, + { + "epoch": 133, + "train_loss": 5.262511810150147, + "train_acc": 0.0094, + "test_loss": 4.605170274353028, + "test_acc": 0.01, + "lyapunov": 1.480145969354283, + "grad_norm": 0.08750516435565067, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 41.82425284385681 + }, + { + "epoch": 134, + "train_loss": 5.2628221615600586, + "train_acc": 0.009, + "test_loss": 4.605170260620117, + "test_acc": 0.01, + "lyapunov": 1.480488061295141, + "grad_norm": 0.08767200957157907, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 41.67008709907532 + }, + { + "epoch": 135, + "train_loss": 5.262214541320801, + "train_acc": 0.00906, + "test_loss": 4.605170357513428, + "test_acc": 0.01, + "lyapunov": 1.479800993524244, + "grad_norm": 0.08833622992837174, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 41.68112754821777 + }, + { + "epoch": 136, + "train_loss": 5.261716612854004, + "train_acc": 0.00888, + "test_loss": 4.605170449829101, + "test_acc": 0.01, + "lyapunov": 1.4792663523608156, + "grad_norm": 0.0879915508382305, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 41.70846509933472 + }, + { + "epoch": 137, + "train_loss": 5.2621297309875485, + "train_acc": 0.00882, + "test_loss": 4.6051704208374025, + "test_acc": 0.01, + "lyapunov": 1.4797221123410003, + "grad_norm": 0.08806309329797692, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 41.68800139427185 + }, + { + "epoch": 138, + "train_loss": 5.262034148254394, + "train_acc": 0.009, + "test_loss": 4.6051704246520995, + "test_acc": 0.01, + "lyapunov": 1.4796448052691682, + "grad_norm": 0.08834842868525353, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 41.69483256340027 + }, + { + "epoch": 139, + "train_loss": 5.262303157958985, + "train_acc": 0.00964, + "test_loss": 4.605170336914062, + "test_acc": 0.01, + "lyapunov": 1.479908719696962, + "grad_norm": 0.08774925576434625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 41.66975927352905 + }, + { + "epoch": 140, + "train_loss": 5.262272278747559, + "train_acc": 0.0093, + "test_loss": 4.60517025756836, + "test_acc": 0.01, + "lyapunov": 1.4799000518706145, + "grad_norm": 0.08772068441716457, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 41.66502594947815 + }, + { + "epoch": 141, + "train_loss": 5.262688246459961, + "train_acc": 0.01, + "test_loss": 4.605170532226563, + "test_acc": 0.01, + "lyapunov": 1.4803482586770411, + "grad_norm": 0.08814041677323237, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 41.68389272689819 + }, + { + "epoch": 142, + "train_loss": 5.2666687211608885, + "train_acc": 0.01, + "test_loss": 4.605170266723633, + "test_acc": 0.01, + "lyapunov": 1.4834284483624236, + "grad_norm": 0.08808456177000348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 41.70149374008179 + }, + { + "epoch": 143, + "train_loss": 5.2625910409545895, + "train_acc": 0.00962, + "test_loss": 4.605170193481445, + "test_acc": 0.01, + "lyapunov": 1.4802313485108982, + "grad_norm": 0.08826750361435122, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 41.675010204315186 + }, + { + "epoch": 144, + "train_loss": 5.260678899536133, + "train_acc": 0.01, + "test_loss": 4.60517022857666, + "test_acc": 0.01, + "lyapunov": 1.4781028556701776, + "grad_norm": 0.08826672055694883, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 41.67730474472046 + }, + { + "epoch": 145, + "train_loss": 5.262034167785645, + "train_acc": 0.01, + "test_loss": 4.605170384216309, + "test_acc": 0.01, + "lyapunov": 1.47965680668726, + "grad_norm": 0.08792698291184464, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 41.711742639541626 + }, + { + "epoch": 146, + "train_loss": 5.262125458984375, + "train_acc": 0.01, + "test_loss": 4.605170105743408, + "test_acc": 0.01, + "lyapunov": 1.4797236641959461, + "grad_norm": 0.0878274682773103, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 41.72946882247925 + }, + { + "epoch": 147, + "train_loss": 5.263207815246582, + "train_acc": 0.01, + "test_loss": 4.605170260620117, + "test_acc": 0.01, + "lyapunov": 1.4809288390152289, + "grad_norm": 0.08780070915999844, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 41.724937438964844 + }, + { + "epoch": 148, + "train_loss": 5.262101231384277, + "train_acc": 0.01, + "test_loss": 4.605170335388183, + "test_acc": 0.01, + "lyapunov": 1.4797268191261974, + "grad_norm": 0.08811462011437057, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 41.86608529090881 + }, + { + "epoch": 149, + "train_loss": 5.26564047592163, + "train_acc": 0.01, + "test_loss": 4.605170273590088, + "test_acc": 0.01, + "lyapunov": 1.4827746887646063, + "grad_norm": 0.088563737069616, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 41.668235540390015 + }, + { + "epoch": 150, + "train_loss": 5.263033789978027, + "train_acc": 0.01, + "test_loss": 4.605170249176026, + "test_acc": 0.01, + "lyapunov": 1.480735678197173, + "grad_norm": 0.08808051231477661, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 41.65666699409485 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 5.146603754577637, + "train_acc": 0.02116, + "test_loss": 4.799143431091308, + "test_acc": 0.0147, + "lyapunov": 2.247725067846001, + "grad_norm": 5.759558294617595, + "grad_max_sv": 4.593458223342895, + "grad_min_sv": 9.939812799508729e-08, + "grad_condition": 84468621.05560377, + "lr": 0.0009998903417374227, + "time_sec": 86.99692106246948 + }, + { + "epoch": 2, + "train_loss": 4.751044019317627, + "train_acc": 0.0261, + "test_loss": 4.781899060058594, + "test_acc": 0.0112, + "lyapunov": 1.7586963832225946, + "grad_norm": 3.669503755077576, + "grad_max_sv": 2.629068848490715, + "grad_min_sv": 6.128463263532779e-08, + "grad_condition": 51408050.19515464, + "lr": 0.0009995614150494292, + "time_sec": 86.99053359031677 + }, + { + "epoch": 3, + "train_loss": 4.5855533428955075, + "train_acc": 0.0302, + "test_loss": 4.783446264648438, + "test_acc": 0.0204, + "lyapunov": 1.650954161458613, + "grad_norm": 1.8760355114337364, + "grad_max_sv": 1.30306978225708, + "grad_min_sv": 3.0873310079282404e-08, + "grad_condition": 74135293.70537718, + "lr": 0.0009990133642141358, + "time_sec": 87.01290392875671 + }, + { + "epoch": 4, + "train_loss": 4.534848844451904, + "train_acc": 0.03702, + "test_loss": 4.8837289710998535, + "test_acc": 0.0149, + "lyapunov": 1.5894556011995087, + "grad_norm": 1.244556287523884, + "grad_max_sv": 0.7792816802859306, + "grad_min_sv": 1.8834766013497984e-08, + "grad_condition": 45093330.72508425, + "lr": 0.0009982464296247522, + "time_sec": 87.01876306533813 + }, + { + "epoch": 5, + "train_loss": 4.592422800903321, + "train_acc": 0.03296, + "test_loss": 4.848946441650391, + "test_acc": 0.0145, + "lyapunov": 1.5674470586849905, + "grad_norm": 0.9784603406000693, + "grad_max_sv": 0.5906251654028892, + "grad_min_sv": 1.3135394039365212e-08, + "grad_condition": 2765173736.408195, + "lr": 0.0009972609476841367, + "time_sec": 87.06145668029785 + }, + { + "epoch": 6, + "train_loss": 4.617396930847168, + "train_acc": 0.03438, + "test_loss": 5.069504800415039, + "test_acc": 0.0141, + "lyapunov": 1.5743840259054434, + "grad_norm": 0.8765996249293907, + "grad_max_sv": 0.4905373930931091, + "grad_min_sv": 1.1570106956413153e-08, + "grad_condition": 490506519.64879054, + "lr": 0.000996057350657239, + "time_sec": 86.98913550376892 + }, + { + "epoch": 7, + "train_loss": 4.673418109436035, + "train_acc": 0.03144, + "test_loss": 5.083357322692871, + "test_acc": 0.01, + "lyapunov": 1.5757776337206517, + "grad_norm": 0.842980463237632, + "grad_max_sv": 0.4635330677032471, + "grad_min_sv": 9.801791714218744e-09, + "grad_condition": 672093861.9243783, + "lr": 0.000994636166481494, + "time_sec": 87.02865362167358 + }, + { + "epoch": 8, + "train_loss": 4.715173123626709, + "train_acc": 0.02866, + "test_loss": 6.969320404052734, + "test_acc": 0.01, + "lyapunov": 1.572990819621269, + "grad_norm": 0.7658102895010526, + "grad_max_sv": 0.39840318709611894, + "grad_min_sv": 7.909037175684143e-09, + "grad_condition": 2689350489.23699, + "lr": 0.0009929980185352525, + "time_sec": 87.05855631828308 + }, + { + "epoch": 9, + "train_loss": 4.719650735931396, + "train_acc": 0.03378, + "test_loss": 6.69895283203125, + "test_acc": 0.01, + "lyapunov": 1.5739632753459998, + "grad_norm": 0.6951362665980956, + "grad_max_sv": 0.40656831562519075, + "grad_min_sv": 9.631129597315046e-09, + "grad_condition": 152979631.4939035, + "lr": 0.0009911436253643444, + "time_sec": 87.04356169700623 + }, + { + "epoch": 10, + "train_loss": 4.785277546691894, + "train_acc": 0.03084, + "test_loss": 7.56282477722168, + "test_acc": 0.01, + "lyapunov": 1.5731478392925409, + "grad_norm": 0.8027087514422708, + "grad_max_sv": 0.4249536793678999, + "grad_min_sv": 1.0233699096961427e-08, + "grad_condition": 2212458832.3035727, + "lr": 0.0009890738003669028, + "time_sec": 86.9918863773346 + }, + { + "epoch": 11, + "train_loss": 4.85365997543335, + "train_acc": 0.02776, + "test_loss": 6.083891798400879, + "test_acc": 0.01, + "lyapunov": 1.594173707315684, + "grad_norm": 0.6228665658651402, + "grad_max_sv": 0.3807309426367283, + "grad_min_sv": 7.858218521034076e-09, + "grad_condition": 142247255.9097917, + "lr": 0.00098678945143658, + "time_sec": 87.02730226516724 + }, + { + "epoch": 12, + "train_loss": 4.936503148193359, + "train_acc": 0.02734, + "test_loss": 4.648137149047852, + "test_acc": 0.01, + "lyapunov": 1.6324983204112333, + "grad_norm": 0.8180108242362618, + "grad_max_sv": 0.3168713390827179, + "grad_min_sv": 6.217847966746067e-09, + "grad_condition": 1904828726.2920518, + "lr": 0.0009842915805643154, + "time_sec": 86.98762059211731 + }, + { + "epoch": 13, + "train_loss": 4.989127286529541, + "train_acc": 0.02624, + "test_loss": 5.89718906326294, + "test_acc": 0.01, + "lyapunov": 1.6513543821051908, + "grad_norm": 0.8703418944824507, + "grad_max_sv": 0.3535689525306225, + "grad_min_sv": 6.494354365393917e-09, + "grad_condition": 75061975.40179494, + "lr": 0.000981581283398829, + "time_sec": 86.99741172790527 + }, + { + "epoch": 14, + "train_loss": 5.027360094604492, + "train_acc": 0.02734, + "test_loss": 5.6859222030639645, + "test_acc": 0.01, + "lyapunov": 1.66906841667107, + "grad_norm": 0.8955015428134906, + "grad_max_sv": 0.3326103314757347, + "grad_min_sv": 5.961173611852833e-09, + "grad_condition": 196184685.20064688, + "lr": 0.0009786597487660333, + "time_sec": 86.990553855896 + }, + { + "epoch": 15, + "train_loss": 5.103685426635742, + "train_acc": 0.0235, + "test_loss": 4.620827954101562, + "test_acc": 0.01, + "lyapunov": 1.6500021161325753, + "grad_norm": 0.7165299396921548, + "grad_max_sv": 0.29206431321799753, + "grad_min_sv": 3.742070758853766e-09, + "grad_condition": 11821452317.947672, + "lr": 0.0009755282581475766, + "time_sec": 86.99919128417969 + }, + { + "epoch": 16, + "train_loss": 5.046826876983642, + "train_acc": 0.02808, + "test_loss": 4.618471592712402, + "test_acc": 0.01, + "lyapunov": 1.6286348086183944, + "grad_norm": 0.8805208885120411, + "grad_max_sv": 0.34881011955440044, + "grad_min_sv": 5.4340508724715075e-09, + "grad_condition": 607977502.9364278, + "lr": 0.0009721881851187403, + "time_sec": 87.02350974082947 + }, + { + "epoch": 17, + "train_loss": 5.125038688812256, + "train_acc": 0.02188, + "test_loss": 5.0374674758911135, + "test_acc": 0.01, + "lyapunov": 1.6156021630977426, + "grad_norm": 0.7664664524159326, + "grad_max_sv": 0.31916227340698244, + "grad_min_sv": 3.2244314654420098e-09, + "grad_condition": 12300439770.56846, + "lr": 0.0009686409947459456, + "time_sec": 87.0214216709137 + }, + { + "epoch": 18, + "train_loss": 5.1917090243530275, + "train_acc": 0.02074, + "test_loss": 6.239829849243164, + "test_acc": 0.01, + "lyapunov": 1.6075686880999513, + "grad_norm": 0.8340839537949596, + "grad_max_sv": 0.2987551841884851, + "grad_min_sv": 1.3384357527406395e-09, + "grad_condition": 53090691786.99108, + "lr": 0.0009648882429441254, + "time_sec": 87.0026741027832 + }, + { + "epoch": 19, + "train_loss": 5.1467557635498045, + "train_acc": 0.02224, + "test_loss": 4.859098764038086, + "test_acc": 0.01, + "lyapunov": 1.5547950270840578, + "grad_norm": 0.5424186147523934, + "grad_max_sv": 0.2584996819496155, + "grad_min_sv": 1.7988151973410667e-10, + "grad_condition": 42973213975.62498, + "lr": 0.00096093157579425, + "time_sec": 87.0099880695343 + }, + { + "epoch": 20, + "train_loss": 5.253306176147461, + "train_acc": 0.01948, + "test_loss": 8.813103515625, + "test_acc": 0.01, + "lyapunov": 1.5798406722905385, + "grad_norm": 0.6790335216715864, + "grad_max_sv": 0.2796168942004442, + "grad_min_sv": 1.3123472687420754e-09, + "grad_condition": 55528903276.005905, + "lr": 0.0009567727288213001, + "time_sec": 87.00798654556274 + }, + { + "epoch": 21, + "train_loss": 5.3828185322570805, + "train_acc": 0.01028, + "test_loss": 8.961210163879395, + "test_acc": 0.01, + "lyapunov": 1.566893112933849, + "grad_norm": 0.9785357311156059, + "grad_max_sv": 0.4175733871757984, + "grad_min_sv": 5.038056967646815e-09, + "grad_condition": 2576596333.756474, + "lr": 0.0009524135262330095, + "time_sec": 87.24499773979187 + }, + { + "epoch": 22, + "train_loss": 5.318783715209961, + "train_acc": 0.01022, + "test_loss": 9.226270596313476, + "test_acc": 0.01, + "lyapunov": 1.515167183888233, + "grad_norm": 0.5897187117480035, + "grad_max_sv": 0.32070303708314896, + "grad_min_sv": 3.3304707929004972e-09, + "grad_condition": 145373104.26632357, + "lr": 0.0009478558801197061, + "time_sec": 87.02501797676086 + }, + { + "epoch": 23, + "train_loss": 5.311336210021973, + "train_acc": 0.00992, + "test_loss": 9.553670106506347, + "test_acc": 0.01, + "lyapunov": 1.5058710337294947, + "grad_norm": 0.42067884050272164, + "grad_max_sv": 0.3374065548181534, + "grad_min_sv": 3.917849118045824e-09, + "grad_condition": 148787617.53453642, + "lr": 0.000943101789615607, + "time_sec": 87.03109979629517 + }, + { + "epoch": 24, + "train_loss": 5.310154438018799, + "train_acc": 0.01036, + "test_loss": 7.603771569824219, + "test_acc": 0.01, + "lyapunov": 1.509728124379502, + "grad_norm": 0.3834815238141383, + "grad_max_sv": 0.3096462905406952, + "grad_min_sv": 2.737797575240686e-09, + "grad_condition": 22145829075.872944, + "lr": 0.0009381533400219313, + "time_sec": 86.98246717453003 + }, + { + "epoch": 25, + "train_loss": 5.301079537353516, + "train_acc": 0.00976, + "test_loss": 7.519319520568848, + "test_acc": 0.01, + "lyapunov": 1.5108507871627808, + "grad_norm": 0.30755221598797206, + "grad_max_sv": 0.2302608024328947, + "grad_min_sv": 2.0953720649433853e-11, + "grad_condition": 115571274953.14014, + "lr": 0.0009330127018922189, + "time_sec": 87.00150752067566 + }, + { + "epoch": 26, + "train_loss": 5.2993214897155765, + "train_acc": 0.00926, + "test_loss": 7.535327529907226, + "test_acc": 0.01, + "lyapunov": 1.5122191076693328, + "grad_norm": 0.2686555081361175, + "grad_max_sv": 0.1873680654913187, + "grad_min_sv": 1.1968037446042912e-12, + "grad_condition": 111356408601.78958, + "lr": 0.000927682130080253, + "time_sec": 87.06040525436401 + }, + { + "epoch": 27, + "train_loss": 5.301115319061279, + "train_acc": 0.01026, + "test_loss": 7.4256896377563475, + "test_acc": 0.01, + "lyapunov": 1.5147829875921655, + "grad_norm": 0.2584031825672629, + "grad_max_sv": 0.18733071088790892, + "grad_min_sv": 1.5532640335746842e-12, + "grad_condition": 105854162513.72067, + "lr": 0.0009221639627510072, + "time_sec": 87.0212287902832 + }, + { + "epoch": 28, + "train_loss": 5.300986379394531, + "train_acc": 0.00912, + "test_loss": 7.3856002044677735, + "test_acc": 0.01, + "lyapunov": 1.5147232972752407, + "grad_norm": 0.2414535578672304, + "grad_max_sv": 0.16182587593793868, + "grad_min_sv": 2.716757690251971e-13, + "grad_condition": 139096227622.95874, + "lr": 0.0009164606203550494, + "time_sec": 87.02124691009521 + }, + { + "epoch": 29, + "train_loss": 5.311827180175781, + "train_acc": 0.00958, + "test_loss": 9.537436566162109, + "test_acc": 0.01, + "lyapunov": 1.5239817428466913, + "grad_norm": 0.2934555140553008, + "grad_max_sv": 0.17254459988325835, + "grad_min_sv": 7.800315873566188e-13, + "grad_condition": 118094677554.4253, + "lr": 0.0009105746045668516, + "time_sec": 87.02146863937378 + }, + { + "epoch": 30, + "train_loss": 5.306949669952393, + "train_acc": 0.00986, + "test_loss": 9.629324139404297, + "test_acc": 0.01, + "lyapunov": 1.5190055486186387, + "grad_norm": 0.2568362833037679, + "grad_max_sv": 0.1871931992471218, + "grad_min_sv": 8.733775765521943e-13, + "grad_condition": 124328292229.6437, + "lr": 0.0009045084971874733, + "time_sec": 87.0063271522522 + }, + { + "epoch": 31, + "train_loss": 5.317695409240723, + "train_acc": 0.00946, + "test_loss": 9.857299293518066, + "test_acc": 0.01, + "lyapunov": 1.5297813034423478, + "grad_norm": 0.31967679371455754, + "grad_max_sv": 0.17166709154844284, + "grad_min_sv": 1.3052075569227142e-12, + "grad_condition": 105851795247.06416, + "lr": 0.0008982649590120977, + "time_sec": 87.03139019012451 + }, + { + "epoch": 32, + "train_loss": 5.306474250030518, + "train_acc": 0.00946, + "test_loss": 6.192124473571777, + "test_acc": 0.01, + "lyapunov": 1.5204204305663438, + "grad_norm": 0.22033885472694253, + "grad_max_sv": 0.1525889288634062, + "grad_min_sv": 4.756078352149119e-13, + "grad_condition": 128078379912.95, + "lr": 0.0008918467286629196, + "time_sec": 86.99606108665466 + }, + { + "epoch": 33, + "train_loss": 5.307142764892578, + "train_acc": 0.00976, + "test_loss": 7.497373861694336, + "test_acc": 0.01, + "lyapunov": 1.522810420721693, + "grad_norm": 0.20782539541327114, + "grad_max_sv": 0.13517180345952512, + "grad_min_sv": 1.1068227830043178e-13, + "grad_condition": 123350210961.5916, + "lr": 0.0008852566213878943, + "time_sec": 87.02485609054565 + }, + { + "epoch": 34, + "train_loss": 5.307786667785645, + "train_acc": 0.01036, + "test_loss": 6.049268864440918, + "test_acc": 0.01, + "lyapunov": 1.5257866547235748, + "grad_norm": 0.1890978405416262, + "grad_max_sv": 0.10800869315862656, + "grad_min_sv": 7.129825504179478e-15, + "grad_condition": 107252102588.7272, + "lr": 0.000878497527825878, + "time_sec": 87.10786271095276 + }, + { + "epoch": 35, + "train_loss": 5.3119341674804685, + "train_acc": 0.009, + "test_loss": 4.805781600952148, + "test_acc": 0.01, + "lyapunov": 1.5290101019622724, + "grad_norm": 0.1944266687511967, + "grad_max_sv": 0.11351412069052458, + "grad_min_sv": 1.0284869415209545e-14, + "grad_condition": 112374076474.89091, + "lr": 0.000871572412738697, + "time_sec": 87.02945756912231 + }, + { + "epoch": 36, + "train_loss": 5.30866313369751, + "train_acc": 0.01008, + "test_loss": 5.370443841552734, + "test_acc": 0.01, + "lyapunov": 1.5276334587570346, + "grad_norm": 0.16190926523802132, + "grad_max_sv": 0.09535483401268721, + "grad_min_sv": 3.195651304626571e-15, + "grad_condition": 94990079164.94656, + "lr": 0.0008644843137107055, + "time_sec": 86.99824213981628 + }, + { + "epoch": 37, + "train_loss": 5.308895555877686, + "train_acc": 0.0099, + "test_loss": 4.843223188781738, + "test_acc": 0.01, + "lyapunov": 1.5290613820790635, + "grad_norm": 0.15630460219006667, + "grad_max_sv": 0.08036092817783355, + "grad_min_sv": 1.1315139619811405e-17, + "grad_condition": 80360078431.92064, + "lr": 0.0008572363398164014, + "time_sec": 86.98283195495605 + }, + { + "epoch": 38, + "train_loss": 5.31004166229248, + "train_acc": 0.00976, + "test_loss": 4.780417753601074, + "test_acc": 0.01, + "lyapunov": 1.5300937909299455, + "grad_norm": 0.16356950260232017, + "grad_max_sv": 0.08305604849010706, + "grad_min_sv": 8.648904023608753e-17, + "grad_condition": 83049364241.033, + "lr": 0.0008498316702566826, + "time_sec": 87.12476921081543 + }, + { + "epoch": 39, + "train_loss": 5.308765927276611, + "train_acc": 0.00922, + "test_loss": 4.650610294342041, + "test_acc": 0.01, + "lyapunov": 1.529145797195337, + "grad_norm": 0.13936121996216216, + "grad_max_sv": 0.06846637381240725, + "grad_min_sv": 6.938789416330728e-18, + "grad_condition": 68465862650.46446, + "lr": 0.0008422735529643442, + "time_sec": 87.00707483291626 + }, + { + "epoch": 40, + "train_loss": 5.312034950561523, + "train_acc": 0.00936, + "test_loss": 8.73487543487549, + "test_acc": 0.01, + "lyapunov": 1.532078573465957, + "grad_norm": 0.18500833074783374, + "grad_max_sv": 0.078881626855582, + "grad_min_sv": 1.2209525522074501e-26, + "grad_condition": 78881626855.5808, + "lr": 0.0008345653031794289, + "time_sec": 86.97358655929565 + }, + { + "epoch": 41, + "train_loss": 5.3188898524475094, + "train_acc": 0.00938, + "test_loss": 6.380272773742676, + "test_acc": 0.01, + "lyapunov": 1.5366824176305396, + "grad_norm": 0.16899341003407245, + "grad_max_sv": 0.0827794061973691, + "grad_min_sv": 1.2491873132717773e-20, + "grad_condition": 82779405140.55663, + "lr": 0.0008267103019950526, + "time_sec": 86.98160243034363 + }, + { + "epoch": 42, + "train_loss": 5.311096598052979, + "train_acc": 0.00918, + "test_loss": 6.181304641723633, + "test_acc": 0.01, + "lyapunov": 1.53186220738589, + "grad_norm": 0.14945919124069362, + "grad_max_sv": 0.07147165723145008, + "grad_min_sv": 1.6261729001718281e-18, + "grad_condition": 71471530485.47403, + "lr": 0.0008187119948743447, + "time_sec": 86.98783445358276 + }, + { + "epoch": 43, + "train_loss": 5.311037984619141, + "train_acc": 0.00992, + "test_loss": 6.528422421264648, + "test_acc": 0.01, + "lyapunov": 1.5322752218417195, + "grad_norm": 0.13413981069527348, + "grad_max_sv": 0.05753951920196414, + "grad_min_sv": 5.739214042427294e-41, + "grad_condition": 57539519201.964134, + "lr": 0.000810573890139155, + "time_sec": 87.02233648300171 + }, + { + "epoch": 44, + "train_loss": 5.314179193420411, + "train_acc": 0.00976, + "test_loss": 6.383645655822754, + "test_acc": 0.01, + "lyapunov": 1.5352078728053882, + "grad_norm": 0.15018671176350665, + "grad_max_sv": 0.06426793411374092, + "grad_min_sv": 1.0144677449199871e-19, + "grad_condition": 64267926931.3136, + "lr": 0.0008022995574311873, + "time_sec": 86.99135541915894 + }, + { + "epoch": 45, + "train_loss": 5.3138120045471195, + "train_acc": 0.00972, + "test_loss": 6.1780305633544925, + "test_acc": 0.01, + "lyapunov": 1.53417928048107, + "grad_norm": 0.1546946181453632, + "grad_max_sv": 0.07538183946162462, + "grad_min_sv": 2.0235549254645516e-17, + "grad_condition": 75380064770.74498, + "lr": 0.0007938926261462363, + "time_sec": 86.9700219631195 + }, + { + "epoch": 46, + "train_loss": 5.31338122253418, + "train_acc": 0.01088, + "test_loss": 4.875375650024414, + "test_acc": 0.01, + "lyapunov": 1.5348101799445384, + "grad_norm": 0.13799834022044194, + "grad_max_sv": 0.05826565367169678, + "grad_min_sv": 1.2213807007518915e-19, + "grad_condition": 58265644274.60155, + "lr": 0.0007853567838422158, + "time_sec": 86.9914186000824 + }, + { + "epoch": 47, + "train_loss": 5.316119242401123, + "train_acc": 0.01028, + "test_loss": 7.579864669799805, + "test_acc": 0.01, + "lyapunov": 1.5372701596725933, + "grad_norm": 0.1318310224117309, + "grad_max_sv": 0.059043215587735176, + "grad_min_sv": 1.0278524235822533e-42, + "grad_condition": 59043215587.73517, + "lr": 0.0007766957746216719, + "time_sec": 86.99268984794617 + }, + { + "epoch": 48, + "train_loss": 5.3163630574035645, + "train_acc": 0.00918, + "test_loss": 8.10872494354248, + "test_acc": 0.01, + "lyapunov": 1.537570302443736, + "grad_norm": 0.14919853802284255, + "grad_max_sv": 0.059043734613806007, + "grad_min_sv": 1.9169802249728662e-27, + "grad_condition": 59043734613.80581, + "lr": 0.0007679133974894982, + "time_sec": 86.96942186355591 + }, + { + "epoch": 49, + "train_loss": 5.315186663513184, + "train_acc": 0.00982, + "test_loss": 10.137148637390137, + "test_acc": 0.01, + "lyapunov": 1.5357392169630435, + "grad_norm": 0.14339565437399782, + "grad_max_sv": 0.07659720163792372, + "grad_min_sv": 9.214212859750722e-16, + "grad_condition": 76509866898.91414, + "lr": 0.000759013504686565, + "time_sec": 87.01622128486633 + }, + { + "epoch": 50, + "train_loss": 5.314455534973145, + "train_acc": 0.0102, + "test_loss": 8.247185594177246, + "test_acc": 0.01, + "lyapunov": 1.5355263009400624, + "grad_norm": 0.13354715221640268, + "grad_max_sv": 0.06603035274893046, + "grad_min_sv": 4.3361800326764774e-19, + "grad_condition": 66030309212.30867, + "lr": 0.0007499999999999998, + "time_sec": 86.99394655227661 + }, + { + "epoch": 51, + "train_loss": 5.32153740737915, + "train_acc": 0.01, + "test_loss": 8.37662465057373, + "test_acc": 0.01, + "lyapunov": 1.5409153455968403, + "grad_norm": 0.14502327588857133, + "grad_max_sv": 0.06259518237784505, + "grad_min_sv": 4.890059136866219e-20, + "grad_condition": 62595178420.28666, + "lr": 0.0007408768370508575, + "time_sec": 86.97510194778442 + }, + { + "epoch": 52, + "train_loss": 5.316599715270996, + "train_acc": 0.00936, + "test_loss": 8.278748655700683, + "test_acc": 0.01, + "lyapunov": 1.5381617646692964, + "grad_norm": 0.1359300928840212, + "grad_max_sv": 0.05868045939132571, + "grad_min_sv": 2.1909536115890692e-21, + "grad_condition": 58680459216.2619, + "lr": 0.0007316480175599307, + "time_sec": 86.98001670837402 + }, + { + "epoch": 53, + "train_loss": 5.316536732788086, + "train_acc": 0.01016, + "test_loss": 5.486338158416748, + "test_acc": 0.01, + "lyapunov": 1.5382660676146407, + "grad_norm": 0.1271741910618785, + "grad_max_sv": 0.05760562280192971, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 57605622801.92971, + "lr": 0.0007223175895924635, + "time_sec": 86.99369311332703 + }, + { + "epoch": 54, + "train_loss": 5.316702398681641, + "train_acc": 0.0102, + "test_loss": 5.302798899841308, + "test_acc": 0.01, + "lyapunov": 1.5386110059440594, + "grad_norm": 0.15368852800875965, + "grad_max_sv": 0.0578720694873482, + "grad_min_sv": 1.7830822309301135e-42, + "grad_condition": 57872069487.348206, + "lr": 0.0007128896457825361, + "time_sec": 86.96624207496643 + }, + { + "epoch": 55, + "train_loss": 5.316231355743408, + "train_acc": 0.00948, + "test_loss": 8.74564740600586, + "test_acc": 0.01, + "lyapunov": 1.5383109363448588, + "grad_norm": 0.13190622008458677, + "grad_max_sv": 0.04535484011285007, + "grad_min_sv": 0.0, + "grad_condition": 45354840112.850075, + "lr": 0.0007033683215378998, + "time_sec": 86.97799372673035 + }, + { + "epoch": 56, + "train_loss": 5.317534141235352, + "train_acc": 0.00946, + "test_loss": 8.70028028869629, + "test_acc": 0.01, + "lyapunov": 1.5393455677934924, + "grad_norm": 0.13462977039802712, + "grad_max_sv": 0.06513494476675988, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 65134944766.75987, + "lr": 0.0006937577932260512, + "time_sec": 86.98487591743469 + }, + { + "epoch": 57, + "train_loss": 5.318079041290283, + "train_acc": 0.0097, + "test_loss": 9.145556756591796, + "test_acc": 0.01, + "lyapunov": 1.5401513216745517, + "grad_norm": 0.13118847481535986, + "grad_max_sv": 0.05173748955130577, + "grad_min_sv": 0.0, + "grad_condition": 51737489551.30577, + "lr": 0.0006840622763423388, + "time_sec": 87.00480890274048 + }, + { + "epoch": 58, + "train_loss": 5.316858307800293, + "train_acc": 0.00892, + "test_loss": 8.666381803894042, + "test_acc": 0.01, + "lyapunov": 1.5383905370522033, + "grad_norm": 0.12912610896619198, + "grad_max_sv": 0.06017917674034834, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 60179176740.34834, + "lr": 0.0006742860236609073, + "time_sec": 87.00866675376892 + }, + { + "epoch": 59, + "train_loss": 5.325099550476074, + "train_acc": 0.00954, + "test_loss": 8.285526527404786, + "test_acc": 0.01, + "lyapunov": 1.544173507739211, + "grad_norm": 0.15876381906710343, + "grad_max_sv": 0.06922355592250824, + "grad_min_sv": 2.3088949294307303e-16, + "grad_condition": 69207800483.04135, + "lr": 0.0006644333233692913, + "time_sec": 86.97984671592712 + }, + { + "epoch": 60, + "train_loss": 5.3204884049987795, + "train_acc": 0.0094, + "test_loss": 8.168935748291016, + "test_acc": 0.01, + "lyapunov": 1.5423277512840603, + "grad_norm": 0.12428279151580043, + "grad_max_sv": 0.05191116128116846, + "grad_min_sv": 0.0, + "grad_condition": 51911161281.168465, + "lr": 0.0006545084971874734, + "time_sec": 86.99251651763916 + }, + { + "epoch": 61, + "train_loss": 5.318557815551758, + "train_acc": 0.00974, + "test_loss": 11.625576313781739, + "test_acc": 0.01, + "lyapunov": 1.5408994303944776, + "grad_norm": 0.11981934242025526, + "grad_max_sv": 0.04157847780734301, + "grad_min_sv": 0.0, + "grad_condition": 41578477807.343, + "lr": 0.0006445158984722354, + "time_sec": 86.97000765800476 + }, + { + "epoch": 62, + "train_loss": 5.320785666503906, + "train_acc": 0.00938, + "test_loss": 12.541597724914551, + "test_acc": 0.01, + "lyapunov": 1.5433500727729115, + "grad_norm": 0.11919617488574552, + "grad_max_sv": 0.04310994283296168, + "grad_min_sv": 0.0, + "grad_condition": 43109942832.96168, + "lr": 0.0006344599103076324, + "time_sec": 86.96448731422424 + }, + { + "epoch": 63, + "train_loss": 5.32412813293457, + "train_acc": 0.0091, + "test_loss": 11.793109805297851, + "test_acc": 0.01, + "lyapunov": 1.5443742366702966, + "grad_norm": 0.118004366839836, + "grad_max_sv": 0.0428059502504766, + "grad_min_sv": 0.0, + "grad_condition": 42805950250.4766, + "lr": 0.0006243449435824269, + "time_sec": 86.93323230743408 + }, + { + "epoch": 64, + "train_loss": 5.318806624603272, + "train_acc": 0.00956, + "test_loss": 12.444959045410156, + "test_acc": 0.01, + "lyapunov": 1.5414444375830842, + "grad_norm": 0.11645932110555444, + "grad_max_sv": 0.030990714300423862, + "grad_min_sv": 0.0, + "grad_condition": 30990714300.42386, + "lr": 0.0006141754350553275, + "time_sec": 86.89740920066833 + }, + { + "epoch": 65, + "train_loss": 5.317045929870606, + "train_acc": 0.01018, + "test_loss": 10.023806936645508, + "test_acc": 0.01, + "lyapunov": 1.5395582572883353, + "grad_norm": 0.11276313707472024, + "grad_max_sv": 0.03361189742572605, + "grad_min_sv": 0.0, + "grad_condition": 33611897425.726055, + "lr": 0.0006039558454088793, + "time_sec": 86.97432947158813 + }, + { + "epoch": 66, + "train_loss": 5.32016941192627, + "train_acc": 0.00944, + "test_loss": 10.012617837524415, + "test_acc": 0.01, + "lyapunov": 1.5425440329115103, + "grad_norm": 0.10590387961842582, + "grad_max_sv": 0.02548480206169188, + "grad_min_sv": 0.0, + "grad_condition": 25484802061.691883, + "lr": 0.000593690657292862, + "time_sec": 86.97213578224182 + }, + { + "epoch": 67, + "train_loss": 5.320958078460693, + "train_acc": 0.00912, + "test_loss": 8.012544973754883, + "test_acc": 0.01, + "lyapunov": 1.5432329269321374, + "grad_norm": 0.11098177802612447, + "grad_max_sv": 0.028018432063981892, + "grad_min_sv": 0.0, + "grad_condition": 28018432063.98189, + "lr": 0.0005833843733580507, + "time_sec": 86.92108106613159 + }, + { + "epoch": 68, + "train_loss": 5.319859785614014, + "train_acc": 0.0098, + "test_loss": 9.247186422729492, + "test_acc": 0.01, + "lyapunov": 1.542363587852634, + "grad_norm": 0.1248664197770911, + "grad_max_sv": 0.04367699818685651, + "grad_min_sv": 0.0, + "grad_condition": 43676998186.85651, + "lr": 0.0005730415142812054, + "time_sec": 86.95592594146729 + }, + { + "epoch": 69, + "train_loss": 5.318826563873291, + "train_acc": 0.01016, + "test_loss": 10.35489285736084, + "test_acc": 0.01, + "lyapunov": 1.5414060040203201, + "grad_norm": 0.10987589074835707, + "grad_max_sv": 0.03276977320201695, + "grad_min_sv": 0.0, + "grad_condition": 32769773202.01695, + "lr": 0.0005626666167821517, + "time_sec": 86.91380739212036 + }, + { + "epoch": 70, + "train_loss": 5.317324656524658, + "train_acc": 0.01038, + "test_loss": 9.99694027709961, + "test_acc": 0.01, + "lyapunov": 1.5401056565896933, + "grad_norm": 0.10923451968148526, + "grad_max_sv": 0.026721618324518203, + "grad_min_sv": 0.0, + "grad_condition": 26721618324.518204, + "lr": 0.0005522642316338265, + "time_sec": 86.8878607749939 + }, + { + "epoch": 71, + "train_loss": 5.317690666198731, + "train_acc": 0.00962, + "test_loss": 8.448246655273438, + "test_acc": 0.01, + "lyapunov": 1.5407067177545688, + "grad_norm": 0.10993057282913465, + "grad_max_sv": 0.021391112776473164, + "grad_min_sv": 0.0, + "grad_condition": 21391112776.473164, + "lr": 0.0005418389216661573, + "time_sec": 86.89513158798218 + }, + { + "epoch": 72, + "train_loss": 5.317815923156738, + "train_acc": 0.01004, + "test_loss": 12.15319383392334, + "test_acc": 0.01, + "lyapunov": 1.5406005382537842, + "grad_norm": 0.11546754813601234, + "grad_max_sv": 0.04164923094213009, + "grad_min_sv": 0.0, + "grad_condition": 41649230942.13009, + "lr": 0.0005313952597646563, + "time_sec": 86.93751883506775 + }, + { + "epoch": 73, + "train_loss": 5.318552890930175, + "train_acc": 0.009, + "test_loss": 7.365837602996826, + "test_acc": 0.01, + "lyapunov": 1.5411235444685991, + "grad_norm": 0.11378399985617368, + "grad_max_sv": 0.03538390537723899, + "grad_min_sv": 0.0, + "grad_condition": 35383905377.23899, + "lr": 0.0005209378268645994, + "time_sec": 86.92508888244629 + }, + { + "epoch": 74, + "train_loss": 5.3266375039672855, + "train_acc": 0.00916, + "test_loss": 5.939176264190674, + "test_acc": 0.01, + "lyapunov": 1.5473728344568511, + "grad_norm": 0.112949937059148, + "grad_max_sv": 0.01943044299259782, + "grad_min_sv": 0.0, + "grad_condition": 19430442992.597816, + "lr": 0.0005104712099416781, + "time_sec": 86.87594652175903 + }, + { + "epoch": 75, + "train_loss": 5.3182286242675785, + "train_acc": 0.00916, + "test_loss": 7.4682364219665525, + "test_acc": 0.01, + "lyapunov": 1.5411189620757042, + "grad_norm": 0.11641453125231847, + "grad_max_sv": 0.01762835620902479, + "grad_min_sv": 0.0, + "grad_condition": 17628356209.024788, + "lr": 0.0004999999999999996, + "time_sec": 86.89264059066772 + }, + { + "epoch": 76, + "train_loss": 5.318416892242432, + "train_acc": 0.00958, + "test_loss": 6.8439142288208, + "test_acc": 0.01, + "lyapunov": 1.5413539412686281, + "grad_norm": 0.10777855944530633, + "grad_max_sv": 0.015298370318487287, + "grad_min_sv": 0.0, + "grad_condition": 15298370318.487286, + "lr": 0.0004895287900583212, + "time_sec": 86.88371872901917 + }, + { + "epoch": 77, + "train_loss": 5.3228406227111815, + "train_acc": 0.00964, + "test_loss": 10.02866414489746, + "test_acc": 0.01, + "lyapunov": 1.544968852606576, + "grad_norm": 0.1305888852844692, + "grad_max_sv": 0.01963789644651115, + "grad_min_sv": 0.0, + "grad_condition": 19637896446.51115, + "lr": 0.0004790621731353997, + "time_sec": 86.87340235710144 + }, + { + "epoch": 78, + "train_loss": 5.319401046447754, + "train_acc": 0.00956, + "test_loss": 8.256184762573243, + "test_acc": 0.01, + "lyapunov": 1.54242708158615, + "grad_norm": 0.11168685518140656, + "grad_max_sv": 0.02321814843453467, + "grad_min_sv": 0.0, + "grad_condition": 23218148434.534668, + "lr": 0.000468604740235343, + "time_sec": 86.87403607368469 + }, + { + "epoch": 79, + "train_loss": 5.319539002532959, + "train_acc": 0.00924, + "test_loss": 6.6485612655639645, + "test_acc": 0.01, + "lyapunov": 1.5427932879504036, + "grad_norm": 0.1281479832918265, + "grad_max_sv": 0.014649314666166901, + "grad_min_sv": 0.0, + "grad_condition": 14649314666.1669, + "lr": 0.00045816107833384175, + "time_sec": 86.86377239227295 + }, + { + "epoch": 80, + "train_loss": 5.321709277648925, + "train_acc": 0.00858, + "test_loss": 7.656314584350586, + "test_acc": 0.01, + "lyapunov": 1.5438944933664462, + "grad_norm": 0.1379118039308171, + "grad_max_sv": 0.006280570011585951, + "grad_min_sv": 0.0, + "grad_condition": 6280570011.585951, + "lr": 0.0004477357683661729, + "time_sec": 86.91206550598145 + }, + { + "epoch": 81, + "train_loss": 5.319362686614991, + "train_acc": 0.00904, + "test_loss": 7.019269757080078, + "test_acc": 0.01, + "lyapunov": 1.542548160723713, + "grad_norm": 0.12802539188386938, + "grad_max_sv": 0.019554349593818188, + "grad_min_sv": 0.0, + "grad_condition": 19554349593.818188, + "lr": 0.00043733338321784746, + "time_sec": 86.88340616226196 + }, + { + "epoch": 82, + "train_loss": 5.319549789886475, + "train_acc": 0.00932, + "test_loss": 7.563053443908691, + "test_acc": 0.01, + "lyapunov": 1.5428213295729265, + "grad_norm": 0.12962728912126797, + "grad_max_sv": 0.011001831339672207, + "grad_min_sv": 0.0, + "grad_condition": 11001831339.672207, + "lr": 0.0004269584857187939, + "time_sec": 87.12197208404541 + }, + { + "epoch": 83, + "train_loss": 5.3209361798095705, + "train_acc": 0.01004, + "test_loss": 8.245951638793946, + "test_acc": 0.01, + "lyapunov": 1.543517429810351, + "grad_norm": 0.12992986434807738, + "grad_max_sv": 0.011371771851554514, + "grad_min_sv": 0.0, + "grad_condition": 11371771851.554514, + "lr": 0.0004166156266419484, + "time_sec": 86.8549747467041 + }, + { + "epoch": 84, + "train_loss": 5.319158186340332, + "train_acc": 0.00988, + "test_loss": 11.181426934814453, + "test_acc": 0.01, + "lyapunov": 1.5418739129820138, + "grad_norm": 0.14570895237027714, + "grad_max_sv": 0.03400726960971952, + "grad_min_sv": 0.0, + "grad_condition": 34007269609.719513, + "lr": 0.0004063093427071373, + "time_sec": 86.95320224761963 + }, + { + "epoch": 85, + "train_loss": 5.319012271881103, + "train_acc": 0.0104, + "test_loss": 8.699293096923828, + "test_acc": 0.01, + "lyapunov": 1.5420828835128824, + "grad_norm": 0.15422110126668967, + "grad_max_sv": 0.0475749587174505, + "grad_min_sv": 0.0, + "grad_condition": 47574958717.4505, + "lr": 0.0003960441545911199, + "time_sec": 86.97516655921936 + }, + { + "epoch": 86, + "train_loss": 5.319778329925537, + "train_acc": 0.0099, + "test_loss": 8.610072163391113, + "test_acc": 0.01, + "lyapunov": 1.5427404270147729, + "grad_norm": 0.16350408468824804, + "grad_max_sv": 0.0467130537610501, + "grad_min_sv": 0.0, + "grad_condition": 46713053761.0501, + "lr": 0.0003858245649446718, + "time_sec": 86.97473764419556 + }, + { + "epoch": 87, + "train_loss": 5.320261403961181, + "train_acc": 0.01, + "test_loss": 9.01234596862793, + "test_acc": 0.01, + "lyapunov": 1.5430970234639199, + "grad_norm": 0.1987413764171708, + "grad_max_sv": 0.042272613104432824, + "grad_min_sv": 0.0, + "grad_condition": 42272613104.432816, + "lr": 0.00037565505641757235, + "time_sec": 86.94777846336365 + }, + { + "epoch": 88, + "train_loss": 5.328781169433594, + "train_acc": 0.00958, + "test_loss": 7.222933032226562, + "test_acc": 0.01, + "lyapunov": 1.5479203133326966, + "grad_norm": 0.20200984386229512, + "grad_max_sv": 0.037374650174751875, + "grad_min_sv": 2.888694869312344e-20, + "grad_condition": 37374645422.50441, + "lr": 0.00036554008969236695, + "time_sec": 86.9300582408905 + }, + { + "epoch": 89, + "train_loss": 5.3212895065307615, + "train_acc": 0.00972, + "test_loss": 7.341721871948242, + "test_acc": 0.01, + "lyapunov": 1.5442103443243314, + "grad_norm": 0.21135067798139123, + "grad_max_sv": 0.03894036049023271, + "grad_min_sv": 0.0, + "grad_condition": 38940360490.232704, + "lr": 0.0003554841015277638, + "time_sec": 87.02612471580505 + }, + { + "epoch": 90, + "train_loss": 5.319550964050293, + "train_acc": 0.0093, + "test_loss": 7.149930093383789, + "test_acc": 0.01, + "lyapunov": 1.5423216917325773, + "grad_norm": 0.17437221481494697, + "grad_max_sv": 0.04075719062238932, + "grad_min_sv": 0.0, + "grad_condition": 40757190622.38932, + "lr": 0.000345491502812526, + "time_sec": 86.95247411727905 + }, + { + "epoch": 91, + "train_loss": 5.319614014892578, + "train_acc": 0.00888, + "test_loss": 7.18144443359375, + "test_acc": 0.01, + "lyapunov": 1.5426533264882119, + "grad_norm": 0.17520092959369415, + "grad_max_sv": 0.022456927318125965, + "grad_min_sv": 0.0, + "grad_condition": 22456927318.125965, + "lr": 0.0003355666766307081, + "time_sec": 86.8960337638855 + }, + { + "epoch": 92, + "train_loss": 5.3187762687683104, + "train_acc": 0.00888, + "test_loss": 7.264889540863037, + "test_acc": 0.01, + "lyapunov": 1.5419618226683047, + "grad_norm": 0.1656377365844615, + "grad_max_sv": 0.015189866488799452, + "grad_min_sv": 0.0, + "grad_condition": 15189866488.799454, + "lr": 0.00032571397633909225, + "time_sec": 86.88141465187073 + }, + { + "epoch": 93, + "train_loss": 5.321614575958252, + "train_acc": 0.00952, + "test_loss": 7.152406310272217, + "test_acc": 0.01, + "lyapunov": 1.5444753560263786, + "grad_norm": 0.1783525963324978, + "grad_max_sv": 0.024426844296976925, + "grad_min_sv": 0.0, + "grad_condition": 24426844296.97692, + "lr": 0.00031593772365766094, + "time_sec": 86.87559199333191 + }, + { + "epoch": 94, + "train_loss": 5.319984560089111, + "train_acc": 0.0098, + "test_loss": 7.227280062866211, + "test_acc": 0.01, + "lyapunov": 1.543088520884209, + "grad_norm": 0.16043633002422977, + "grad_max_sv": 0.0368963482324034, + "grad_min_sv": 0.0, + "grad_condition": 36896348232.4034, + "lr": 0.0003062422067739483, + "time_sec": 86.98869109153748 + }, + { + "epoch": 95, + "train_loss": 5.318843619537353, + "train_acc": 0.00988, + "test_loss": 7.253403067016602, + "test_acc": 0.01, + "lyapunov": 1.5419552667671457, + "grad_norm": 0.15988427664274688, + "grad_max_sv": 0.03179542766883969, + "grad_min_sv": 0.0, + "grad_condition": 31795427668.83969, + "lr": 0.00029663167846209965, + "time_sec": 86.96610736846924 + }, + { + "epoch": 96, + "train_loss": 5.321573169403076, + "train_acc": 0.00976, + "test_loss": 6.988779404449463, + "test_acc": 0.01, + "lyapunov": 1.5446298613267786, + "grad_norm": 0.14208572570705744, + "grad_max_sv": 0.03598490892909467, + "grad_min_sv": 0.0, + "grad_condition": 35984908929.09467, + "lr": 0.00028711035421746345, + "time_sec": 86.90040850639343 + }, + { + "epoch": 97, + "train_loss": 5.325382752685547, + "train_acc": 0.00972, + "test_loss": 6.935153257751465, + "test_acc": 0.01, + "lyapunov": 1.5469825359256677, + "grad_norm": 0.18543936556050314, + "grad_max_sv": 0.024622759968042373, + "grad_min_sv": 0.0, + "grad_condition": 24622759968.042374, + "lr": 0.00027768241040753615, + "time_sec": 86.86737728118896 + }, + { + "epoch": 98, + "train_loss": 5.319345963439941, + "train_acc": 0.0094, + "test_loss": 6.679858758544922, + "test_acc": 0.01, + "lyapunov": 1.5427014974072157, + "grad_norm": 0.1365697052360637, + "grad_max_sv": 0.0006230609491467476, + "grad_min_sv": 0.0, + "grad_condition": 623060949.1467476, + "lr": 0.00026835198244006903, + "time_sec": 86.8515510559082 + }, + { + "epoch": 99, + "train_loss": 5.31858975479126, + "train_acc": 0.00966, + "test_loss": 6.5813590454101565, + "test_acc": 0.01, + "lyapunov": 1.5418859296442602, + "grad_norm": 0.13741337242075724, + "grad_max_sv": 0.0017974570393562317, + "grad_min_sv": 0.0, + "grad_condition": 1797457039.3562317, + "lr": 0.0002591231629491421, + "time_sec": 86.8734724521637 + }, + { + "epoch": 100, + "train_loss": 5.319550311279297, + "train_acc": 0.0096, + "test_loss": 6.593423309326172, + "test_acc": 0.01, + "lyapunov": 1.5429147582529756, + "grad_norm": 0.1428860474069435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 86.91073799133301 + }, + { + "epoch": 101, + "train_loss": 5.319647026672364, + "train_acc": 0.00946, + "test_loss": 6.644115385437011, + "test_acc": 0.01, + "lyapunov": 1.5430320498278685, + "grad_norm": 0.14070137371271418, + "grad_max_sv": 0.0011870765592902899, + "grad_min_sv": 0.0, + "grad_condition": 1187076559.2902899, + "lr": 0.00024098649531343477, + "time_sec": 86.85703229904175 + }, + { + "epoch": 102, + "train_loss": 5.320731920471191, + "train_acc": 0.01, + "test_loss": 6.511743521118164, + "test_acc": 0.01, + "lyapunov": 1.544078452202975, + "grad_norm": 0.16647090297400036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002320866025105016, + "time_sec": 86.84212875366211 + }, + { + "epoch": 103, + "train_loss": 5.320380414123536, + "train_acc": 0.0087, + "test_loss": 6.558885827636718, + "test_acc": 0.01, + "lyapunov": 1.5436865057786713, + "grad_norm": 0.16211214182978093, + "grad_max_sv": 0.0006886070128530264, + "grad_min_sv": 0.0, + "grad_condition": 688607012.8530264, + "lr": 0.0002233042253783278, + "time_sec": 86.84861445426941 + }, + { + "epoch": 104, + "train_loss": 5.320676337890625, + "train_acc": 0.0096, + "test_loss": 6.2893127243041995, + "test_acc": 0.01, + "lyapunov": 1.5437259469800593, + "grad_norm": 0.15756640000371477, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000214643216157784, + "time_sec": 86.85342407226562 + }, + { + "epoch": 105, + "train_loss": 5.318497552947998, + "train_acc": 0.00968, + "test_loss": 6.463031019592285, + "test_acc": 0.01, + "lyapunov": 1.5418586124239675, + "grad_norm": 0.16471254677440242, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376332, + "time_sec": 86.83621501922607 + }, + { + "epoch": 106, + "train_loss": 5.319013707885742, + "train_acc": 0.00958, + "test_loss": 8.393161967468261, + "test_acc": 0.01, + "lyapunov": 1.5424105264341739, + "grad_norm": 0.1697085900956353, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 86.87845063209534 + }, + { + "epoch": 107, + "train_loss": 5.319404435882569, + "train_acc": 0.01006, + "test_loss": 6.168719081115722, + "test_acc": 0.01, + "lyapunov": 1.5427791502164758, + "grad_norm": 0.16661392944132697, + "grad_max_sv": 0.008691688347607852, + "grad_min_sv": 0.0, + "grad_condition": 8691688347.607851, + "lr": 0.0001894261098608447, + "time_sec": 86.86028218269348 + }, + { + "epoch": 108, + "train_loss": 5.320062127532959, + "train_acc": 0.00946, + "test_loss": 6.123481111145019, + "test_acc": 0.01, + "lyapunov": 1.543502251510425, + "grad_norm": 0.1553396268788007, + "grad_max_sv": 0.0017994886264204979, + "grad_min_sv": 0.0, + "grad_condition": 1799488626.420498, + "lr": 0.000181288005125655, + "time_sec": 86.88756346702576 + }, + { + "epoch": 109, + "train_loss": 5.32126156539917, + "train_acc": 0.0097, + "test_loss": 6.113170930480957, + "test_acc": 0.01, + "lyapunov": 1.5443304225306986, + "grad_norm": 0.16827005574777967, + "grad_max_sv": 0.008998295897617936, + "grad_min_sv": 0.0, + "grad_condition": 8998295897.617935, + "lr": 0.0001732896980049473, + "time_sec": 86.87347865104675 + }, + { + "epoch": 110, + "train_loss": 5.319310050964355, + "train_acc": 0.00904, + "test_loss": 6.0610163803100585, + "test_acc": 0.01, + "lyapunov": 1.5427448618442505, + "grad_norm": 0.14666590598052404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016543469682057076, + "time_sec": 86.86950135231018 + }, + { + "epoch": 111, + "train_loss": 5.319597338256836, + "train_acc": 0.00972, + "test_loss": 6.453852326202393, + "test_acc": 0.01, + "lyapunov": 1.5429801303712303, + "grad_norm": 0.15909427151540545, + "grad_max_sv": 0.008126799669116735, + "grad_min_sv": 0.0, + "grad_condition": 8126799669.116735, + "lr": 0.00015772644703565552, + "time_sec": 86.88328433036804 + }, + { + "epoch": 112, + "train_loss": 5.3212175, + "train_acc": 0.00984, + "test_loss": 6.988222769927979, + "test_acc": 0.01, + "lyapunov": 1.5440433973546528, + "grad_norm": 0.15582154742531334, + "grad_max_sv": 0.023284211242571472, + "grad_min_sv": 0.0, + "grad_condition": 23284211242.571472, + "lr": 0.00015016832974331713, + "time_sec": 86.88312244415283 + }, + { + "epoch": 113, + "train_loss": 5.320971462249756, + "train_acc": 0.0098, + "test_loss": 6.753297560882569, + "test_acc": 0.01, + "lyapunov": 1.5437339016848513, + "grad_norm": 0.15454565641823212, + "grad_max_sv": 0.0231532484292984, + "grad_min_sv": 0.0, + "grad_condition": 23153248429.2984, + "lr": 0.00014276366018359834, + "time_sec": 86.87558174133301 + }, + { + "epoch": 114, + "train_loss": 5.318772131958008, + "train_acc": 0.00984, + "test_loss": 6.465322698974609, + "test_acc": 0.01, + "lyapunov": 1.5421108507439303, + "grad_norm": 0.15163809922079102, + "grad_max_sv": 0.017600245866924526, + "grad_min_sv": 0.0, + "grad_condition": 17600245866.924522, + "lr": 0.00013551568628929425, + "time_sec": 86.85901880264282 + }, + { + "epoch": 115, + "train_loss": 5.323592142486572, + "train_acc": 0.00918, + "test_loss": 5.990406560516357, + "test_acc": 0.01, + "lyapunov": 1.5453894397486811, + "grad_norm": 0.15673824664274916, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 86.8471782207489 + }, + { + "epoch": 116, + "train_loss": 5.321912714385986, + "train_acc": 0.00934, + "test_loss": 5.642854423522949, + "test_acc": 0.01, + "lyapunov": 1.5451806213544763, + "grad_norm": 0.14873545301539315, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 86.82159352302551 + }, + { + "epoch": 117, + "train_loss": 5.319042910766601, + "train_acc": 0.00916, + "test_loss": 5.394878324890136, + "test_acc": 0.01, + "lyapunov": 1.5425118525009935, + "grad_norm": 0.15364989808867727, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 86.8501136302948 + }, + { + "epoch": 118, + "train_loss": 5.3216519416809085, + "train_acc": 0.0099, + "test_loss": 5.54234706954956, + "test_acc": 0.01, + "lyapunov": 1.544617168738714, + "grad_norm": 0.16204040482857374, + "grad_max_sv": 0.014768891455605625, + "grad_min_sv": 0.0, + "grad_condition": 14768891455.605625, + "lr": 0.00010815327133708009, + "time_sec": 86.8445405960083 + }, + { + "epoch": 119, + "train_loss": 5.318838922729492, + "train_acc": 0.00982, + "test_loss": 5.401806521606446, + "test_acc": 0.01, + "lyapunov": 1.5422493301694045, + "grad_norm": 0.16127338804024163, + "grad_max_sv": 0.00781935746781528, + "grad_min_sv": 0.0, + "grad_condition": 7819357467.81528, + "lr": 0.00010173504098790182, + "time_sec": 86.82885694503784 + }, + { + "epoch": 120, + "train_loss": 5.319433266448975, + "train_acc": 0.00962, + "test_loss": 5.87718871307373, + "test_acc": 0.01, + "lyapunov": 1.5428460543722753, + "grad_norm": 0.16811186230922795, + "grad_max_sv": 0.003142098290845752, + "grad_min_sv": 0.0, + "grad_condition": 3142098290.845752, + "lr": 9.549150281252629e-05, + "time_sec": 86.83435249328613 + }, + { + "epoch": 121, + "train_loss": 5.318956566009521, + "train_acc": 0.00864, + "test_loss": 5.642109811401367, + "test_acc": 0.01, + "lyapunov": 1.5424094806851634, + "grad_norm": 0.16401865280170627, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 86.84270787239075 + }, + { + "epoch": 122, + "train_loss": 5.320396621246338, + "train_acc": 0.00946, + "test_loss": 5.506566726684571, + "test_acc": 0.01, + "lyapunov": 1.543682734984571, + "grad_norm": 0.16574195620383422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 86.84029245376587 + }, + { + "epoch": 123, + "train_loss": 5.3207761328125, + "train_acc": 0.0098, + "test_loss": 5.753901168823242, + "test_acc": 0.01, + "lyapunov": 1.5442172185234402, + "grad_norm": 0.17475767067470402, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 86.83801436424255 + }, + { + "epoch": 124, + "train_loss": 5.318808111877441, + "train_acc": 0.00922, + "test_loss": 5.811789031982422, + "test_acc": 0.01, + "lyapunov": 1.5422291850190029, + "grad_norm": 0.16090202757718183, + "grad_max_sv": 0.003358612256124616, + "grad_min_sv": 0.0, + "grad_condition": 3358612256.1246157, + "lr": 7.231786991974666e-05, + "time_sec": 86.8513069152832 + }, + { + "epoch": 125, + "train_loss": 5.319976197967529, + "train_acc": 0.00978, + "test_loss": 5.7769184440612795, + "test_acc": 0.01, + "lyapunov": 1.543531141622597, + "grad_norm": 0.15700147429987782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 86.86197853088379 + }, + { + "epoch": 126, + "train_loss": 5.318454194946289, + "train_acc": 0.00986, + "test_loss": 6.11075336303711, + "test_acc": 0.01, + "lyapunov": 1.5418975673368216, + "grad_norm": 0.15336017967137117, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 86.86198329925537 + }, + { + "epoch": 127, + "train_loss": 5.3203326902771, + "train_acc": 0.00934, + "test_loss": 6.080118833160401, + "test_acc": 0.01, + "lyapunov": 1.5438893414519328, + "grad_norm": 0.15768179334274351, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 86.84648036956787 + }, + { + "epoch": 128, + "train_loss": 5.318091445770263, + "train_acc": 0.0093, + "test_loss": 6.249022463989258, + "test_acc": 0.01, + "lyapunov": 1.5415176842218774, + "grad_norm": 0.15317629834457977, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 86.83089065551758 + }, + { + "epoch": 129, + "train_loss": 5.319208795776367, + "train_acc": 0.00944, + "test_loss": 6.242862550354004, + "test_acc": 0.01, + "lyapunov": 1.5426923082307782, + "grad_norm": 0.1586342865712123, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 86.8825249671936 + }, + { + "epoch": 130, + "train_loss": 5.319570325469971, + "train_acc": 0.00932, + "test_loss": 6.273485357666016, + "test_acc": 0.01, + "lyapunov": 1.5430697696593108, + "grad_norm": 0.16288378510968, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 86.85678577423096 + }, + { + "epoch": 131, + "train_loss": 5.31834419998169, + "train_acc": 0.00966, + "test_loss": 6.162585590362549, + "test_acc": 0.01, + "lyapunov": 1.5417695389989088, + "grad_norm": 0.15701283230384563, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 86.83028483390808 + }, + { + "epoch": 132, + "train_loss": 5.319475943603516, + "train_acc": 0.0094, + "test_loss": 6.003315113067627, + "test_acc": 0.01, + "lyapunov": 1.5429863951090352, + "grad_norm": 0.1615796670941878, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 86.82017540931702 + }, + { + "epoch": 133, + "train_loss": 5.32576198135376, + "train_acc": 0.00958, + "test_loss": 5.846498718261719, + "test_acc": 0.01, + "lyapunov": 1.5467814566839078, + "grad_norm": 0.1814711768537964, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 86.84380340576172 + }, + { + "epoch": 134, + "train_loss": 5.321647165985107, + "train_acc": 0.00952, + "test_loss": 5.876250485229492, + "test_acc": 0.01, + "lyapunov": 1.544941949722407, + "grad_norm": 0.18078759337952854, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 86.84492230415344 + }, + { + "epoch": 135, + "train_loss": 5.31924706817627, + "train_acc": 0.0096, + "test_loss": 5.819815138244629, + "test_acc": 0.01, + "lyapunov": 1.5427488103851943, + "grad_norm": 0.16329066142016732, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 86.83999133110046 + }, + { + "epoch": 136, + "train_loss": 5.319398911132812, + "train_acc": 0.00982, + "test_loss": 6.490616073608399, + "test_acc": 0.01, + "lyapunov": 1.5429087801052785, + "grad_norm": 0.15926311416791136, + "grad_max_sv": 0.0018711634445935487, + "grad_min_sv": 0.0, + "grad_condition": 1871163444.5935485, + "lr": 2.1340251233966362e-05, + "time_sec": 86.86916947364807 + }, + { + "epoch": 137, + "train_loss": 5.318829065551758, + "train_acc": 0.00978, + "test_loss": 5.920670237731934, + "test_acc": 0.01, + "lyapunov": 1.5422979410347122, + "grad_norm": 0.16006466704199326, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 86.87598538398743 + }, + { + "epoch": 138, + "train_loss": 5.3190561383056645, + "train_acc": 0.00948, + "test_loss": 6.480327618408203, + "test_acc": 0.01, + "lyapunov": 1.5425209660664239, + "grad_norm": 0.16458438595098937, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 86.83726739883423 + }, + { + "epoch": 139, + "train_loss": 5.318953646392822, + "train_acc": 0.00984, + "test_loss": 5.952891006469726, + "test_acc": 0.01, + "lyapunov": 1.5424313371443688, + "grad_norm": 0.16278457254190812, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 86.83793210983276 + }, + { + "epoch": 140, + "train_loss": 5.3213463069152835, + "train_acc": 0.00976, + "test_loss": 6.456882773590088, + "test_acc": 0.01, + "lyapunov": 1.5445466053760266, + "grad_norm": 0.16371751816212385, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 86.85442423820496 + }, + { + "epoch": 141, + "train_loss": 5.318112189025879, + "train_acc": 0.00942, + "test_loss": 6.3592885223388675, + "test_acc": 0.01, + "lyapunov": 1.5415452919957582, + "grad_norm": 0.16093776786582448, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 86.8611011505127 + }, + { + "epoch": 142, + "train_loss": 5.319325820617676, + "train_acc": 0.00982, + "test_loss": 6.396855745697022, + "test_acc": 0.01, + "lyapunov": 1.5428402808011341, + "grad_norm": 0.16262217434072207, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 86.8790693283081 + }, + { + "epoch": 143, + "train_loss": 5.319489360198975, + "train_acc": 0.0098, + "test_loss": 6.390167568206787, + "test_acc": 0.01, + "lyapunov": 1.5430222728368266, + "grad_norm": 0.1599024522956201, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 86.8610942363739 + }, + { + "epoch": 144, + "train_loss": 5.3194953466796875, + "train_acc": 0.00936, + "test_loss": 6.3929207939147945, + "test_acc": 0.01, + "lyapunov": 1.5430299802814298, + "grad_norm": 0.15787151048989498, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 86.83452033996582 + }, + { + "epoch": 145, + "train_loss": 5.319091488189697, + "train_acc": 0.0099, + "test_loss": 6.387041884613037, + "test_acc": 0.01, + "lyapunov": 1.5425858250664324, + "grad_norm": 0.15981682340967285, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 86.84639286994934 + }, + { + "epoch": 146, + "train_loss": 5.319918049621582, + "train_acc": 0.01, + "test_loss": 6.390152045440674, + "test_acc": 0.01, + "lyapunov": 1.5434830600343397, + "grad_norm": 0.1664732055156118, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 86.84289050102234 + }, + { + "epoch": 147, + "train_loss": 5.319467689819336, + "train_acc": 0.01, + "test_loss": 6.383955514526368, + "test_acc": 0.01, + "lyapunov": 1.5429968952827746, + "grad_norm": 0.16425908204350428, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 86.85825252532959 + }, + { + "epoch": 148, + "train_loss": 5.319666849975586, + "train_acc": 0.01, + "test_loss": 6.379462463378906, + "test_acc": 0.01, + "lyapunov": 1.5432310299495298, + "grad_norm": 0.1579801299018272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 86.90520691871643 + }, + { + "epoch": 149, + "train_loss": 5.318641065368652, + "train_acc": 0.01, + "test_loss": 6.385379031372071, + "test_acc": 0.01, + "lyapunov": 1.542139550609052, + "grad_norm": 0.1606682447514192, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 86.85262036323547 + }, + { + "epoch": 150, + "train_loss": 5.31824127532959, + "train_acc": 0.01, + "test_loss": 6.3839585464477535, + "test_acc": 0.01, + "lyapunov": 1.5416794817161072, + "grad_norm": 0.158152508901321, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 86.85510659217834 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 5.138188102111816, + "train_acc": 0.01868, + "test_loss": 4.947204817199707, + "test_acc": 0.0102, + "lyapunov": 2.4137888052274503, + "grad_norm": 5.2278560060516135, + "grad_max_sv": 4.450121748447418, + "grad_min_sv": 8.815894619873532e-08, + "grad_condition": 73462066.87031136, + "lr": 0.0009998903417374227, + "time_sec": 132.20039796829224 + }, + { + "epoch": 2, + "train_loss": 4.910357958526611, + "train_acc": 0.01772, + "test_loss": 4.974901505279541, + "test_acc": 0.0098, + "lyapunov": 1.8470725811960753, + "grad_norm": 5.334406474785501, + "grad_max_sv": 2.416768090268306, + "grad_min_sv": 4.845974281257734e-08, + "grad_condition": 156669965.4219852, + "lr": 0.0009995614150494292, + "time_sec": 132.20067143440247 + }, + { + "epoch": 3, + "train_loss": 4.789790082702637, + "train_acc": 0.01798, + "test_loss": 5.241659837341309, + "test_acc": 0.0152, + "lyapunov": 1.7693803560398425, + "grad_norm": 2.284868849655408, + "grad_max_sv": 1.6544225737452507, + "grad_min_sv": 3.7601093222372486e-08, + "grad_condition": 74204967.95678225, + "lr": 0.0009990133642141358, + "time_sec": 132.1939766407013 + }, + { + "epoch": 4, + "train_loss": 4.734155084381103, + "train_acc": 0.02012, + "test_loss": 4.736255917358398, + "test_acc": 0.01, + "lyapunov": 1.7185492494222148, + "grad_norm": 1.2969402037730182, + "grad_max_sv": 0.8527256481349468, + "grad_min_sv": 1.8718222001719557e-08, + "grad_condition": 3595934101.1830444, + "lr": 0.0009982464296247522, + "time_sec": 132.19083857536316 + }, + { + "epoch": 5, + "train_loss": 4.7501870367431644, + "train_acc": 0.01884, + "test_loss": 4.7008225593566895, + "test_acc": 0.01, + "lyapunov": 1.6784742927307363, + "grad_norm": 0.7283552366408743, + "grad_max_sv": 0.540743650496006, + "grad_min_sv": 6.143185659736945e-09, + "grad_condition": 20744559298.222054, + "lr": 0.0009972609476841367, + "time_sec": 132.19878315925598 + }, + { + "epoch": 6, + "train_loss": 4.777885425109863, + "train_acc": 0.01988, + "test_loss": 4.847038110351562, + "test_acc": 0.0163, + "lyapunov": 1.6714926692835814, + "grad_norm": 0.6978205109559127, + "grad_max_sv": 0.4112665578722954, + "grad_min_sv": 2.577558256003571e-09, + "grad_condition": 19293368058.44477, + "lr": 0.000996057350657239, + "time_sec": 132.22198057174683 + }, + { + "epoch": 7, + "train_loss": 4.817885786285401, + "train_acc": 0.01714, + "test_loss": 4.907033979797363, + "test_acc": 0.01, + "lyapunov": 1.6430019908548925, + "grad_norm": 0.538957530048536, + "grad_max_sv": 0.3900473590940237, + "grad_min_sv": 8.011143267797137e-10, + "grad_condition": 53520886424.44034, + "lr": 0.000994636166481494, + "time_sec": 132.18847823143005 + }, + { + "epoch": 8, + "train_loss": 4.866279851989746, + "train_acc": 0.01534, + "test_loss": 4.982185540008545, + "test_acc": 0.01, + "lyapunov": 1.622301935234948, + "grad_norm": 0.44743905036756576, + "grad_max_sv": 0.2975618153810501, + "grad_min_sv": 4.042702856767639e-12, + "grad_condition": 98919396245.19788, + "lr": 0.0009929980185352525, + "time_sec": 132.2019805908203 + }, + { + "epoch": 9, + "train_loss": 4.93485692489624, + "train_acc": 0.01296, + "test_loss": 5.24868205871582, + "test_acc": 0.01, + "lyapunov": 1.6329893876829416, + "grad_norm": 1.2710312604148948, + "grad_max_sv": 0.23227821737527848, + "grad_min_sv": 1.210631234207371e-10, + "grad_condition": 132050856729.70003, + "lr": 0.0009911436253643444, + "time_sec": 132.25901436805725 + }, + { + "epoch": 10, + "train_loss": 4.94441338470459, + "train_acc": 0.01662, + "test_loss": 4.9677005256652835, + "test_acc": 0.01, + "lyapunov": 1.6191197569717837, + "grad_norm": 0.5849346197331, + "grad_max_sv": 0.3103320188820362, + "grad_min_sv": 2.4441770461207573e-12, + "grad_condition": 142331552698.27188, + "lr": 0.0009890738003669028, + "time_sec": 132.24092388153076 + }, + { + "epoch": 11, + "train_loss": 4.978343018798828, + "train_acc": 0.01596, + "test_loss": 4.759020803070069, + "test_acc": 0.01, + "lyapunov": 1.607335550096029, + "grad_norm": 0.4668173173890936, + "grad_max_sv": 0.3271574813872576, + "grad_min_sv": 1.5228846413101469e-12, + "grad_condition": 163401069045.22977, + "lr": 0.00098678945143658, + "time_sec": 132.22342109680176 + }, + { + "epoch": 12, + "train_loss": 5.019883101348877, + "train_acc": 0.0154, + "test_loss": 4.942817668151855, + "test_acc": 0.01, + "lyapunov": 1.6049258376631286, + "grad_norm": 0.5264008543358515, + "grad_max_sv": 0.28871628642082214, + "grad_min_sv": 1.5745550588117867e-12, + "grad_condition": 141150096351.00974, + "lr": 0.0009842915805643154, + "time_sec": 132.17593479156494 + }, + { + "epoch": 13, + "train_loss": 5.055773426361084, + "train_acc": 0.01454, + "test_loss": 5.201871238708496, + "test_acc": 0.01, + "lyapunov": 1.5926724358287918, + "grad_norm": 0.5496018971790103, + "grad_max_sv": 0.3235856369137764, + "grad_min_sv": 1.5836317227272346e-12, + "grad_condition": 172440841867.61472, + "lr": 0.000981581283398829, + "time_sec": 132.19917631149292 + }, + { + "epoch": 14, + "train_loss": 5.1001338768005375, + "train_acc": 0.01374, + "test_loss": 6.031500621795654, + "test_acc": 0.01, + "lyapunov": 1.5873235156164145, + "grad_norm": 0.5347429702370289, + "grad_max_sv": 0.31967496164143083, + "grad_min_sv": 8.416411018220654e-13, + "grad_condition": 202636437942.46396, + "lr": 0.0009786597487660333, + "time_sec": 132.17077159881592 + }, + { + "epoch": 15, + "train_loss": 5.135957703857422, + "train_acc": 0.0124, + "test_loss": 5.739520129394531, + "test_acc": 0.01, + "lyapunov": 1.574544443803675, + "grad_norm": 0.6201173127889323, + "grad_max_sv": 0.32148296795785425, + "grad_min_sv": 1.8768859669293263e-11, + "grad_condition": 245017227140.7776, + "lr": 0.0009755282581475766, + "time_sec": 132.19619607925415 + }, + { + "epoch": 16, + "train_loss": 5.19933319366455, + "train_acc": 0.01332, + "test_loss": 6.819124224090576, + "test_acc": 0.01, + "lyapunov": 1.588761254649638, + "grad_norm": 0.7105947575125269, + "grad_max_sv": 0.3380855549126863, + "grad_min_sv": 1.0418656496584723e-09, + "grad_condition": 212026412736.4578, + "lr": 0.0009721881851187403, + "time_sec": 132.16591668128967 + }, + { + "epoch": 17, + "train_loss": 5.203327436523438, + "train_acc": 0.0158, + "test_loss": 7.679113117980957, + "test_acc": 0.01, + "lyapunov": 1.5917936892765563, + "grad_norm": 0.5687429696625533, + "grad_max_sv": 0.3429654061794281, + "grad_min_sv": 1.0535516342595844e-12, + "grad_condition": 208532854744.75134, + "lr": 0.0009686409947459456, + "time_sec": 132.23086404800415 + }, + { + "epoch": 18, + "train_loss": 5.227132577209472, + "train_acc": 0.01704, + "test_loss": 5.224352997589111, + "test_acc": 0.01, + "lyapunov": 1.590573813604272, + "grad_norm": 0.6501892893379347, + "grad_max_sv": 0.3389496423304081, + "grad_min_sv": 1.4743293232017855e-12, + "grad_condition": 179354691955.7947, + "lr": 0.0009648882429441254, + "time_sec": 132.17126607894897 + }, + { + "epoch": 19, + "train_loss": 5.268917711486816, + "train_acc": 0.01574, + "test_loss": 5.769149468994141, + "test_acc": 0.01, + "lyapunov": 1.5737659489102376, + "grad_norm": 0.7756970175394374, + "grad_max_sv": 0.33219469264149665, + "grad_min_sv": 1.3963206987681851e-12, + "grad_condition": 166340823567.4583, + "lr": 0.00096093157579425, + "time_sec": 132.3532431125641 + }, + { + "epoch": 20, + "train_loss": 5.388035034332275, + "train_acc": 0.01436, + "test_loss": 4.855289517211914, + "test_acc": 0.01, + "lyapunov": 1.6196008579200492, + "grad_norm": 3.273774802278225, + "grad_max_sv": 0.3476741284544914, + "grad_min_sv": 1.7954016832837687e-12, + "grad_condition": 163400108512.08075, + "lr": 0.0009567727288213001, + "time_sec": 132.18322706222534 + }, + { + "epoch": 21, + "train_loss": 5.477730575561523, + "train_acc": 0.0119, + "test_loss": 5.734935963439941, + "test_acc": 0.01, + "lyapunov": 1.6737558759386888, + "grad_norm": 0.7316822390940195, + "grad_max_sv": 0.41190238408744334, + "grad_min_sv": 1.4433235299420839e-09, + "grad_condition": 115946317202.22786, + "lr": 0.0009524135262330095, + "time_sec": 132.2254023551941 + }, + { + "epoch": 22, + "train_loss": 5.39889496673584, + "train_acc": 0.01078, + "test_loss": 4.648544214630127, + "test_acc": 0.01, + "lyapunov": 1.5598208084130836, + "grad_norm": 0.9136530334274789, + "grad_max_sv": 0.5729864671826362, + "grad_min_sv": 6.476590619830438e-09, + "grad_condition": 6966838482.173167, + "lr": 0.0009478558801197061, + "time_sec": 132.19873070716858 + }, + { + "epoch": 23, + "train_loss": 5.343370434570312, + "train_acc": 0.00934, + "test_loss": 4.6330633590698245, + "test_acc": 0.01, + "lyapunov": 1.544742999174406, + "grad_norm": 0.5447776712180945, + "grad_max_sv": 0.3971055932343006, + "grad_min_sv": 3.0723113141940555e-09, + "grad_condition": 10360739417.615135, + "lr": 0.000943101789615607, + "time_sec": 132.19472217559814 + }, + { + "epoch": 24, + "train_loss": 5.354044710998535, + "train_acc": 0.0106, + "test_loss": 4.758938900756836, + "test_acc": 0.01, + "lyapunov": 1.5540964880867687, + "grad_norm": 0.49799279906750776, + "grad_max_sv": 0.32289256788790227, + "grad_min_sv": 1.215183540768495e-09, + "grad_condition": 84138259698.76875, + "lr": 0.0009381533400219313, + "time_sec": 132.18565702438354 + }, + { + "epoch": 25, + "train_loss": 5.34166207687378, + "train_acc": 0.00954, + "test_loss": 4.616498927307129, + "test_acc": 0.01, + "lyapunov": 1.5548294105798082, + "grad_norm": 0.35224887377867997, + "grad_max_sv": 0.2050650805234909, + "grad_min_sv": 4.310481015545377e-10, + "grad_condition": 137027644012.72295, + "lr": 0.0009330127018922189, + "time_sec": 132.1707353591919 + }, + { + "epoch": 26, + "train_loss": 5.329114703826904, + "train_acc": 0.00962, + "test_loss": 4.608516737365723, + "test_acc": 0.01, + "lyapunov": 1.5478018071035595, + "grad_norm": 0.41152400199519606, + "grad_max_sv": 0.14391734022647143, + "grad_min_sv": 6.406558234285353e-11, + "grad_condition": 129739564652.99875, + "lr": 0.000927682130080253, + "time_sec": 132.1968698501587 + }, + { + "epoch": 27, + "train_loss": 5.333489670410156, + "train_acc": 0.0092, + "test_loss": 4.6180027542114255, + "test_acc": 0.01, + "lyapunov": 1.553746031068475, + "grad_norm": 0.395956424199356, + "grad_max_sv": 0.077771030459553, + "grad_min_sv": 3.8469886311157825e-16, + "grad_condition": 77730702472.31937, + "lr": 0.0009221639627510072, + "time_sec": 132.21505451202393 + }, + { + "epoch": 28, + "train_loss": 5.351277679595947, + "train_acc": 0.00942, + "test_loss": 4.7706145118713374, + "test_acc": 0.01, + "lyapunov": 1.564519799273947, + "grad_norm": 0.8070388432556335, + "grad_max_sv": 0.08204491948708892, + "grad_min_sv": 1.474816693019578e-15, + "grad_condition": 81835653341.89993, + "lr": 0.0009164606203550494, + "time_sec": 132.19659543037415 + }, + { + "epoch": 29, + "train_loss": 5.322618664703369, + "train_acc": 0.00872, + "test_loss": 5.576576512145996, + "test_acc": 0.01, + "lyapunov": 1.5448476557841386, + "grad_norm": 1.8211987840238726, + "grad_max_sv": 0.006918648211285472, + "grad_min_sv": 3.854375422071664e-17, + "grad_condition": 6914688932.083499, + "lr": 0.0009105746045668516, + "time_sec": 132.10211896896362 + }, + { + "epoch": 30, + "train_loss": 5.332048937377929, + "train_acc": 0.00954, + "test_loss": 5.513208132934571, + "test_acc": 0.01, + "lyapunov": 1.550695708035813, + "grad_norm": 1.1118821287367113, + "grad_max_sv": 0.019531637569889425, + "grad_min_sv": 1.0689040165877983e-16, + "grad_condition": 19522880900.554432, + "lr": 0.0009045084971874733, + "time_sec": 132.11267638206482 + }, + { + "epoch": 31, + "train_loss": 5.326176876373291, + "train_acc": 0.00918, + "test_loss": 5.386148994445801, + "test_acc": 0.01, + "lyapunov": 1.5464019519288827, + "grad_norm": 0.5069935542454341, + "grad_max_sv": 0.054698918107897045, + "grad_min_sv": 3.7386723818325515e-15, + "grad_condition": 54294495664.74051, + "lr": 0.0008982649590120977, + "time_sec": 132.1673936843872 + }, + { + "epoch": 32, + "train_loss": 5.322083574829102, + "train_acc": 0.01, + "test_loss": 4.707043412780762, + "test_acc": 0.01, + "lyapunov": 1.544298157667565, + "grad_norm": 0.42554937796746406, + "grad_max_sv": 0.04392390437424183, + "grad_min_sv": 2.3012806918730416e-16, + "grad_condition": 43903285638.58012, + "lr": 0.0008918467286629196, + "time_sec": 132.18636798858643 + }, + { + "epoch": 33, + "train_loss": 5.328476766967773, + "train_acc": 0.00958, + "test_loss": 5.157709109497071, + "test_acc": 0.01, + "lyapunov": 1.5494323496318534, + "grad_norm": 0.3948590073220422, + "grad_max_sv": 0.046419868059456346, + "grad_min_sv": 3.920453121241332e-16, + "grad_condition": 46387197576.51258, + "lr": 0.0008852566213878943, + "time_sec": 132.14906311035156 + }, + { + "epoch": 34, + "train_loss": 5.335322699432373, + "train_acc": 0.00912, + "test_loss": 4.63318578491211, + "test_acc": 0.01, + "lyapunov": 1.5560249096292365, + "grad_norm": 0.3431205276749687, + "grad_max_sv": 0.006924860086292029, + "grad_min_sv": 0.0, + "grad_condition": 6924860086.292028, + "lr": 0.000878497527825878, + "time_sec": 132.08630466461182 + }, + { + "epoch": 35, + "train_loss": 5.323294322357178, + "train_acc": 0.00884, + "test_loss": 4.605205520629883, + "test_acc": 0.01, + "lyapunov": 1.5453313735439955, + "grad_norm": 0.3024735245825119, + "grad_max_sv": 0.028930858056992293, + "grad_min_sv": 0.0, + "grad_condition": 28930858056.9923, + "lr": 0.000871572412738697, + "time_sec": 132.11405229568481 + }, + { + "epoch": 36, + "train_loss": 5.324136592712402, + "train_acc": 0.00868, + "test_loss": 4.605186470031739, + "test_acc": 0.01, + "lyapunov": 1.5469522064604113, + "grad_norm": 0.361219602695028, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107055, + "time_sec": 132.07118153572083 + }, + { + "epoch": 37, + "train_loss": 5.3209700448608395, + "train_acc": 0.00892, + "test_loss": 4.665984559631347, + "test_acc": 0.01, + "lyapunov": 1.5437110970392252, + "grad_norm": 0.3116729659195542, + "grad_max_sv": 0.020941149955615402, + "grad_min_sv": 0.0, + "grad_condition": 20941149955.6154, + "lr": 0.0008572363398164014, + "time_sec": 132.09318017959595 + }, + { + "epoch": 38, + "train_loss": 5.325020372467041, + "train_acc": 0.00874, + "test_loss": 4.663543145751953, + "test_acc": 0.01, + "lyapunov": 1.5469195239074396, + "grad_norm": 0.305903104498294, + "grad_max_sv": 0.024645538488402962, + "grad_min_sv": 0.0, + "grad_condition": 24645538488.40296, + "lr": 0.0008498316702566826, + "time_sec": 132.18630456924438 + }, + { + "epoch": 39, + "train_loss": 5.326424997558593, + "train_acc": 0.00926, + "test_loss": 4.710470159912109, + "test_acc": 0.01, + "lyapunov": 1.5472500924868962, + "grad_norm": 0.3315518442712431, + "grad_max_sv": 0.03559725326485932, + "grad_min_sv": 4.71556170988084e-33, + "grad_condition": 35597253264.859314, + "lr": 0.0008422735529643442, + "time_sec": 132.1392993927002 + }, + { + "epoch": 40, + "train_loss": 5.33426462966919, + "train_acc": 0.0096, + "test_loss": 4.689337516784668, + "test_acc": 0.01, + "lyapunov": 1.555562095568918, + "grad_norm": 0.3795118996689083, + "grad_max_sv": 0.028565633855760098, + "grad_min_sv": 0.0, + "grad_condition": 28565633855.760094, + "lr": 0.0008345653031794289, + "time_sec": 132.12650513648987 + }, + { + "epoch": 41, + "train_loss": 5.329594454193115, + "train_acc": 0.00962, + "test_loss": 4.677967825317383, + "test_acc": 0.01, + "lyapunov": 1.5518201217626977, + "grad_norm": 0.35226874238427724, + "grad_max_sv": 0.031289939628914, + "grad_min_sv": 0.0, + "grad_condition": 31289939628.913994, + "lr": 0.0008267103019950526, + "time_sec": 132.1842393875122 + }, + { + "epoch": 42, + "train_loss": 5.334290416412354, + "train_acc": 0.00948, + "test_loss": 4.7127025581359865, + "test_acc": 0.01, + "lyapunov": 1.55599294903943, + "grad_norm": 0.3150010140468872, + "grad_max_sv": 0.008952232170850038, + "grad_min_sv": 0.0, + "grad_condition": 8952232170.850039, + "lr": 0.0008187119948743447, + "time_sec": 132.16592741012573 + }, + { + "epoch": 43, + "train_loss": 5.330992495574951, + "train_acc": 0.00988, + "test_loss": 4.715853765869141, + "test_acc": 0.01, + "lyapunov": 1.5526615817223668, + "grad_norm": 0.32555598147833537, + "grad_max_sv": 0.025627513602375983, + "grad_min_sv": 0.0, + "grad_condition": 25627513602.375984, + "lr": 0.000810573890139155, + "time_sec": 132.1376314163208 + }, + { + "epoch": 44, + "train_loss": 5.342441840667725, + "train_acc": 0.009, + "test_loss": 4.814597158813476, + "test_acc": 0.01, + "lyapunov": 1.5608167011109764, + "grad_norm": 0.3705555621106487, + "grad_max_sv": 0.012277775909751654, + "grad_min_sv": 0.0, + "grad_condition": 12277775909.751654, + "lr": 0.0008022995574311873, + "time_sec": 132.10150909423828 + }, + { + "epoch": 45, + "train_loss": 5.330550760803223, + "train_acc": 0.00922, + "test_loss": 4.82506159362793, + "test_acc": 0.01, + "lyapunov": 1.552602043846989, + "grad_norm": 0.41377353743023604, + "grad_max_sv": 0.012684891000390053, + "grad_min_sv": 0.0, + "grad_condition": 12684891000.390053, + "lr": 0.0007938926261462363, + "time_sec": 132.13983154296875 + }, + { + "epoch": 46, + "train_loss": 5.346614602661133, + "train_acc": 0.00908, + "test_loss": 4.75941802444458, + "test_acc": 0.01, + "lyapunov": 1.565407470059212, + "grad_norm": 0.6666703677397586, + "grad_max_sv": 0.0006472387816756964, + "grad_min_sv": 0.0, + "grad_condition": 647238781.6756964, + "lr": 0.0007853567838422158, + "time_sec": 132.07343816757202 + }, + { + "epoch": 47, + "train_loss": 5.32947943145752, + "train_acc": 0.00898, + "test_loss": 4.822898616027832, + "test_acc": 0.01, + "lyapunov": 1.5532338082637933, + "grad_norm": 1.2230171967365666, + "grad_max_sv": 0.011994929099455477, + "grad_min_sv": 0.0, + "grad_condition": 11994929099.455475, + "lr": 0.0007766957746216719, + "time_sec": 132.13085794448853 + }, + { + "epoch": 48, + "train_loss": 5.3338893869018555, + "train_acc": 0.0092, + "test_loss": 4.843168624877929, + "test_acc": 0.01, + "lyapunov": 1.5537122622170412, + "grad_norm": 0.9355731457390791, + "grad_max_sv": 0.06068415185436606, + "grad_min_sv": 1.5809611954265782e-13, + "grad_condition": 46398377146.35246, + "lr": 0.0007679133974894982, + "time_sec": 132.11377477645874 + }, + { + "epoch": 49, + "train_loss": 5.340212641296387, + "train_acc": 0.00966, + "test_loss": 4.808492147827148, + "test_acc": 0.01, + "lyapunov": 1.556026118490702, + "grad_norm": 0.3770156243368251, + "grad_max_sv": 0.1463914191350341, + "grad_min_sv": 3.152568142733814e-13, + "grad_condition": 121760995460.97897, + "lr": 0.000759013504686565, + "time_sec": 132.2147512435913 + }, + { + "epoch": 50, + "train_loss": 5.332282363586426, + "train_acc": 0.0096, + "test_loss": 4.743034214782715, + "test_acc": 0.01, + "lyapunov": 1.5524532118111924, + "grad_norm": 0.3116530039130024, + "grad_max_sv": 0.10226385369896888, + "grad_min_sv": 3.0737180401130916e-15, + "grad_condition": 101953179254.12184, + "lr": 0.0007499999999999998, + "time_sec": 132.22958421707153 + }, + { + "epoch": 51, + "train_loss": 5.3305883631896975, + "train_acc": 0.00952, + "test_loss": 4.724603568267822, + "test_acc": 0.01, + "lyapunov": 1.5518521100968656, + "grad_norm": 0.3241210515609679, + "grad_max_sv": 0.08684249427169562, + "grad_min_sv": 6.328097683852358e-16, + "grad_condition": 86783867952.95651, + "lr": 0.0007408768370508575, + "time_sec": 132.19532179832458 + }, + { + "epoch": 52, + "train_loss": 5.332131455078125, + "train_acc": 0.00964, + "test_loss": 4.782391441345215, + "test_acc": 0.01, + "lyapunov": 1.5542255048556706, + "grad_norm": 0.32295260623787486, + "grad_max_sv": 0.077319351490587, + "grad_min_sv": 1.8882153881334225e-23, + "grad_condition": 77319351489.28442, + "lr": 0.0007316480175599307, + "time_sec": 132.21878457069397 + }, + { + "epoch": 53, + "train_loss": 5.333503689270019, + "train_acc": 0.00936, + "test_loss": 4.801981381225586, + "test_acc": 0.01, + "lyapunov": 1.5553877649404813, + "grad_norm": 0.31562374196715365, + "grad_max_sv": 0.06292690904811024, + "grad_min_sv": 1.0573404187094843e-32, + "grad_condition": 62926909048.110245, + "lr": 0.0007223175895924635, + "time_sec": 132.18660378456116 + }, + { + "epoch": 54, + "train_loss": 5.333852608795166, + "train_acc": 0.00896, + "test_loss": 4.810883659362793, + "test_acc": 0.01, + "lyapunov": 1.5559345386217318, + "grad_norm": 0.2781133113627033, + "grad_max_sv": 0.06129774982109666, + "grad_min_sv": 2.855284741973353e-38, + "grad_condition": 61297749821.09666, + "lr": 0.0007128896457825361, + "time_sec": 132.2198555469513 + }, + { + "epoch": 55, + "train_loss": 5.3339955087280275, + "train_acc": 0.00996, + "test_loss": 4.7569840606689455, + "test_acc": 0.01, + "lyapunov": 1.5569808833739336, + "grad_norm": 0.2566538491911281, + "grad_max_sv": 0.05556260636076331, + "grad_min_sv": 0.0, + "grad_condition": 55562606360.763306, + "lr": 0.0007033683215378998, + "time_sec": 132.21158051490784 + }, + { + "epoch": 56, + "train_loss": 5.3385576313781735, + "train_acc": 0.00902, + "test_loss": 4.754797148895264, + "test_acc": 0.01, + "lyapunov": 1.5597065461566075, + "grad_norm": 0.27047724542782614, + "grad_max_sv": 0.0640806739218533, + "grad_min_sv": 1.2193818893472967e-19, + "grad_condition": 64080664167.18032, + "lr": 0.0006937577932260512, + "time_sec": 132.19129037857056 + }, + { + "epoch": 57, + "train_loss": 5.334184418182373, + "train_acc": 0.0103, + "test_loss": 4.782689431762695, + "test_acc": 0.01, + "lyapunov": 1.556523521842859, + "grad_norm": 0.29259577039987816, + "grad_max_sv": 0.07542139226570725, + "grad_min_sv": 8.844145625485828e-17, + "grad_condition": 75415188010.71097, + "lr": 0.0006840622763423388, + "time_sec": 132.19539308547974 + }, + { + "epoch": 58, + "train_loss": 5.3342736126708985, + "train_acc": 0.00902, + "test_loss": 4.792922207641602, + "test_acc": 0.01, + "lyapunov": 1.556638328925423, + "grad_norm": 0.27651642414760924, + "grad_max_sv": 0.07381959799677133, + "grad_min_sv": 5.679191077750394e-25, + "grad_condition": 73819597996.72554, + "lr": 0.0006742860236609073, + "time_sec": 132.1646604537964 + }, + { + "epoch": 59, + "train_loss": 5.3365766784667965, + "train_acc": 0.00976, + "test_loss": 4.764654750061035, + "test_acc": 0.01, + "lyapunov": 1.559028771527283, + "grad_norm": 0.32368701389084115, + "grad_max_sv": 0.06830886630341411, + "grad_min_sv": 3.373213421233685e-18, + "grad_condition": 68308625699.52162, + "lr": 0.0006644333233692913, + "time_sec": 132.20315170288086 + }, + { + "epoch": 60, + "train_loss": 5.3372549061584476, + "train_acc": 0.00876, + "test_loss": 4.821174919128418, + "test_acc": 0.01, + "lyapunov": 1.5602548335824171, + "grad_norm": 0.3407373955115073, + "grad_max_sv": 0.05221205474808812, + "grad_min_sv": 0.0, + "grad_condition": 52212054748.08812, + "lr": 0.0006545084971874734, + "time_sec": 132.21871399879456 + }, + { + "epoch": 61, + "train_loss": 5.340573087158203, + "train_acc": 0.01004, + "test_loss": 4.814465225219727, + "test_acc": 0.01, + "lyapunov": 1.5639353786283137, + "grad_norm": 0.33445562902063697, + "grad_max_sv": 0.04306556633673608, + "grad_min_sv": 0.0, + "grad_condition": 43065566336.736084, + "lr": 0.0006445158984722354, + "time_sec": 132.16924214363098 + }, + { + "epoch": 62, + "train_loss": 5.343714674987793, + "train_acc": 0.0095, + "test_loss": 4.770381900024414, + "test_acc": 0.01, + "lyapunov": 1.566701197258347, + "grad_norm": 0.41600975854497274, + "grad_max_sv": 0.0407159102614969, + "grad_min_sv": 0.0, + "grad_condition": 40715910261.4969, + "lr": 0.0006344599103076324, + "time_sec": 132.14849257469177 + }, + { + "epoch": 63, + "train_loss": 5.340150414581299, + "train_acc": 0.00942, + "test_loss": 4.809834826660156, + "test_acc": 0.01, + "lyapunov": 1.5634946268232888, + "grad_norm": 0.4244404576721166, + "grad_max_sv": 0.046563083119690415, + "grad_min_sv": 0.0, + "grad_condition": 46563083119.690414, + "lr": 0.0006243449435824269, + "time_sec": 132.2440116405487 + }, + { + "epoch": 64, + "train_loss": 5.352264609527588, + "train_acc": 0.00968, + "test_loss": 4.719538593292237, + "test_acc": 0.01, + "lyapunov": 1.5730204283428924, + "grad_norm": 0.6484058447373605, + "grad_max_sv": 0.06881329002790153, + "grad_min_sv": 4.045636130762067e-11, + "grad_condition": 57057261120.16382, + "lr": 0.0006141754350553275, + "time_sec": 132.1377170085907 + }, + { + "epoch": 65, + "train_loss": 5.345465493011474, + "train_acc": 0.0095, + "test_loss": 4.807828170013428, + "test_acc": 0.01, + "lyapunov": 1.5668580141823616, + "grad_norm": 0.26811037405238153, + "grad_max_sv": 0.0895066935569048, + "grad_min_sv": 8.923440580685122e-16, + "grad_condition": 89405744261.32881, + "lr": 0.0006039558454088793, + "time_sec": 132.18963503837585 + }, + { + "epoch": 66, + "train_loss": 5.339095722351074, + "train_acc": 0.00992, + "test_loss": 4.79014116973877, + "test_acc": 0.01, + "lyapunov": 1.562422338044247, + "grad_norm": 0.2418134006072333, + "grad_max_sv": 0.04957848088815808, + "grad_min_sv": 0.0, + "grad_condition": 49578480888.15808, + "lr": 0.000593690657292862, + "time_sec": 132.18193554878235 + }, + { + "epoch": 67, + "train_loss": 5.339143208312988, + "train_acc": 0.00878, + "test_loss": 4.846720378875732, + "test_acc": 0.01, + "lyapunov": 1.5629626052153995, + "grad_norm": 0.23211875934280046, + "grad_max_sv": 0.04276521084830165, + "grad_min_sv": 0.0, + "grad_condition": 42765210848.30165, + "lr": 0.0005833843733580507, + "time_sec": 132.21098923683167 + }, + { + "epoch": 68, + "train_loss": 5.341660294799805, + "train_acc": 0.00926, + "test_loss": 4.93624571685791, + "test_acc": 0.01, + "lyapunov": 1.5647895671522525, + "grad_norm": 0.25226724531209027, + "grad_max_sv": 0.04243421019054949, + "grad_min_sv": 0.0, + "grad_condition": 42434210190.54949, + "lr": 0.0005730415142812054, + "time_sec": 132.18032026290894 + }, + { + "epoch": 69, + "train_loss": 5.3429354066467285, + "train_acc": 0.00964, + "test_loss": 4.963717977905273, + "test_acc": 0.01, + "lyapunov": 1.5658744921159866, + "grad_norm": 0.26387680813745, + "grad_max_sv": 0.044778031017631295, + "grad_min_sv": 0.0, + "grad_condition": 44778031017.63129, + "lr": 0.0005626666167821517, + "time_sec": 132.16022729873657 + }, + { + "epoch": 70, + "train_loss": 5.344523805389405, + "train_acc": 0.0091, + "test_loss": 4.810392481231689, + "test_acc": 0.01, + "lyapunov": 1.5665253672148565, + "grad_norm": 0.31439106456207916, + "grad_max_sv": 0.03966532703489065, + "grad_min_sv": 0.0, + "grad_condition": 39665327034.890656, + "lr": 0.0005522642316338265, + "time_sec": 132.1867744922638 + }, + { + "epoch": 71, + "train_loss": 5.346882275238037, + "train_acc": 0.00912, + "test_loss": 4.778971862792969, + "test_acc": 0.01, + "lyapunov": 1.568563460998828, + "grad_norm": 0.20952619953519083, + "grad_max_sv": 0.03776215887628496, + "grad_min_sv": 0.0, + "grad_condition": 37762158876.28496, + "lr": 0.0005418389216661573, + "time_sec": 132.18875670433044 + }, + { + "epoch": 72, + "train_loss": 5.353162684936524, + "train_acc": 0.00818, + "test_loss": 4.764224601745606, + "test_acc": 0.01, + "lyapunov": 1.5738632352760686, + "grad_norm": 0.21224191589739633, + "grad_max_sv": 0.02936461050994694, + "grad_min_sv": 0.0, + "grad_condition": 29364610509.94694, + "lr": 0.0005313952597646563, + "time_sec": 132.16054940223694 + }, + { + "epoch": 73, + "train_loss": 5.341572857055664, + "train_acc": 0.00934, + "test_loss": 4.764213945770264, + "test_acc": 0.01, + "lyapunov": 1.5656722372450183, + "grad_norm": 0.17131578138452824, + "grad_max_sv": 0.026255082851275802, + "grad_min_sv": 0.0, + "grad_condition": 26255082851.275803, + "lr": 0.0005209378268645994, + "time_sec": 132.11386466026306 + }, + { + "epoch": 74, + "train_loss": 5.34148181564331, + "train_acc": 0.00884, + "test_loss": 4.787430990600586, + "test_acc": 0.01, + "lyapunov": 1.5657289049509542, + "grad_norm": 0.20416273686306285, + "grad_max_sv": 0.03651727414689958, + "grad_min_sv": 0.0, + "grad_condition": 36517274146.89958, + "lr": 0.0005104712099416781, + "time_sec": 132.2018940448761 + }, + { + "epoch": 75, + "train_loss": 5.341119176330566, + "train_acc": 0.00948, + "test_loss": 4.769783227539063, + "test_acc": 0.01, + "lyapunov": 1.5654692183370176, + "grad_norm": 0.17080101166392242, + "grad_max_sv": 0.030799029115587472, + "grad_min_sv": 0.0, + "grad_condition": 30799029115.587475, + "lr": 0.0004999999999999996, + "time_sec": 132.12539839744568 + }, + { + "epoch": 76, + "train_loss": 5.345115729370117, + "train_acc": 0.00946, + "test_loss": 4.734894322967529, + "test_acc": 0.01, + "lyapunov": 1.5686149972174175, + "grad_norm": 0.18659944764551223, + "grad_max_sv": 0.012125130696222185, + "grad_min_sv": 0.0, + "grad_condition": 12125130696.222187, + "lr": 0.0004895287900583212, + "time_sec": 132.09123158454895 + }, + { + "epoch": 77, + "train_loss": 5.338459321289062, + "train_acc": 0.0094, + "test_loss": 4.7248460479736325, + "test_acc": 0.01, + "lyapunov": 1.5630621724116527, + "grad_norm": 0.176032379936258, + "grad_max_sv": 0.013429323118180037, + "grad_min_sv": 0.0, + "grad_condition": 13429323118.180037, + "lr": 0.0004790621731353997, + "time_sec": 132.07102465629578 + }, + { + "epoch": 78, + "train_loss": 5.345072369537354, + "train_acc": 0.00896, + "test_loss": 4.745542971801758, + "test_acc": 0.01, + "lyapunov": 1.5687669668051287, + "grad_norm": 0.2223520771526132, + "grad_max_sv": 0.00913866781629622, + "grad_min_sv": 0.0, + "grad_condition": 9138667816.29622, + "lr": 0.000468604740235343, + "time_sec": 132.31091713905334 + }, + { + "epoch": 79, + "train_loss": 5.338468246459961, + "train_acc": 0.00906, + "test_loss": 4.776708003234863, + "test_acc": 0.01, + "lyapunov": 1.5631554016981588, + "grad_norm": 0.18439021291098787, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00045816107833384175, + "time_sec": 132.1099407672882 + }, + { + "epoch": 80, + "train_loss": 5.3392803921508785, + "train_acc": 0.0085, + "test_loss": 4.756961068725586, + "test_acc": 0.01, + "lyapunov": 1.5640239118005308, + "grad_norm": 0.1670344381602521, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004477357683661729, + "time_sec": 132.07850074768066 + }, + { + "epoch": 81, + "train_loss": 5.338647942352295, + "train_acc": 0.00896, + "test_loss": 4.738301519775391, + "test_acc": 0.01, + "lyapunov": 1.563378708441849, + "grad_norm": 0.15920625845312916, + "grad_max_sv": 0.012282294360920787, + "grad_min_sv": 0.0, + "grad_condition": 12282294360.920788, + "lr": 0.00043733338321784746, + "time_sec": 132.09186792373657 + }, + { + "epoch": 82, + "train_loss": 5.339479166107178, + "train_acc": 0.0092, + "test_loss": 4.714014392089844, + "test_acc": 0.01, + "lyapunov": 1.5639294709086113, + "grad_norm": 0.1731138874132484, + "grad_max_sv": 0.03721864921972155, + "grad_min_sv": 0.0, + "grad_condition": 37218649219.72156, + "lr": 0.0004269584857187939, + "time_sec": 132.1542615890503 + }, + { + "epoch": 83, + "train_loss": 5.345089318237305, + "train_acc": 0.00928, + "test_loss": 4.7151237457275395, + "test_acc": 0.01, + "lyapunov": 1.5680857643751842, + "grad_norm": 0.1866415261285155, + "grad_max_sv": 0.03729230999015272, + "grad_min_sv": 0.0, + "grad_condition": 37292309990.152725, + "lr": 0.0004166156266419484, + "time_sec": 132.18493914604187 + }, + { + "epoch": 84, + "train_loss": 5.345381183319092, + "train_acc": 0.00918, + "test_loss": 4.68825431060791, + "test_acc": 0.01, + "lyapunov": 1.568592563309633, + "grad_norm": 0.1882901347639973, + "grad_max_sv": 0.021022121235728265, + "grad_min_sv": 0.0, + "grad_condition": 21022121235.728264, + "lr": 0.0004063093427071373, + "time_sec": 132.12367796897888 + }, + { + "epoch": 85, + "train_loss": 5.340999842681884, + "train_acc": 0.00992, + "test_loss": 4.716685279846192, + "test_acc": 0.01, + "lyapunov": 1.5657545608632706, + "grad_norm": 0.20177951961733773, + "grad_max_sv": 0.01230331021361053, + "grad_min_sv": 0.0, + "grad_condition": 12303310213.610529, + "lr": 0.0003960441545911199, + "time_sec": 132.0947766304016 + }, + { + "epoch": 86, + "train_loss": 5.344697039794922, + "train_acc": 0.00906, + "test_loss": 4.770621002197266, + "test_acc": 0.01, + "lyapunov": 1.5692900818632083, + "grad_norm": 0.20891700571465235, + "grad_max_sv": 0.013876684103161096, + "grad_min_sv": 0.0, + "grad_condition": 13876684103.161098, + "lr": 0.0003858245649446718, + "time_sec": 132.09650421142578 + }, + { + "epoch": 87, + "train_loss": 5.346022133178711, + "train_acc": 0.00958, + "test_loss": 4.825743739318848, + "test_acc": 0.01, + "lyapunov": 1.5695690389179513, + "grad_norm": 0.23167422762918993, + "grad_max_sv": 0.0037465339992195368, + "grad_min_sv": 0.0, + "grad_condition": 3746533999.219537, + "lr": 0.00037565505641757235, + "time_sec": 132.0917444229126 + }, + { + "epoch": 88, + "train_loss": 5.346828841705323, + "train_acc": 0.00876, + "test_loss": 4.960531255340576, + "test_acc": 0.01, + "lyapunov": 1.5696865573258656, + "grad_norm": 0.1785675731490032, + "grad_max_sv": 0.005577366659417748, + "grad_min_sv": 0.0, + "grad_condition": 5577366659.417749, + "lr": 0.00036554008969236695, + "time_sec": 132.0870282649994 + }, + { + "epoch": 89, + "train_loss": 5.342154947357177, + "train_acc": 0.00878, + "test_loss": 4.975327129364014, + "test_acc": 0.01, + "lyapunov": 1.5665336716205567, + "grad_norm": 0.16793525655934358, + "grad_max_sv": 0.00797480964101851, + "grad_min_sv": 0.0, + "grad_condition": 7974809641.018509, + "lr": 0.0003554841015277638, + "time_sec": 132.12742161750793 + }, + { + "epoch": 90, + "train_loss": 5.346710361175537, + "train_acc": 0.00918, + "test_loss": 4.953879835510254, + "test_acc": 0.01, + "lyapunov": 1.5700483614831324, + "grad_norm": 0.18433712454121046, + "grad_max_sv": 0.012014600727707148, + "grad_min_sv": 0.0, + "grad_condition": 12014600727.707148, + "lr": 0.000345491502812526, + "time_sec": 132.0858714580536 + }, + { + "epoch": 91, + "train_loss": 5.341808082733154, + "train_acc": 0.00856, + "test_loss": 5.010934870910645, + "test_acc": 0.01, + "lyapunov": 1.566529265754973, + "grad_norm": 0.1758408454253638, + "grad_max_sv": 0.003343093441799283, + "grad_min_sv": 0.0, + "grad_condition": 3343093441.799283, + "lr": 0.0003355666766307081, + "time_sec": 132.0660150051117 + }, + { + "epoch": 92, + "train_loss": 5.351253204956055, + "train_acc": 0.00918, + "test_loss": 5.023424221801758, + "test_acc": 0.01, + "lyapunov": 1.5723978284069948, + "grad_norm": 0.17788255301821657, + "grad_max_sv": 0.014162034029141068, + "grad_min_sv": 0.0, + "grad_condition": 14162034029.141071, + "lr": 0.00032571397633909225, + "time_sec": 132.10221076011658 + }, + { + "epoch": 93, + "train_loss": 5.347586841278076, + "train_acc": 0.00884, + "test_loss": 4.963154336547851, + "test_acc": 0.01, + "lyapunov": 1.5719817017045472, + "grad_norm": 0.2369860248003482, + "grad_max_sv": 0.004905311437323689, + "grad_min_sv": 0.0, + "grad_condition": 4905311437.323689, + "lr": 0.00031593772365766094, + "time_sec": 132.1323049068451 + }, + { + "epoch": 94, + "train_loss": 5.343141855926514, + "train_acc": 0.00848, + "test_loss": 4.921149578094482, + "test_acc": 0.01, + "lyapunov": 1.5679576765850682, + "grad_norm": 0.1602509536119079, + "grad_max_sv": 0.019888732209801675, + "grad_min_sv": 0.0, + "grad_condition": 19888732209.801674, + "lr": 0.0003062422067739483, + "time_sec": 132.1422688961029 + }, + { + "epoch": 95, + "train_loss": 5.343594031066894, + "train_acc": 0.00906, + "test_loss": 4.905448650360108, + "test_acc": 0.01, + "lyapunov": 1.5682554074260584, + "grad_norm": 0.17541418565565223, + "grad_max_sv": 0.009854677692055702, + "grad_min_sv": 0.0, + "grad_condition": 9854677692.055702, + "lr": 0.00029663167846209965, + "time_sec": 132.11462831497192 + }, + { + "epoch": 96, + "train_loss": 5.341661099700928, + "train_acc": 0.00938, + "test_loss": 4.896561671447754, + "test_acc": 0.01, + "lyapunov": 1.566467627539964, + "grad_norm": 0.18126299601196125, + "grad_max_sv": 0.013893446559086442, + "grad_min_sv": 0.0, + "grad_condition": 13893446559.086445, + "lr": 0.00028711035421746345, + "time_sec": 132.183189868927 + }, + { + "epoch": 97, + "train_loss": 5.341162901000977, + "train_acc": 0.00872, + "test_loss": 4.906980642700195, + "test_acc": 0.01, + "lyapunov": 1.5660171655132948, + "grad_norm": 0.18389173404235654, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00027768241040753615, + "time_sec": 132.1316442489624 + }, + { + "epoch": 98, + "train_loss": 5.340904234008789, + "train_acc": 0.0087, + "test_loss": 4.880604965209961, + "test_acc": 0.01, + "lyapunov": 1.5657722669489242, + "grad_norm": 0.16941469287847527, + "grad_max_sv": 0.0025681605096906424, + "grad_min_sv": 0.0, + "grad_condition": 2568160509.6906424, + "lr": 0.00026835198244006903, + "time_sec": 132.0789442062378 + }, + { + "epoch": 99, + "train_loss": 5.342495626068115, + "train_acc": 0.00838, + "test_loss": 4.8667546737670895, + "test_acc": 0.01, + "lyapunov": 1.56737110986734, + "grad_norm": 0.2098824320936581, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002591231629491421, + "time_sec": 132.06338381767273 + }, + { + "epoch": 100, + "train_loss": 5.341140549468994, + "train_acc": 0.00882, + "test_loss": 4.923036535644531, + "test_acc": 0.01, + "lyapunov": 1.5660716353170097, + "grad_norm": 0.16309007942968, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002499999999999997, + "time_sec": 132.0798683166504 + }, + { + "epoch": 101, + "train_loss": 5.367573778076172, + "train_acc": 0.00942, + "test_loss": 4.8419834274291995, + "test_acc": 0.01, + "lyapunov": 1.5839073743356769, + "grad_norm": 0.17849770970668777, + "grad_max_sv": 0.006972884247079492, + "grad_min_sv": 0.0, + "grad_condition": 6972884247.079493, + "lr": 0.00024098649531343477, + "time_sec": 132.07039666175842 + }, + { + "epoch": 102, + "train_loss": 5.3430040219116215, + "train_acc": 0.00878, + "test_loss": 4.867986113739014, + "test_acc": 0.01, + "lyapunov": 1.5680094472587567, + "grad_norm": 0.17231990573343864, + "grad_max_sv": 0.002580128749832511, + "grad_min_sv": 0.0, + "grad_condition": 2580128749.832511, + "lr": 0.0002320866025105016, + "time_sec": 132.0873384475708 + }, + { + "epoch": 103, + "train_loss": 5.342889985504151, + "train_acc": 0.00874, + "test_loss": 4.840346334075928, + "test_acc": 0.01, + "lyapunov": 1.5678095716954497, + "grad_norm": 0.18603931144131847, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002233042253783278, + "time_sec": 132.0669243335724 + }, + { + "epoch": 104, + "train_loss": 5.345595389709473, + "train_acc": 0.00906, + "test_loss": 4.82763256072998, + "test_acc": 0.01, + "lyapunov": 1.5700134941379127, + "grad_norm": 0.17962506167998699, + "grad_max_sv": 0.0006658073514699935, + "grad_min_sv": 0.0, + "grad_condition": 665807351.4699936, + "lr": 0.000214643216157784, + "time_sec": 132.0985701084137 + }, + { + "epoch": 105, + "train_loss": 5.354534033508301, + "train_acc": 0.00898, + "test_loss": 4.813229525756836, + "test_acc": 0.01, + "lyapunov": 1.5754887292452175, + "grad_norm": 0.2002013331480914, + "grad_max_sv": 0.004350297572091222, + "grad_min_sv": 0.0, + "grad_condition": 4350297572.091222, + "lr": 0.00020610737385376332, + "time_sec": 132.09686851501465 + }, + { + "epoch": 106, + "train_loss": 5.3426032342529295, + "train_acc": 0.00804, + "test_loss": 4.823688924407959, + "test_acc": 0.01, + "lyapunov": 1.567502071485495, + "grad_norm": 0.177797147662824, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019770044256881242, + "time_sec": 132.1264684200287 + }, + { + "epoch": 107, + "train_loss": 5.349622652893067, + "train_acc": 0.00884, + "test_loss": 4.844220027923584, + "test_acc": 0.01, + "lyapunov": 1.571947547176, + "grad_norm": 0.16292252305474791, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001894261098608447, + "time_sec": 132.10880613327026 + }, + { + "epoch": 108, + "train_loss": 5.345900168304444, + "train_acc": 0.00918, + "test_loss": 4.840348344421387, + "test_acc": 0.01, + "lyapunov": 1.5703127265281385, + "grad_norm": 0.17468920430563006, + "grad_max_sv": 0.0029470635578036307, + "grad_min_sv": 0.0, + "grad_condition": 2947063557.803631, + "lr": 0.000181288005125655, + "time_sec": 132.11736822128296 + }, + { + "epoch": 109, + "train_loss": 5.345384422454834, + "train_acc": 0.00874, + "test_loss": 4.8622421981811526, + "test_acc": 0.01, + "lyapunov": 1.5698327935870042, + "grad_norm": 0.21177276682423293, + "grad_max_sv": 0.0007724121678620577, + "grad_min_sv": 0.0, + "grad_condition": 772412167.8620577, + "lr": 0.0001732896980049473, + "time_sec": 132.07746076583862 + }, + { + "epoch": 110, + "train_loss": 5.342875657653809, + "train_acc": 0.00912, + "test_loss": 4.856573393249512, + "test_acc": 0.01, + "lyapunov": 1.5677888875117387, + "grad_norm": 0.16084383685322373, + "grad_max_sv": 0.013493797415867448, + "grad_min_sv": 0.0, + "grad_condition": 13493797415.867447, + "lr": 0.00016543469682057076, + "time_sec": 132.08074021339417 + }, + { + "epoch": 111, + "train_loss": 5.355080330505371, + "train_acc": 0.00822, + "test_loss": 4.830239296722412, + "test_acc": 0.01, + "lyapunov": 1.5756983775312028, + "grad_norm": 0.1959747570871713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 132.07752227783203 + }, + { + "epoch": 112, + "train_loss": 5.342228624572754, + "train_acc": 0.00892, + "test_loss": 4.84301993560791, + "test_acc": 0.01, + "lyapunov": 1.5673401697212472, + "grad_norm": 0.14204259013530204, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 132.06180357933044 + }, + { + "epoch": 113, + "train_loss": 5.3422714726257325, + "train_acc": 0.00928, + "test_loss": 4.821010319519043, + "test_acc": 0.01, + "lyapunov": 1.5673690311744084, + "grad_norm": 0.1572610072392831, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 132.09343099594116 + }, + { + "epoch": 114, + "train_loss": 5.3444528672790526, + "train_acc": 0.0086, + "test_loss": 4.83043311843872, + "test_acc": 0.01, + "lyapunov": 1.5691952199277366, + "grad_norm": 0.15397404749427382, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 132.07117557525635 + }, + { + "epoch": 115, + "train_loss": 5.342576068572998, + "train_acc": 0.00892, + "test_loss": 4.83036664352417, + "test_acc": 0.01, + "lyapunov": 1.5677011345353578, + "grad_norm": 0.13531666387620547, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 132.1246190071106 + }, + { + "epoch": 116, + "train_loss": 5.342390079040527, + "train_acc": 0.009, + "test_loss": 4.818707986450195, + "test_acc": 0.01, + "lyapunov": 1.5674945427023845, + "grad_norm": 0.11755267765049923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 132.10427331924438 + }, + { + "epoch": 117, + "train_loss": 5.346578267517089, + "train_acc": 0.00914, + "test_loss": 4.808753877258301, + "test_acc": 0.01, + "lyapunov": 1.571015379617891, + "grad_norm": 0.14739866079910954, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 132.09667372703552 + }, + { + "epoch": 118, + "train_loss": 5.341421314849853, + "train_acc": 0.00888, + "test_loss": 4.8178321044921875, + "test_acc": 0.01, + "lyapunov": 1.5664617289667544, + "grad_norm": 0.15196598686273202, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010815327133708009, + "time_sec": 132.09818243980408 + }, + { + "epoch": 119, + "train_loss": 5.342278069915771, + "train_acc": 0.00846, + "test_loss": 4.809390866088867, + "test_acc": 0.01, + "lyapunov": 1.5673773797881572, + "grad_norm": 0.17015255493793316, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010173504098790182, + "time_sec": 132.13357877731323 + }, + { + "epoch": 120, + "train_loss": 5.341155296783447, + "train_acc": 0.00878, + "test_loss": 4.819783433532715, + "test_acc": 0.01, + "lyapunov": 1.56620217955021, + "grad_norm": 0.13456226708171515, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 132.0805094242096 + }, + { + "epoch": 121, + "train_loss": 5.344341220397949, + "train_acc": 0.00942, + "test_loss": 4.812504239654541, + "test_acc": 0.01, + "lyapunov": 1.5690714410503808, + "grad_norm": 0.15635175889858405, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 132.10770106315613 + }, + { + "epoch": 122, + "train_loss": 5.341316756591797, + "train_acc": 0.00872, + "test_loss": 4.791230865478516, + "test_acc": 0.01, + "lyapunov": 1.5663795004720273, + "grad_norm": 0.13120586242402146, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 132.12851881980896 + }, + { + "epoch": 123, + "train_loss": 5.343846289520264, + "train_acc": 0.00826, + "test_loss": 4.791252892303467, + "test_acc": 0.01, + "lyapunov": 1.5686628943514032, + "grad_norm": 0.12574649548787997, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 132.11882972717285 + }, + { + "epoch": 124, + "train_loss": 5.341886834716797, + "train_acc": 0.00924, + "test_loss": 4.7894229957580565, + "test_acc": 0.01, + "lyapunov": 1.566991005712153, + "grad_norm": 0.12125233233583547, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 132.1242277622223 + }, + { + "epoch": 125, + "train_loss": 5.341545905151367, + "train_acc": 0.00844, + "test_loss": 4.781455255126953, + "test_acc": 0.01, + "lyapunov": 1.566652334559604, + "grad_norm": 0.11877593044343822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 132.1204969882965 + }, + { + "epoch": 126, + "train_loss": 5.343738833465576, + "train_acc": 0.0089, + "test_loss": 4.782108512115479, + "test_acc": 0.01, + "lyapunov": 1.5686877148840435, + "grad_norm": 0.14685494918897216, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 132.1582751274109 + }, + { + "epoch": 127, + "train_loss": 5.340985955505371, + "train_acc": 0.0095, + "test_loss": 4.780940398406982, + "test_acc": 0.01, + "lyapunov": 1.5660363987583639, + "grad_norm": 0.11589911056077733, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.6898210384392595e-05, + "time_sec": 132.11265683174133 + }, + { + "epoch": 128, + "train_loss": 5.343754200744629, + "train_acc": 0.00968, + "test_loss": 4.7895281066894535, + "test_acc": 0.01, + "lyapunov": 1.5686014985184535, + "grad_norm": 0.14358686229070586, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 132.08578968048096 + }, + { + "epoch": 129, + "train_loss": 5.345564033660889, + "train_acc": 0.00894, + "test_loss": 4.789863642883301, + "test_acc": 0.01, + "lyapunov": 1.5702618372714734, + "grad_norm": 0.15311883643219684, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.7586473766990294e-05, + "time_sec": 132.07862830162048 + }, + { + "epoch": 130, + "train_loss": 5.342584033355713, + "train_acc": 0.00908, + "test_loss": 4.779020539093017, + "test_acc": 0.01, + "lyapunov": 1.5677639367940175, + "grad_norm": 0.15329364714098923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.32272711786996e-05, + "time_sec": 132.16318249702454 + }, + { + "epoch": 131, + "train_loss": 5.341682634429931, + "train_acc": 0.00944, + "test_loss": 4.782007501220703, + "test_acc": 0.01, + "lyapunov": 1.5667803564949718, + "grad_norm": 0.13761474702045567, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 132.10979580879211 + }, + { + "epoch": 132, + "train_loss": 5.342693343200684, + "train_acc": 0.00874, + "test_loss": 4.785680311584473, + "test_acc": 0.01, + "lyapunov": 1.5677480008596045, + "grad_norm": 0.14227357176692468, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 132.14933609962463 + }, + { + "epoch": 133, + "train_loss": 5.339641748504639, + "train_acc": 0.00948, + "test_loss": 4.7827409004211425, + "test_acc": 0.01, + "lyapunov": 1.5646268839726363, + "grad_norm": 0.11276908599413558, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 132.07238721847534 + }, + { + "epoch": 134, + "train_loss": 5.341200107269287, + "train_acc": 0.00926, + "test_loss": 4.787122599792481, + "test_acc": 0.01, + "lyapunov": 1.566309593217757, + "grad_norm": 0.11577298218878175, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7811814881259484e-05, + "time_sec": 132.08721160888672 + }, + { + "epoch": 135, + "train_loss": 5.341790512847901, + "train_acc": 0.0089, + "test_loss": 4.78599192199707, + "test_acc": 0.01, + "lyapunov": 1.5669051058152144, + "grad_norm": 0.11406538673568321, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.4471741852423218e-05, + "time_sec": 132.13204169273376 + }, + { + "epoch": 136, + "train_loss": 5.342709656066894, + "train_acc": 0.0095, + "test_loss": 4.784429030609131, + "test_acc": 0.01, + "lyapunov": 1.5678098799322573, + "grad_norm": 0.1301621255904577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 132.10533571243286 + }, + { + "epoch": 137, + "train_loss": 5.341824940795899, + "train_acc": 0.00922, + "test_loss": 4.7872933067321775, + "test_acc": 0.01, + "lyapunov": 1.5669465708305768, + "grad_norm": 0.11590542924579983, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 132.09704732894897 + }, + { + "epoch": 138, + "train_loss": 5.341511313171386, + "train_acc": 0.00974, + "test_loss": 4.7792837577819824, + "test_acc": 0.01, + "lyapunov": 1.5666430996507026, + "grad_norm": 0.11256165029712978, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568445e-05, + "time_sec": 132.12034392356873 + }, + { + "epoch": 139, + "train_loss": 5.341457148132324, + "train_acc": 0.00972, + "test_loss": 4.780789426422119, + "test_acc": 0.01, + "lyapunov": 1.5665654376949496, + "grad_norm": 0.10204898242159913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.3210548563419845e-05, + "time_sec": 132.14241123199463 + }, + { + "epoch": 140, + "train_loss": 5.3405984710693355, + "train_acc": 0.00948, + "test_loss": 4.778655993652344, + "test_acc": 0.01, + "lyapunov": 1.5656854539271206, + "grad_norm": 0.12809073544865285, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.0926199633097203e-05, + "time_sec": 132.08009314537048 + }, + { + "epoch": 141, + "train_loss": 5.340534744262695, + "train_acc": 0.0091, + "test_loss": 4.780472738647461, + "test_acc": 0.01, + "lyapunov": 1.5655692928587384, + "grad_norm": 0.10313184635997721, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.856374635655688e-06, + "time_sec": 132.0838325023651 + }, + { + "epoch": 142, + "train_loss": 5.340677046051026, + "train_acc": 0.00992, + "test_loss": 4.781814497375488, + "test_acc": 0.01, + "lyapunov": 1.5657385788915101, + "grad_norm": 0.10334450883525552, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 132.11706686019897 + }, + { + "epoch": 143, + "train_loss": 5.341100224914551, + "train_acc": 0.01, + "test_loss": 4.7812304672241215, + "test_acc": 0.01, + "lyapunov": 1.5661775379839455, + "grad_norm": 0.1264085338408933, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.3638335185058295e-06, + "time_sec": 132.12464785575867 + }, + { + "epoch": 144, + "train_loss": 5.341793058776855, + "train_acc": 0.01, + "test_loss": 4.78042247467041, + "test_acc": 0.01, + "lyapunov": 1.5669281586356785, + "grad_norm": 0.09436149541511535, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761114e-06, + "time_sec": 132.1470422744751 + }, + { + "epoch": 145, + "train_loss": 5.349506974182129, + "train_acc": 0.01, + "test_loss": 4.78042266998291, + "test_acc": 0.01, + "lyapunov": 1.5731076300906404, + "grad_norm": 0.1178995174742038, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 132.09918355941772 + }, + { + "epoch": 146, + "train_loss": 5.342189108886719, + "train_acc": 0.01, + "test_loss": 4.781454308319092, + "test_acc": 0.01, + "lyapunov": 1.5673414352909683, + "grad_norm": 0.09081347881139741, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 132.10713911056519 + }, + { + "epoch": 147, + "train_loss": 5.341546408996582, + "train_acc": 0.01, + "test_loss": 4.781454162597656, + "test_acc": 0.01, + "lyapunov": 1.5666629228445574, + "grad_norm": 0.09019678612458548, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 132.1311194896698 + }, + { + "epoch": 148, + "train_loss": 5.341715382995606, + "train_acc": 0.01, + "test_loss": 4.782687770843506, + "test_acc": 0.01, + "lyapunov": 1.5668335332894874, + "grad_norm": 0.09070167126439822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 132.13174676895142 + }, + { + "epoch": 149, + "train_loss": 5.342021694946289, + "train_acc": 0.01, + "test_loss": 4.782687942504883, + "test_acc": 0.01, + "lyapunov": 1.5671642540056077, + "grad_norm": 0.09082797851606526, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 132.09515190124512 + }, + { + "epoch": 150, + "train_loss": 5.339607263183594, + "train_acc": 0.01, + "test_loss": 4.782687832641601, + "test_acc": 0.01, + "lyapunov": 1.5645978752609409, + "grad_norm": 0.090368422289998, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 132.06873154640198 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 5.170418347930908, + "train_acc": 0.01482, + "test_loss": 4.874806223297119, + "test_acc": 0.0107, + "lyapunov": 2.4393880626429683, + "grad_norm": 5.345734057581178, + "grad_max_sv": 4.483905690908432, + "grad_min_sv": 8.954973220731688e-08, + "grad_condition": 129025189.7290709, + "lr": 0.0009998903417374227, + "time_sec": 177.46578431129456 + }, + { + "epoch": 2, + "train_loss": 4.886182316741944, + "train_acc": 0.01718, + "test_loss": 4.80269637298584, + "test_acc": 0.0102, + "lyapunov": 1.9971744041613606, + "grad_norm": 3.4433992950689616, + "grad_max_sv": 2.739058768749237, + "grad_min_sv": 5.745658385736263e-08, + "grad_condition": 84538548.49489692, + "lr": 0.0009995614150494292, + "time_sec": 177.3906273841858 + }, + { + "epoch": 3, + "train_loss": 4.783107050323486, + "train_acc": 0.01528, + "test_loss": 4.738721482086182, + "test_acc": 0.01, + "lyapunov": 1.8048184826550886, + "grad_norm": 2.047885898328211, + "grad_max_sv": 1.4787879481911659, + "grad_min_sv": 3.2768289852033726e-08, + "grad_condition": 566050825.5696664, + "lr": 0.0009990133642141358, + "time_sec": 177.4175295829773 + }, + { + "epoch": 4, + "train_loss": 4.751416029052734, + "train_acc": 0.01606, + "test_loss": 4.630446166992187, + "test_acc": 0.01, + "lyapunov": 1.707960840991086, + "grad_norm": 1.4476075782979456, + "grad_max_sv": 0.836699303984642, + "grad_min_sv": 1.4332362594222718e-08, + "grad_condition": 24679971260.08811, + "lr": 0.0009982464296247522, + "time_sec": 177.5156271457672 + }, + { + "epoch": 5, + "train_loss": 4.7807122309875485, + "train_acc": 0.01428, + "test_loss": 4.622669477844238, + "test_acc": 0.01, + "lyapunov": 1.7041781695602496, + "grad_norm": 1.050316146928851, + "grad_max_sv": 0.498383151658345, + "grad_min_sv": 3.796087105340611e-11, + "grad_condition": 139863529616.57062, + "lr": 0.0009972609476841367, + "time_sec": 177.43440508842468 + }, + { + "epoch": 6, + "train_loss": 4.8388256774902345, + "train_acc": 0.01308, + "test_loss": 4.649810864257812, + "test_acc": 0.01, + "lyapunov": 1.6965309613196136, + "grad_norm": 0.6788898927695144, + "grad_max_sv": 0.42595611810684203, + "grad_min_sv": 1.5628448124239113e-12, + "grad_condition": 206494283007.18826, + "lr": 0.000996057350657239, + "time_sec": 177.44785737991333 + }, + { + "epoch": 7, + "train_loss": 4.8986459965515134, + "train_acc": 0.01186, + "test_loss": 4.708990380859375, + "test_acc": 0.01, + "lyapunov": 1.7017012535763518, + "grad_norm": 0.48731250728585107, + "grad_max_sv": 0.33343438915908336, + "grad_min_sv": 5.53908882765212e-13, + "grad_condition": 254093723126.4781, + "lr": 0.000994636166481494, + "time_sec": 177.37777757644653 + }, + { + "epoch": 8, + "train_loss": 4.943858919830323, + "train_acc": 0.01104, + "test_loss": 5.26636118927002, + "test_acc": 0.01, + "lyapunov": 1.7182561540237777, + "grad_norm": 0.48999999014626605, + "grad_max_sv": 0.25608402006328107, + "grad_min_sv": 9.286946471073546e-14, + "grad_condition": 242351728116.98883, + "lr": 0.0009929980185352525, + "time_sec": 177.387188911438 + }, + { + "epoch": 9, + "train_loss": 4.979513124542236, + "train_acc": 0.01144, + "test_loss": 5.497952555084228, + "test_acc": 0.01, + "lyapunov": 1.7062027213518576, + "grad_norm": 0.42079758157884545, + "grad_max_sv": 0.2485219370573759, + "grad_min_sv": 1.885935727798404e-14, + "grad_condition": 245798317000.96808, + "lr": 0.0009911436253643444, + "time_sec": 177.38124251365662 + }, + { + "epoch": 10, + "train_loss": 5.0166656953430175, + "train_acc": 0.01076, + "test_loss": 4.605617906188965, + "test_acc": 0.01, + "lyapunov": 1.6932507491172732, + "grad_norm": 0.420321050632811, + "grad_max_sv": 0.2404270452912897, + "grad_min_sv": 9.577507932467198e-25, + "grad_condition": 240427045291.03647, + "lr": 0.0009890738003669028, + "time_sec": 177.3316354751587 + }, + { + "epoch": 11, + "train_loss": 5.0578450691223145, + "train_acc": 0.0114, + "test_loss": 4.605764473724365, + "test_acc": 0.01, + "lyapunov": 1.6895873580137482, + "grad_norm": 0.49178900029145406, + "grad_max_sv": 0.26607779785990715, + "grad_min_sv": 5.082064100170326e-21, + "grad_condition": 266077796409.95917, + "lr": 0.00098678945143658, + "time_sec": 177.35666227340698 + }, + { + "epoch": 12, + "train_loss": 5.092576569976806, + "train_acc": 0.01182, + "test_loss": 4.60662777633667, + "test_acc": 0.01, + "lyapunov": 1.6848897119922102, + "grad_norm": 0.6934058402651867, + "grad_max_sv": 0.34772998839616776, + "grad_min_sv": 1.6804705504564466e-13, + "grad_condition": 311062929805.2175, + "lr": 0.0009842915805643154, + "time_sec": 177.45647644996643 + }, + { + "epoch": 13, + "train_loss": 5.15109172531128, + "train_acc": 0.01186, + "test_loss": 4.608129429626465, + "test_acc": 0.01, + "lyapunov": 1.7015191944663788, + "grad_norm": 0.6846074227630976, + "grad_max_sv": 0.32766890451312064, + "grad_min_sv": 2.4578391875654614e-18, + "grad_condition": 327668018219.02893, + "lr": 0.000981581283398829, + "time_sec": 177.36489033699036 + }, + { + "epoch": 14, + "train_loss": 5.2939554736328125, + "train_acc": 0.0105, + "test_loss": 5.4404556137084965, + "test_acc": 0.01, + "lyapunov": 1.733636704247321, + "grad_norm": 2.0585577176009484, + "grad_max_sv": 0.5351610340178012, + "grad_min_sv": 6.043698563311623e-09, + "grad_condition": 125123088585.82278, + "lr": 0.0009786597487660333, + "time_sec": 177.41271114349365 + }, + { + "epoch": 15, + "train_loss": 5.339356228485108, + "train_acc": 0.01, + "test_loss": 5.634622732543946, + "test_acc": 0.01, + "lyapunov": 1.7321220276605747, + "grad_norm": 1.2474576611019448, + "grad_max_sv": 0.5749046392738819, + "grad_min_sv": 7.0887550281236514e-09, + "grad_condition": 17881232094.586456, + "lr": 0.0009755282581475766, + "time_sec": 177.42803382873535 + }, + { + "epoch": 16, + "train_loss": 5.213154935302734, + "train_acc": 0.00934, + "test_loss": 5.393290295410156, + "test_acc": 0.01, + "lyapunov": 1.5737932243615465, + "grad_norm": 0.46647750812487915, + "grad_max_sv": 0.27153575848788025, + "grad_min_sv": 1.5242528473500716e-09, + "grad_condition": 77568831402.5238, + "lr": 0.0009721881851187403, + "time_sec": 177.44743824005127 + }, + { + "epoch": 17, + "train_loss": 5.262427766418457, + "train_acc": 0.01022, + "test_loss": 4.925324077606201, + "test_acc": 0.01, + "lyapunov": 1.5760375502164408, + "grad_norm": 0.6268713729269668, + "grad_max_sv": 0.37553633116185664, + "grad_min_sv": 3.283041272093994e-09, + "grad_condition": 31488669291.59237, + "lr": 0.0009686409947459456, + "time_sec": 177.47271943092346 + }, + { + "epoch": 18, + "train_loss": 5.289855928497315, + "train_acc": 0.009, + "test_loss": 5.166483688354492, + "test_acc": 0.01, + "lyapunov": 1.5759224303238226, + "grad_norm": 0.4193761222715419, + "grad_max_sv": 0.26443815175443885, + "grad_min_sv": 1.8233460938992724e-09, + "grad_condition": 83574980362.08054, + "lr": 0.0009648882429441254, + "time_sec": 177.47960138320923 + }, + { + "epoch": 19, + "train_loss": 5.3201322650146485, + "train_acc": 0.0104, + "test_loss": 5.085500339508057, + "test_acc": 0.01, + "lyapunov": 1.5752660103161316, + "grad_norm": 0.35145865174653673, + "grad_max_sv": 0.1685528600588441, + "grad_min_sv": 5.831233779827688e-12, + "grad_condition": 106917248964.36707, + "lr": 0.00096093157579425, + "time_sec": 177.47897052764893 + }, + { + "epoch": 20, + "train_loss": 5.3543471484375, + "train_acc": 0.00944, + "test_loss": 5.246659634399414, + "test_acc": 0.01, + "lyapunov": 1.575355000812989, + "grad_norm": 0.5222583225299012, + "grad_max_sv": 0.10507027432322502, + "grad_min_sv": 7.849948703277934e-12, + "grad_condition": 72947428086.86752, + "lr": 0.0009567727288213001, + "time_sec": 177.43105292320251 + }, + { + "epoch": 21, + "train_loss": 5.354224435882569, + "train_acc": 0.00964, + "test_loss": 5.22655355682373, + "test_acc": 0.01, + "lyapunov": 1.577795330520786, + "grad_norm": 1.7696193327514464, + "grad_max_sv": 0.04788816105574369, + "grad_min_sv": 3.098440861051027e-15, + "grad_condition": 47515160306.08334, + "lr": 0.0009524135262330095, + "time_sec": 177.38868117332458 + }, + { + "epoch": 22, + "train_loss": 5.359287767486572, + "train_acc": 0.00866, + "test_loss": 5.144994302368164, + "test_acc": 0.01, + "lyapunov": 1.5772388463130083, + "grad_norm": 0.521407113480236, + "grad_max_sv": 0.16268486455082892, + "grad_min_sv": 1.0480323490539272e-12, + "grad_condition": 114294670712.50664, + "lr": 0.0009478558801197061, + "time_sec": 177.4581241607666 + }, + { + "epoch": 23, + "train_loss": 5.359366517028809, + "train_acc": 0.00984, + "test_loss": 5.14449934387207, + "test_acc": 0.01, + "lyapunov": 1.5788166193705995, + "grad_norm": 0.47520625785430726, + "grad_max_sv": 0.14188788905739785, + "grad_min_sv": 7.763794243203392e-13, + "grad_condition": 90263258979.91963, + "lr": 0.000943101789615607, + "time_sec": 177.4587037563324 + }, + { + "epoch": 24, + "train_loss": 5.363788315887451, + "train_acc": 0.00998, + "test_loss": 5.219554689025879, + "test_acc": 0.01, + "lyapunov": 1.5823031307181434, + "grad_norm": 0.45933897983850147, + "grad_max_sv": 0.1220944058150053, + "grad_min_sv": 8.70957522797587e-13, + "grad_condition": 79316477379.01375, + "lr": 0.0009381533400219313, + "time_sec": 177.45913338661194 + }, + { + "epoch": 25, + "train_loss": 5.365634008026123, + "train_acc": 0.0094, + "test_loss": 5.931232183074951, + "test_acc": 0.01, + "lyapunov": 1.5886532437161107, + "grad_norm": 0.43344753842757794, + "grad_max_sv": 0.017200349643826485, + "grad_min_sv": 1.0856606585118899e-15, + "grad_condition": 17078915149.903616, + "lr": 0.0009330127018922189, + "time_sec": 177.41433334350586 + }, + { + "epoch": 26, + "train_loss": 5.356309142761231, + "train_acc": 0.00862, + "test_loss": 5.939939945220948, + "test_acc": 0.01, + "lyapunov": 1.5817654276138071, + "grad_norm": 0.3773119512884375, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000927682130080253, + "time_sec": 177.42445373535156 + }, + { + "epoch": 27, + "train_loss": 5.356818426208496, + "train_acc": 0.00902, + "test_loss": 6.903866325378418, + "test_acc": 0.01, + "lyapunov": 1.5823859988576006, + "grad_norm": 0.4182139130247132, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009221639627510072, + "time_sec": 177.31799745559692 + }, + { + "epoch": 28, + "train_loss": 5.391271570739746, + "train_acc": 0.00976, + "test_loss": 5.460548217773438, + "test_acc": 0.01, + "lyapunov": 1.5841533107220973, + "grad_norm": 0.523477636772141, + "grad_max_sv": 0.3192333810031414, + "grad_min_sv": 2.9275436547182563e-09, + "grad_condition": 203519819.7178569, + "lr": 0.0009164606203550494, + "time_sec": 177.46226978302002 + }, + { + "epoch": 29, + "train_loss": 5.375988426361084, + "train_acc": 0.00942, + "test_loss": 5.342045057678223, + "test_acc": 0.01, + "lyapunov": 1.584143414521766, + "grad_norm": 0.4275297259535999, + "grad_max_sv": 0.29515107311308386, + "grad_min_sv": 1.5519966579252698e-09, + "grad_condition": 5083754884.994722, + "lr": 0.0009105746045668516, + "time_sec": 177.49048447608948 + }, + { + "epoch": 30, + "train_loss": 5.3762526119995115, + "train_acc": 0.00992, + "test_loss": 5.335840890502929, + "test_acc": 0.01, + "lyapunov": 1.5899017634599104, + "grad_norm": 0.46512305667247905, + "grad_max_sv": 0.24659424126148224, + "grad_min_sv": 2.2743761505509726e-12, + "grad_condition": 128688559196.96506, + "lr": 0.0009045084971874733, + "time_sec": 177.4821593761444 + }, + { + "epoch": 31, + "train_loss": 5.376188383178711, + "train_acc": 0.00954, + "test_loss": 5.376922852325439, + "test_acc": 0.01, + "lyapunov": 1.5906847974528437, + "grad_norm": 0.40698064884293045, + "grad_max_sv": 0.2344340980052948, + "grad_min_sv": 1.6077615594515009e-12, + "grad_condition": 119697955045.46411, + "lr": 0.0008982649590120977, + "time_sec": 177.51625323295593 + }, + { + "epoch": 32, + "train_loss": 5.373684441070557, + "train_acc": 0.00944, + "test_loss": 5.2473334838867185, + "test_acc": 0.01, + "lyapunov": 1.5879211066019199, + "grad_norm": 0.3720940356738668, + "grad_max_sv": 0.20825780294835566, + "grad_min_sv": 3.7871002154344376e-10, + "grad_condition": 69233328517.31859, + "lr": 0.0008918467286629196, + "time_sec": 177.5158429145813 + }, + { + "epoch": 33, + "train_loss": 5.369580058288574, + "train_acc": 0.00906, + "test_loss": 5.292366073608399, + "test_acc": 0.01, + "lyapunov": 1.5872128549439217, + "grad_norm": 0.36741579981339867, + "grad_max_sv": 0.16275404021143913, + "grad_min_sv": 3.5290433862002075e-13, + "grad_condition": 135525270524.32925, + "lr": 0.0008852566213878943, + "time_sec": 177.54218769073486 + }, + { + "epoch": 34, + "train_loss": 5.364965376129151, + "train_acc": 0.00946, + "test_loss": 5.301969288635254, + "test_acc": 0.01, + "lyapunov": 1.5879910906867298, + "grad_norm": 0.40385833520326136, + "grad_max_sv": 0.09459194829687476, + "grad_min_sv": 2.8168103316895143e-14, + "grad_condition": 90889833007.94754, + "lr": 0.000878497527825878, + "time_sec": 177.56994581222534 + }, + { + "epoch": 35, + "train_loss": 5.367663076019287, + "train_acc": 0.01036, + "test_loss": 5.347993537902832, + "test_acc": 0.01, + "lyapunov": 1.5875165621033105, + "grad_norm": 0.3132720633072883, + "grad_max_sv": 0.1425728589296341, + "grad_min_sv": 2.007235616198558e-14, + "grad_condition": 139708753283.34723, + "lr": 0.000871572412738697, + "time_sec": 177.49852347373962 + }, + { + "epoch": 36, + "train_loss": 5.370810558624267, + "train_acc": 0.01022, + "test_loss": 5.382797595214844, + "test_acc": 0.01, + "lyapunov": 1.5899634550294608, + "grad_norm": 0.30370352801828593, + "grad_max_sv": 0.16092172265052795, + "grad_min_sv": 4.485897177730539e-14, + "grad_condition": 154470905347.59918, + "lr": 0.0008644843137107055, + "time_sec": 177.4556074142456 + }, + { + "epoch": 37, + "train_loss": 5.384568545379639, + "train_acc": 0.01018, + "test_loss": 5.296823876953125, + "test_acc": 0.01, + "lyapunov": 1.5977905272217967, + "grad_norm": 0.266373358722962, + "grad_max_sv": 0.14979717023670674, + "grad_min_sv": 7.171554109546675e-14, + "grad_condition": 140879720678.9068, + "lr": 0.0008572363398164014, + "time_sec": 177.47119235992432 + }, + { + "epoch": 38, + "train_loss": 5.370039872131348, + "train_acc": 0.01028, + "test_loss": 5.444481262207031, + "test_acc": 0.01, + "lyapunov": 1.5899496447399755, + "grad_norm": 0.3096876275058644, + "grad_max_sv": 0.15369951017200947, + "grad_min_sv": 9.48148632228887e-14, + "grad_condition": 141735332362.74988, + "lr": 0.0008498316702566826, + "time_sec": 177.47467923164368 + }, + { + "epoch": 39, + "train_loss": 5.369657610778809, + "train_acc": 0.01024, + "test_loss": 5.390600685119629, + "test_acc": 0.01, + "lyapunov": 1.5896801790008155, + "grad_norm": 0.3108555116352423, + "grad_max_sv": 0.1614890903234482, + "grad_min_sv": 9.349701492890973e-14, + "grad_condition": 149566173130.64127, + "lr": 0.0008422735529643442, + "time_sec": 177.4328293800354 + }, + { + "epoch": 40, + "train_loss": 5.3822917242431645, + "train_acc": 0.0093, + "test_loss": 5.184299499511718, + "test_acc": 0.01, + "lyapunov": 1.6002484066102205, + "grad_norm": 0.24882538015615607, + "grad_max_sv": 0.04936090065166354, + "grad_min_sv": 6.934642584876431e-15, + "grad_condition": 48367763332.42686, + "lr": 0.0008345653031794289, + "time_sec": 177.37197065353394 + }, + { + "epoch": 41, + "train_loss": 5.373546744842529, + "train_acc": 0.00964, + "test_loss": 5.196872940063477, + "test_acc": 0.01, + "lyapunov": 1.5940455433047946, + "grad_norm": 0.2191391775580976, + "grad_max_sv": 0.09365939311683177, + "grad_min_sv": 1.5882716898553207e-15, + "grad_condition": 93493384840.27858, + "lr": 0.0008267103019950526, + "time_sec": 177.47450184822083 + }, + { + "epoch": 42, + "train_loss": 5.368149404144287, + "train_acc": 0.00874, + "test_loss": 5.14538009185791, + "test_acc": 0.01, + "lyapunov": 1.590694589383157, + "grad_norm": 0.22212098932442453, + "grad_max_sv": 0.10206865929067135, + "grad_min_sv": 2.3133067448522557e-15, + "grad_condition": 101840784421.61417, + "lr": 0.0008187119948743447, + "time_sec": 177.46074080467224 + }, + { + "epoch": 43, + "train_loss": 5.367429432983398, + "train_acc": 0.00892, + "test_loss": 5.233426832580567, + "test_acc": 0.01, + "lyapunov": 1.591343494327477, + "grad_norm": 0.23543493742380756, + "grad_max_sv": 0.08834987077862025, + "grad_min_sv": 5.952270134521069e-16, + "grad_condition": 88299394994.77124, + "lr": 0.000810573890139155, + "time_sec": 177.47843408584595 + }, + { + "epoch": 44, + "train_loss": 5.3674171057128905, + "train_acc": 0.00878, + "test_loss": 5.2093109710693355, + "test_acc": 0.01, + "lyapunov": 1.5915821013243303, + "grad_norm": 0.1990598758819041, + "grad_max_sv": 0.07391932224854827, + "grad_min_sv": 4.4595190727564784e-24, + "grad_condition": 73919322248.21725, + "lr": 0.0008022995574311873, + "time_sec": 177.49818992614746 + }, + { + "epoch": 45, + "train_loss": 5.367794494018555, + "train_acc": 0.00928, + "test_loss": 5.287538707733154, + "test_acc": 0.01, + "lyapunov": 1.5911102807125472, + "grad_norm": 0.23659112992785783, + "grad_max_sv": 0.0903646806254983, + "grad_min_sv": 2.044203469301876e-16, + "grad_condition": 90346621799.15851, + "lr": 0.0007938926261462363, + "time_sec": 177.41696000099182 + }, + { + "epoch": 46, + "train_loss": 5.376998851623535, + "train_acc": 0.00968, + "test_loss": 5.387116500854492, + "test_acc": 0.01, + "lyapunov": 1.5990899456736376, + "grad_norm": 0.2197692685737557, + "grad_max_sv": 0.09713525734841824, + "grad_min_sv": 1.4019481757585365e-15, + "grad_condition": 96996163686.28548, + "lr": 0.0007853567838422158, + "time_sec": 177.49049758911133 + }, + { + "epoch": 47, + "train_loss": 5.367403378448486, + "train_acc": 0.00904, + "test_loss": 5.152558483886719, + "test_acc": 0.01, + "lyapunov": 1.5909755915936912, + "grad_norm": 0.20354351323110018, + "grad_max_sv": 0.09671832993626595, + "grad_min_sv": 1.7095434307863795e-15, + "grad_condition": 96550067706.91704, + "lr": 0.0007766957746216719, + "time_sec": 177.440682888031 + }, + { + "epoch": 48, + "train_loss": 5.3691537622070316, + "train_acc": 0.009, + "test_loss": 5.103178468322754, + "test_acc": 0.01, + "lyapunov": 1.5926780014696633, + "grad_norm": 0.20080565969562386, + "grad_max_sv": 0.09486224502325058, + "grad_min_sv": 1.5909231309062707e-15, + "grad_condition": 94698098961.85327, + "lr": 0.0007679133974894982, + "time_sec": 177.45987153053284 + }, + { + "epoch": 49, + "train_loss": 5.367714106140137, + "train_acc": 0.0093, + "test_loss": 5.090968506622314, + "test_acc": 0.01, + "lyapunov": 1.5918231150683235, + "grad_norm": 0.21785142639292177, + "grad_max_sv": 0.08113837614655495, + "grad_min_sv": 1.754494669434441e-20, + "grad_condition": 81138374637.8342, + "lr": 0.000759013504686565, + "time_sec": 177.4056305885315 + }, + { + "epoch": 50, + "train_loss": 5.370782024841309, + "train_acc": 0.00932, + "test_loss": 5.1753190261840825, + "test_acc": 0.01, + "lyapunov": 1.5940865891059037, + "grad_norm": 0.20444563688390227, + "grad_max_sv": 0.07656172616407275, + "grad_min_sv": 2.696277782642207e-17, + "grad_condition": 76559876296.83813, + "lr": 0.0007499999999999998, + "time_sec": 177.39811301231384 + }, + { + "epoch": 51, + "train_loss": 5.368595368652343, + "train_acc": 0.0093, + "test_loss": 5.130212609863281, + "test_acc": 0.01, + "lyapunov": 1.5924014548206573, + "grad_norm": 0.2110899983642968, + "grad_max_sv": 0.09537852350622415, + "grad_min_sv": 2.1267942984928308e-15, + "grad_condition": 95172191574.00798, + "lr": 0.0007408768370508575, + "time_sec": 177.437908411026 + }, + { + "epoch": 52, + "train_loss": 5.368308511657715, + "train_acc": 0.0095, + "test_loss": 5.122430040740967, + "test_acc": 0.01, + "lyapunov": 1.5921837594503028, + "grad_norm": 0.22274269152603762, + "grad_max_sv": 0.09443439822643995, + "grad_min_sv": 1.7298829634439422e-15, + "grad_condition": 94273467470.68217, + "lr": 0.0007316480175599307, + "time_sec": 177.40578150749207 + }, + { + "epoch": 53, + "train_loss": 5.369929014434814, + "train_acc": 0.01008, + "test_loss": 5.085774603271484, + "test_acc": 0.01, + "lyapunov": 1.5937723787239446, + "grad_norm": 0.20295993227713832, + "grad_max_sv": 0.09454309139400721, + "grad_min_sv": 6.450947046344728e-16, + "grad_condition": 94479862712.68396, + "lr": 0.0007223175895924635, + "time_sec": 177.40152430534363 + }, + { + "epoch": 54, + "train_loss": 5.373923838806152, + "train_acc": 0.00952, + "test_loss": 5.077367216491699, + "test_acc": 0.01, + "lyapunov": 1.5964158435002007, + "grad_norm": 0.2154712788436217, + "grad_max_sv": 0.09458265658468008, + "grad_min_sv": 2.433638441241118e-15, + "grad_condition": 94352900611.06958, + "lr": 0.0007128896457825361, + "time_sec": 177.4158182144165 + }, + { + "epoch": 55, + "train_loss": 5.367228227386475, + "train_acc": 0.01046, + "test_loss": 5.130655932617188, + "test_acc": 0.01, + "lyapunov": 1.5918423345936534, + "grad_norm": 0.21491158085488357, + "grad_max_sv": 0.07526904288679362, + "grad_min_sv": 2.528540900743907e-16, + "grad_condition": 75246607455.27087, + "lr": 0.0007033683215378998, + "time_sec": 177.39575290679932 + }, + { + "epoch": 56, + "train_loss": 5.367513545684814, + "train_acc": 0.00982, + "test_loss": 5.064245509338379, + "test_acc": 0.01, + "lyapunov": 1.5908652431214862, + "grad_norm": 0.20945675875630285, + "grad_max_sv": 0.07764090299606323, + "grad_min_sv": 1.3979459340183045e-15, + "grad_condition": 77513163313.73227, + "lr": 0.0006937577932260512, + "time_sec": 177.41370344161987 + }, + { + "epoch": 57, + "train_loss": 5.378045714263916, + "train_acc": 0.0097, + "test_loss": 5.010745031738281, + "test_acc": 0.01, + "lyapunov": 1.5985675842865654, + "grad_norm": 0.21081504402843954, + "grad_max_sv": 0.08188115861266851, + "grad_min_sv": 5.212303423583328e-17, + "grad_condition": 81876236542.23714, + "lr": 0.0006840622763423388, + "time_sec": 177.4101119041443 + }, + { + "epoch": 58, + "train_loss": 5.369592454376221, + "train_acc": 0.00954, + "test_loss": 5.001489561462402, + "test_acc": 0.01, + "lyapunov": 1.594169369743913, + "grad_norm": 0.22207129747707732, + "grad_max_sv": 0.06061144880950451, + "grad_min_sv": 8.52425895192004e-34, + "grad_condition": 60611448809.5045, + "lr": 0.0006742860236609073, + "time_sec": 177.40956783294678 + }, + { + "epoch": 59, + "train_loss": 5.369317971343994, + "train_acc": 0.00942, + "test_loss": 5.000968522644043, + "test_acc": 0.01, + "lyapunov": 1.593946976429971, + "grad_norm": 0.21723304995593648, + "grad_max_sv": 0.06631144480779767, + "grad_min_sv": 5.644079889684282e-43, + "grad_condition": 66311444807.79767, + "lr": 0.0006644333233692913, + "time_sec": 177.41563248634338 + }, + { + "epoch": 60, + "train_loss": 5.367086203613281, + "train_acc": 0.00986, + "test_loss": 4.980809173583984, + "test_acc": 0.01, + "lyapunov": 1.5923281987304883, + "grad_norm": 0.22232157475356287, + "grad_max_sv": 0.05571612091735005, + "grad_min_sv": 0.0, + "grad_condition": 55716120917.35005, + "lr": 0.0006545084971874734, + "time_sec": 177.36889171600342 + }, + { + "epoch": 61, + "train_loss": 5.372129827270508, + "train_acc": 0.00924, + "test_loss": 5.0162686882019045, + "test_acc": 0.01, + "lyapunov": 1.5957943103502474, + "grad_norm": 0.2315139450623546, + "grad_max_sv": 0.05857418505474925, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 58574185054.74925, + "lr": 0.0006445158984722354, + "time_sec": 177.3955101966858 + }, + { + "epoch": 62, + "train_loss": 5.376675976257324, + "train_acc": 0.01028, + "test_loss": 4.951765003204346, + "test_acc": 0.01, + "lyapunov": 1.5998592873668427, + "grad_norm": 0.23053009469996935, + "grad_max_sv": 0.049639166425913574, + "grad_min_sv": 3.503246160812043e-47, + "grad_condition": 49639166425.913574, + "lr": 0.0006344599103076324, + "time_sec": 177.38628578186035 + }, + { + "epoch": 63, + "train_loss": 5.3675309051513675, + "train_acc": 0.00898, + "test_loss": 4.976654839324951, + "test_acc": 0.01, + "lyapunov": 1.59307188481626, + "grad_norm": 0.247010688591046, + "grad_max_sv": 0.04920805087313056, + "grad_min_sv": 0.0, + "grad_condition": 49208050873.13057, + "lr": 0.0006243449435824269, + "time_sec": 177.40613865852356 + }, + { + "epoch": 64, + "train_loss": 5.367255066528321, + "train_acc": 0.0097, + "test_loss": 5.067697259521484, + "test_acc": 0.01, + "lyapunov": 1.5924071750372573, + "grad_norm": 0.2341571351131304, + "grad_max_sv": 0.05343637596815824, + "grad_min_sv": 0.0, + "grad_condition": 53436375968.15825, + "lr": 0.0006141754350553275, + "time_sec": 177.3703956604004 + }, + { + "epoch": 65, + "train_loss": 5.367540504302979, + "train_acc": 0.00908, + "test_loss": 4.9729307174682615, + "test_acc": 0.01, + "lyapunov": 1.5929816647258865, + "grad_norm": 0.23218078781210785, + "grad_max_sv": 0.05375193590298295, + "grad_min_sv": 0.0, + "grad_condition": 53751935902.98295, + "lr": 0.0006039558454088793, + "time_sec": 177.38945150375366 + }, + { + "epoch": 66, + "train_loss": 5.366137564239502, + "train_acc": 0.00936, + "test_loss": 4.934913189697266, + "test_acc": 0.01, + "lyapunov": 1.5917930770713045, + "grad_norm": 0.21702876886168843, + "grad_max_sv": 0.04379821689799428, + "grad_min_sv": 0.0, + "grad_condition": 43798216897.99428, + "lr": 0.000593690657292862, + "time_sec": 177.4724154472351 + }, + { + "epoch": 67, + "train_loss": 5.370335599822998, + "train_acc": 0.00978, + "test_loss": 4.938832836914062, + "test_acc": 0.01, + "lyapunov": 1.5958915979356108, + "grad_norm": 0.26747204938928953, + "grad_max_sv": 0.038104135124012825, + "grad_min_sv": 0.0, + "grad_condition": 38104135124.01283, + "lr": 0.0005833843733580507, + "time_sec": 177.42428302764893 + }, + { + "epoch": 68, + "train_loss": 5.367096372375488, + "train_acc": 0.00948, + "test_loss": 4.961852867126465, + "test_acc": 0.01, + "lyapunov": 1.5927841407258798, + "grad_norm": 0.24628304430345999, + "grad_max_sv": 0.037431048322469, + "grad_min_sv": 0.0, + "grad_condition": 37431048322.468994, + "lr": 0.0005730415142812054, + "time_sec": 177.35656356811523 + }, + { + "epoch": 69, + "train_loss": 5.367298457641602, + "train_acc": 0.00942, + "test_loss": 4.985350135040283, + "test_acc": 0.01, + "lyapunov": 1.5926642820353398, + "grad_norm": 0.26713274620852084, + "grad_max_sv": 0.0558107316493988, + "grad_min_sv": 0.0, + "grad_condition": 55810731649.3988, + "lr": 0.0005626666167821517, + "time_sec": 177.404226064682 + }, + { + "epoch": 70, + "train_loss": 5.370034771118164, + "train_acc": 0.01, + "test_loss": 4.9722988952636715, + "test_acc": 0.01, + "lyapunov": 1.5953361000246404, + "grad_norm": 0.2772668383220675, + "grad_max_sv": 0.059619830828160046, + "grad_min_sv": 0.0, + "grad_condition": 59619830828.16006, + "lr": 0.0005522642316338265, + "time_sec": 177.41033554077148 + }, + { + "epoch": 71, + "train_loss": 5.3663228466796875, + "train_acc": 0.0097, + "test_loss": 4.996751819610596, + "test_acc": 0.01, + "lyapunov": 1.592004930881588, + "grad_norm": 0.27122147817442865, + "grad_max_sv": 0.051365063060075045, + "grad_min_sv": 0.0, + "grad_condition": 51365063060.07505, + "lr": 0.0005418389216661573, + "time_sec": 177.41588258743286 + }, + { + "epoch": 72, + "train_loss": 5.3688113453674315, + "train_acc": 0.00906, + "test_loss": 4.95511130065918, + "test_acc": 0.01, + "lyapunov": 1.5943079513052236, + "grad_norm": 0.2940023518744728, + "grad_max_sv": 0.043863069359213115, + "grad_min_sv": 0.0, + "grad_condition": 43863069359.21311, + "lr": 0.0005313952597646563, + "time_sec": 177.4312937259674 + }, + { + "epoch": 73, + "train_loss": 5.369862328338623, + "train_acc": 0.00916, + "test_loss": 4.928821298217773, + "test_acc": 0.01, + "lyapunov": 1.5948649678388824, + "grad_norm": 0.337053679491892, + "grad_max_sv": 0.03650999316014349, + "grad_min_sv": 0.0, + "grad_condition": 36509993160.14349, + "lr": 0.0005209378268645994, + "time_sec": 177.47835731506348 + }, + { + "epoch": 74, + "train_loss": 5.366141536560058, + "train_acc": 0.00956, + "test_loss": 4.951869967651367, + "test_acc": 0.01, + "lyapunov": 1.591574984133396, + "grad_norm": 0.34688609459259695, + "grad_max_sv": 0.0532405337318778, + "grad_min_sv": 0.0, + "grad_condition": 53240533731.87779, + "lr": 0.0005104712099416781, + "time_sec": 177.39541888237 + }, + { + "epoch": 75, + "train_loss": 5.3659246875, + "train_acc": 0.00862, + "test_loss": 4.96804543762207, + "test_acc": 0.01, + "lyapunov": 1.5917583252767773, + "grad_norm": 0.49942333201069317, + "grad_max_sv": 0.04099391270428896, + "grad_min_sv": 0.0, + "grad_condition": 40993912704.288956, + "lr": 0.0004999999999999996, + "time_sec": 177.3808958530426 + }, + { + "epoch": 76, + "train_loss": 5.3697430253601075, + "train_acc": 0.00932, + "test_loss": 4.843025128173828, + "test_acc": 0.01, + "lyapunov": 1.5954608170272748, + "grad_norm": 0.5592194591464297, + "grad_max_sv": 0.03530313139781356, + "grad_min_sv": 0.0, + "grad_condition": 35303131397.81356, + "lr": 0.0004895287900583212, + "time_sec": 177.36198616027832 + }, + { + "epoch": 77, + "train_loss": 5.369125059814453, + "train_acc": 0.00908, + "test_loss": 4.996518075561523, + "test_acc": 0.01, + "lyapunov": 1.5947885577331113, + "grad_norm": 0.5290088024656862, + "grad_max_sv": 0.017188509553670885, + "grad_min_sv": 0.0, + "grad_condition": 17188509553.670883, + "lr": 0.0004790621731353997, + "time_sec": 177.27709126472473 + }, + { + "epoch": 78, + "train_loss": 5.368183317260742, + "train_acc": 0.01024, + "test_loss": 4.973466501617431, + "test_acc": 0.01, + "lyapunov": 1.5941324002297639, + "grad_norm": 0.6809743973398079, + "grad_max_sv": 0.029488482885062693, + "grad_min_sv": 0.0, + "grad_condition": 29488482885.062695, + "lr": 0.000468604740235343, + "time_sec": 177.3189423084259 + }, + { + "epoch": 79, + "train_loss": 5.367250970458985, + "train_acc": 0.00956, + "test_loss": 4.950716239929199, + "test_acc": 0.01, + "lyapunov": 1.5930783117518705, + "grad_norm": 1.411636125689672, + "grad_max_sv": 0.031192977959290148, + "grad_min_sv": 0.0, + "grad_condition": 31192977959.29015, + "lr": 0.00045816107833384175, + "time_sec": 177.3485884666443 + }, + { + "epoch": 80, + "train_loss": 5.366609226837158, + "train_acc": 0.01002, + "test_loss": 4.952863761901855, + "test_acc": 0.01, + "lyapunov": 1.5922869257914745, + "grad_norm": 1.0613102889069541, + "grad_max_sv": 0.042383548151701686, + "grad_min_sv": 0.0, + "grad_condition": 42383548151.70168, + "lr": 0.0004477357683661729, + "time_sec": 177.41135001182556 + }, + { + "epoch": 81, + "train_loss": 5.367390147705078, + "train_acc": 0.00896, + "test_loss": 4.965977513885498, + "test_acc": 0.01, + "lyapunov": 1.5931403121679946, + "grad_norm": 1.113579115473781, + "grad_max_sv": 0.039911494683474304, + "grad_min_sv": 0.0, + "grad_condition": 39911494683.474304, + "lr": 0.00043733338321784746, + "time_sec": 177.3696448802948 + }, + { + "epoch": 82, + "train_loss": 5.374857454833984, + "train_acc": 0.0098, + "test_loss": 4.912637939453125, + "test_acc": 0.01, + "lyapunov": 1.5992167480766315, + "grad_norm": 1.3681227141701577, + "grad_max_sv": 0.032051424495875835, + "grad_min_sv": 0.0, + "grad_condition": 32051424495.875835, + "lr": 0.0004269584857187939, + "time_sec": 177.33939170837402 + }, + { + "epoch": 83, + "train_loss": 5.365830071716308, + "train_acc": 0.01, + "test_loss": 4.93360542678833, + "test_acc": 0.01, + "lyapunov": 1.5919503589420367, + "grad_norm": 1.2908239754732598, + "grad_max_sv": 0.018338044127449393, + "grad_min_sv": 0.0, + "grad_condition": 18338044127.449394, + "lr": 0.0004166156266419484, + "time_sec": 177.30572271347046 + }, + { + "epoch": 84, + "train_loss": 5.369314513549805, + "train_acc": 0.01032, + "test_loss": 4.962402893066407, + "test_acc": 0.01, + "lyapunov": 1.5951606830977418, + "grad_norm": 1.2430323961128404, + "grad_max_sv": 0.014490698464214802, + "grad_min_sv": 0.0, + "grad_condition": 14490698464.214802, + "lr": 0.0004063093427071373, + "time_sec": 177.2841637134552 + }, + { + "epoch": 85, + "train_loss": 5.377282650604248, + "train_acc": 0.00908, + "test_loss": 4.969677833557129, + "test_acc": 0.01, + "lyapunov": 1.5993056263765106, + "grad_norm": 1.0935450948855057, + "grad_max_sv": 0.03076445385813713, + "grad_min_sv": 0.0, + "grad_condition": 30764453858.137135, + "lr": 0.0003960441545911199, + "time_sec": 177.35037755966187 + }, + { + "epoch": 86, + "train_loss": 5.365991982879638, + "train_acc": 0.00934, + "test_loss": 4.960339687347412, + "test_acc": 0.01, + "lyapunov": 1.591959211527539, + "grad_norm": 1.0249256686134756, + "grad_max_sv": 0.03798610083758831, + "grad_min_sv": 0.0, + "grad_condition": 37986100837.5883, + "lr": 0.0003858245649446718, + "time_sec": 177.35586881637573 + }, + { + "epoch": 87, + "train_loss": 5.36631558807373, + "train_acc": 0.00936, + "test_loss": 4.948922778320313, + "test_acc": 0.01, + "lyapunov": 1.5924714169538845, + "grad_norm": 0.8096413328413968, + "grad_max_sv": 0.033394893538206814, + "grad_min_sv": 0.0, + "grad_condition": 33394893538.206818, + "lr": 0.00037565505641757235, + "time_sec": 177.3941514492035 + }, + { + "epoch": 88, + "train_loss": 5.372631300354004, + "train_acc": 0.01006, + "test_loss": 4.890858795166015, + "test_acc": 0.01, + "lyapunov": 1.5971073076853057, + "grad_norm": 0.3735195103580093, + "grad_max_sv": 0.02607831247150898, + "grad_min_sv": 0.0, + "grad_condition": 26078312471.50898, + "lr": 0.00036554008969236695, + "time_sec": 177.28741931915283 + }, + { + "epoch": 89, + "train_loss": 5.367757025299072, + "train_acc": 0.0093, + "test_loss": 4.9563854202270505, + "test_acc": 0.01, + "lyapunov": 1.593846448242207, + "grad_norm": 0.4162028440796633, + "grad_max_sv": 0.030028719501569868, + "grad_min_sv": 0.0, + "grad_condition": 30028719501.569862, + "lr": 0.0003554841015277638, + "time_sec": 177.30004262924194 + }, + { + "epoch": 90, + "train_loss": 5.369390062561036, + "train_acc": 0.01028, + "test_loss": 4.903431629943848, + "test_acc": 0.01, + "lyapunov": 1.5944386360895297, + "grad_norm": 0.45537462137938906, + "grad_max_sv": 0.03309078188613057, + "grad_min_sv": 0.0, + "grad_condition": 33090781886.130573, + "lr": 0.000345491502812526, + "time_sec": 177.33181858062744 + }, + { + "epoch": 91, + "train_loss": 5.36617555480957, + "train_acc": 0.0097, + "test_loss": 4.973295672607422, + "test_acc": 0.01, + "lyapunov": 1.5924281744700868, + "grad_norm": 0.42959416759344066, + "grad_max_sv": 0.02529722950421274, + "grad_min_sv": 0.0, + "grad_condition": 25297229504.212738, + "lr": 0.0003355666766307081, + "time_sec": 177.29152536392212 + }, + { + "epoch": 92, + "train_loss": 5.3661282931518555, + "train_acc": 0.0106, + "test_loss": 4.874008221435547, + "test_acc": 0.01, + "lyapunov": 1.5923549528317074, + "grad_norm": 0.4739333324657675, + "grad_max_sv": 0.027486719330772756, + "grad_min_sv": 0.0, + "grad_condition": 27486719330.77276, + "lr": 0.00032571397633909225, + "time_sec": 177.3095293045044 + }, + { + "epoch": 93, + "train_loss": 5.36726612121582, + "train_acc": 0.00952, + "test_loss": 4.844555052947998, + "test_acc": 0.01, + "lyapunov": 1.5933535443547437, + "grad_norm": 0.4489090651028355, + "grad_max_sv": 0.027935726940631865, + "grad_min_sv": 0.0, + "grad_condition": 27935726940.631866, + "lr": 0.00031593772365766094, + "time_sec": 177.29880285263062 + }, + { + "epoch": 94, + "train_loss": 5.367507637634278, + "train_acc": 0.00938, + "test_loss": 4.85123999710083, + "test_acc": 0.01, + "lyapunov": 1.593514009509855, + "grad_norm": 0.49488308768779743, + "grad_max_sv": 0.03786678058095276, + "grad_min_sv": 0.0, + "grad_condition": 37866780580.95277, + "lr": 0.0003062422067739483, + "time_sec": 177.66627550125122 + }, + { + "epoch": 95, + "train_loss": 5.367161036987305, + "train_acc": 0.01, + "test_loss": 4.919075784301758, + "test_acc": 0.01, + "lyapunov": 1.593309577468716, + "grad_norm": 0.49632556697910357, + "grad_max_sv": 0.03764305226504803, + "grad_min_sv": 0.0, + "grad_condition": 37643052265.04803, + "lr": 0.00029663167846209965, + "time_sec": 177.35125970840454 + }, + { + "epoch": 96, + "train_loss": 5.368773625488282, + "train_acc": 0.00952, + "test_loss": 4.886889329528809, + "test_acc": 0.01, + "lyapunov": 1.5946083480439832, + "grad_norm": 0.5634579068593676, + "grad_max_sv": 0.033481535781174895, + "grad_min_sv": 0.0, + "grad_condition": 33481535781.174904, + "lr": 0.00028711035421746345, + "time_sec": 177.33729600906372 + }, + { + "epoch": 97, + "train_loss": 5.373278410797119, + "train_acc": 0.0092, + "test_loss": 4.919860540771484, + "test_acc": 0.01, + "lyapunov": 1.5970366150521866, + "grad_norm": 0.5241288299265501, + "grad_max_sv": 0.02991771958768368, + "grad_min_sv": 0.0, + "grad_condition": 29917719587.683678, + "lr": 0.00027768241040753615, + "time_sec": 177.3373203277588 + }, + { + "epoch": 98, + "train_loss": 5.367487851867676, + "train_acc": 0.00984, + "test_loss": 4.922154154968262, + "test_acc": 0.01, + "lyapunov": 1.5938531629874577, + "grad_norm": 0.6102489153602656, + "grad_max_sv": 0.02815253552980721, + "grad_min_sv": 0.0, + "grad_condition": 28152535529.807213, + "lr": 0.00026835198244006903, + "time_sec": 177.35172653198242 + }, + { + "epoch": 99, + "train_loss": 5.367893275756836, + "train_acc": 0.01038, + "test_loss": 4.930574498748779, + "test_acc": 0.01, + "lyapunov": 1.593941973908173, + "grad_norm": 0.5921377439478998, + "grad_max_sv": 0.03409935408271849, + "grad_min_sv": 0.0, + "grad_condition": 34099354082.718487, + "lr": 0.0002591231629491421, + "time_sec": 177.36736416816711 + }, + { + "epoch": 100, + "train_loss": 5.372079080200195, + "train_acc": 0.01062, + "test_loss": 4.915191829681397, + "test_acc": 0.01, + "lyapunov": 1.596833938832783, + "grad_norm": 0.5930918441111938, + "grad_max_sv": 0.033569992519915104, + "grad_min_sv": 0.0, + "grad_condition": 33569992519.915108, + "lr": 0.0002499999999999997, + "time_sec": 177.3853051662445 + }, + { + "epoch": 101, + "train_loss": 5.365807982940674, + "train_acc": 0.00976, + "test_loss": 4.926369466400146, + "test_acc": 0.01, + "lyapunov": 1.5920866029646696, + "grad_norm": 1.2269794373451623, + "grad_max_sv": 0.03278505662456155, + "grad_min_sv": 0.0, + "grad_condition": 32785056624.561546, + "lr": 0.00024098649531343477, + "time_sec": 177.41039776802063 + }, + { + "epoch": 102, + "train_loss": 5.3670011302185054, + "train_acc": 0.00968, + "test_loss": 5.182023647308349, + "test_acc": 0.01, + "lyapunov": 1.5932530469601722, + "grad_norm": 0.5812477341116522, + "grad_max_sv": 0.03314556856639683, + "grad_min_sv": 0.0, + "grad_condition": 33145568566.39683, + "lr": 0.0002320866025105016, + "time_sec": 177.37316060066223 + }, + { + "epoch": 103, + "train_loss": 5.371551856231689, + "train_acc": 0.01004, + "test_loss": 4.899476731109619, + "test_acc": 0.01, + "lyapunov": 1.5966654973261802, + "grad_norm": 0.610767105839377, + "grad_max_sv": 0.02582362242974341, + "grad_min_sv": 0.0, + "grad_condition": 25823622429.74341, + "lr": 0.0002233042253783278, + "time_sec": 177.36590600013733 + }, + { + "epoch": 104, + "train_loss": 5.368561768646241, + "train_acc": 0.00946, + "test_loss": 4.930848654174805, + "test_acc": 0.01, + "lyapunov": 1.5947173150908915, + "grad_norm": 0.6422628015235555, + "grad_max_sv": 0.025343496771529316, + "grad_min_sv": 0.0, + "grad_condition": 25343496771.529316, + "lr": 0.000214643216157784, + "time_sec": 177.3882737159729 + }, + { + "epoch": 105, + "train_loss": 5.36991615814209, + "train_acc": 0.0091, + "test_loss": 4.899362311553955, + "test_acc": 0.01, + "lyapunov": 1.5956382519753693, + "grad_norm": 0.5876379942472394, + "grad_max_sv": 0.02119842660613358, + "grad_min_sv": 0.0, + "grad_condition": 21198426606.133583, + "lr": 0.00020610737385376332, + "time_sec": 177.41758513450623 + }, + { + "epoch": 106, + "train_loss": 5.366515799407959, + "train_acc": 0.01026, + "test_loss": 4.887499784851074, + "test_acc": 0.01, + "lyapunov": 1.592897226743381, + "grad_norm": 0.6201818264513558, + "grad_max_sv": 0.0033281870651990174, + "grad_min_sv": 0.0, + "grad_condition": 3328187065.1990175, + "lr": 0.00019770044256881242, + "time_sec": 177.3366186618805 + }, + { + "epoch": 107, + "train_loss": 5.368152584533691, + "train_acc": 0.00916, + "test_loss": 4.894157613372803, + "test_acc": 0.01, + "lyapunov": 1.5942484835529571, + "grad_norm": 0.7280576803690416, + "grad_max_sv": 0.027869051974266767, + "grad_min_sv": 0.0, + "grad_condition": 27869051974.266766, + "lr": 0.0001894261098608447, + "time_sec": 177.37792563438416 + }, + { + "epoch": 108, + "train_loss": 5.3665059283447265, + "train_acc": 0.00976, + "test_loss": 4.915471728515625, + "test_acc": 0.01, + "lyapunov": 1.592840023662733, + "grad_norm": 0.7424554492649038, + "grad_max_sv": 0.026440556207671762, + "grad_min_sv": 0.0, + "grad_condition": 26440556207.67176, + "lr": 0.000181288005125655, + "time_sec": 177.35853958129883 + }, + { + "epoch": 109, + "train_loss": 5.376394969329834, + "train_acc": 0.01022, + "test_loss": 4.922409371948242, + "test_acc": 0.01, + "lyapunov": 1.6003244386609559, + "grad_norm": 0.8040426103005965, + "grad_max_sv": 0.024923838768154384, + "grad_min_sv": 0.0, + "grad_condition": 24923838768.15438, + "lr": 0.0001732896980049473, + "time_sec": 177.31202268600464 + }, + { + "epoch": 110, + "train_loss": 5.376544867401123, + "train_acc": 0.01006, + "test_loss": 4.9106194869995115, + "test_acc": 0.01, + "lyapunov": 1.5990420381736268, + "grad_norm": 0.7808973134784486, + "grad_max_sv": 0.023315236158668994, + "grad_min_sv": 0.0, + "grad_condition": 23315236158.668995, + "lr": 0.00016543469682057076, + "time_sec": 177.3295497894287 + }, + { + "epoch": 111, + "train_loss": 5.366748910522461, + "train_acc": 0.01, + "test_loss": 4.904478953552246, + "test_acc": 0.01, + "lyapunov": 1.5930900046282717, + "grad_norm": 0.8315740534061841, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015772644703565552, + "time_sec": 177.3059582710266 + }, + { + "epoch": 112, + "train_loss": 5.365462461242676, + "train_acc": 0.0097, + "test_loss": 4.909817778778076, + "test_acc": 0.01, + "lyapunov": 1.591839042770893, + "grad_norm": 1.0644316030188519, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00015016832974331713, + "time_sec": 177.3259735107422 + }, + { + "epoch": 113, + "train_loss": 5.366983929290772, + "train_acc": 0.01, + "test_loss": 4.893335526275635, + "test_acc": 0.01, + "lyapunov": 1.5934227226335373, + "grad_norm": 1.0331708046855217, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014276366018359834, + "time_sec": 177.29799342155457 + }, + { + "epoch": 114, + "train_loss": 5.367780682678223, + "train_acc": 0.01, + "test_loss": 4.896582912445068, + "test_acc": 0.01, + "lyapunov": 1.5942320003533912, + "grad_norm": 1.09308769834869, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00013551568628929425, + "time_sec": 177.33024215698242 + }, + { + "epoch": 115, + "train_loss": 5.367718472900391, + "train_acc": 0.01, + "test_loss": 4.895343659973144, + "test_acc": 0.01, + "lyapunov": 1.5940615042396213, + "grad_norm": 1.2673802568939343, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012842758726130276, + "time_sec": 177.3362259864807 + }, + { + "epoch": 116, + "train_loss": 5.3657911352539065, + "train_acc": 0.01, + "test_loss": 4.906929530334473, + "test_acc": 0.01, + "lyapunov": 1.5921993859283758, + "grad_norm": 1.2617224687326039, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001215024721741218, + "time_sec": 177.28457856178284 + }, + { + "epoch": 117, + "train_loss": 5.366755274505615, + "train_acc": 0.00962, + "test_loss": 4.891025592041015, + "test_acc": 0.01, + "lyapunov": 1.5932053120239922, + "grad_norm": 1.3667828520013348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210538, + "time_sec": 177.260840177536 + }, + { + "epoch": 118, + "train_loss": 5.369936829376221, + "train_acc": 0.00938, + "test_loss": 4.908762777709961, + "test_acc": 0.01, + "lyapunov": 1.5956426922927427, + "grad_norm": 1.4737347393486513, + "grad_max_sv": 0.002789213368669152, + "grad_min_sv": 0.0, + "grad_condition": 2789213368.6691523, + "lr": 0.00010815327133708009, + "time_sec": 177.28786754608154 + }, + { + "epoch": 119, + "train_loss": 5.367702166290283, + "train_acc": 0.01006, + "test_loss": 4.900025549316406, + "test_acc": 0.01, + "lyapunov": 1.5938852357742426, + "grad_norm": 1.445693487120252, + "grad_max_sv": 0.004225540207698941, + "grad_min_sv": 0.0, + "grad_condition": 4225540207.698941, + "lr": 0.00010173504098790182, + "time_sec": 177.32281279563904 + }, + { + "epoch": 120, + "train_loss": 5.366396225891113, + "train_acc": 0.01, + "test_loss": 4.875214715576172, + "test_acc": 0.01, + "lyapunov": 1.5928466237719408, + "grad_norm": 1.5218270915127643, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252629e-05, + "time_sec": 177.28257083892822 + }, + { + "epoch": 121, + "train_loss": 5.366784219818115, + "train_acc": 0.01, + "test_loss": 4.868653475952148, + "test_acc": 0.01, + "lyapunov": 1.5932423071483213, + "grad_norm": 1.5915107890267433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.942539543314794e-05, + "time_sec": 177.2724094390869 + }, + { + "epoch": 122, + "train_loss": 5.3684937673950195, + "train_acc": 0.0095, + "test_loss": 4.872081127929688, + "test_acc": 0.01, + "lyapunov": 1.5947217929088855, + "grad_norm": 1.7802951927894717, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.353937964495024e-05, + "time_sec": 177.29115104675293 + }, + { + "epoch": 123, + "train_loss": 5.368383057250977, + "train_acc": 0.00976, + "test_loss": 4.865282067871094, + "test_acc": 0.01, + "lyapunov": 1.5946415565202914, + "grad_norm": 1.8635884798014917, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.783603724899243e-05, + "time_sec": 177.29619812965393 + }, + { + "epoch": 124, + "train_loss": 5.369555229797363, + "train_acc": 0.01, + "test_loss": 4.850182081604004, + "test_acc": 0.01, + "lyapunov": 1.595543795839295, + "grad_norm": 1.9786412883932707, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.231786991974666e-05, + "time_sec": 177.28673815727234 + }, + { + "epoch": 125, + "train_loss": 5.366839987792969, + "train_acc": 0.0099, + "test_loss": 4.863481466674805, + "test_acc": 0.01, + "lyapunov": 1.5933110564566024, + "grad_norm": 1.981713372629457, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.698729810778072e-05, + "time_sec": 177.54408073425293 + }, + { + "epoch": 126, + "train_loss": 5.367286334533691, + "train_acc": 0.00978, + "test_loss": 4.864164552307129, + "test_acc": 0.01, + "lyapunov": 1.593780165133269, + "grad_norm": 2.0792063115884303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806817e-05, + "time_sec": 177.27722811698914 + }, + { + "epoch": 127, + "train_loss": 5.377017222900391, + "train_acc": 0.00976, + "test_loss": 4.867053485107422, + "test_acc": 0.01, + "lyapunov": 1.5985291836511752, + "grad_norm": 1.8808489686841805, + "grad_max_sv": 0.0020057843998074532, + "grad_min_sv": 0.0, + "grad_condition": 2005784399.8074532, + "lr": 5.6898210384392595e-05, + "time_sec": 177.32938599586487 + }, + { + "epoch": 128, + "train_loss": 5.3731236241149904, + "train_acc": 0.0099, + "test_loss": 4.862087628173828, + "test_acc": 0.01, + "lyapunov": 1.5972985928625707, + "grad_norm": 2.0544715272998646, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.214411988029363e-05, + "time_sec": 177.26091361045837 + }, + { + "epoch": 129, + "train_loss": 5.366952188110352, + "train_acc": 0.00966, + "test_loss": 4.87226043548584, + "test_acc": 0.01, + "lyapunov": 1.5934485755003323, + "grad_norm": 2.0287817825331826, + "grad_max_sv": 0.0008733986876904964, + "grad_min_sv": 0.0, + "grad_condition": 873398687.6904964, + "lr": 4.7586473766990294e-05, + "time_sec": 177.30408883094788 + }, + { + "epoch": 130, + "train_loss": 5.36849506149292, + "train_acc": 0.01004, + "test_loss": 4.863279203796386, + "test_acc": 0.01, + "lyapunov": 1.594751832735203, + "grad_norm": 1.980669281269925, + "grad_max_sv": 0.010736069735139608, + "grad_min_sv": 0.0, + "grad_condition": 10736069735.139608, + "lr": 4.32272711786996e-05, + "time_sec": 177.28869652748108 + }, + { + "epoch": 131, + "train_loss": 5.377595603637696, + "train_acc": 0.01, + "test_loss": 4.866737941741944, + "test_acc": 0.01, + "lyapunov": 1.5995000756305198, + "grad_norm": 2.154727256033659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.906842420574966e-05, + "time_sec": 177.257958650589 + }, + { + "epoch": 132, + "train_loss": 5.369090413818359, + "train_acc": 0.01, + "test_loss": 4.858406136322022, + "test_acc": 0.01, + "lyapunov": 1.5953167524484113, + "grad_norm": 2.191344847482899, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.5111757055874305e-05, + "time_sec": 177.27152252197266 + }, + { + "epoch": 133, + "train_loss": 5.3665374522399905, + "train_acc": 0.01, + "test_loss": 4.860008187866211, + "test_acc": 0.01, + "lyapunov": 1.5930466167152386, + "grad_norm": 2.0841828503003916, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.1359005254054254e-05, + "time_sec": 177.28846549987793 + }, + { + "epoch": 134, + "train_loss": 5.366383743286133, + "train_acc": 0.00974, + "test_loss": 4.848487128448486, + "test_acc": 0.01, + "lyapunov": 1.592855043118567, + "grad_norm": 2.195653914411608, + "grad_max_sv": 0.0033036706037819384, + "grad_min_sv": 0.0, + "grad_condition": 3303670603.7819386, + "lr": 2.7811814881259484e-05, + "time_sec": 177.28988027572632 + }, + { + "epoch": 135, + "train_loss": 5.367761196746827, + "train_acc": 0.00998, + "test_loss": 4.859366925048828, + "test_acc": 0.01, + "lyapunov": 1.594165514802079, + "grad_norm": 2.1904859959999126, + "grad_max_sv": 0.0012543844059109688, + "grad_min_sv": 0.0, + "grad_condition": 1254384405.9109688, + "lr": 2.4471741852423218e-05, + "time_sec": 177.2780725955963 + }, + { + "epoch": 136, + "train_loss": 5.366510193634033, + "train_acc": 0.01, + "test_loss": 4.8595954734802245, + "test_acc": 0.01, + "lyapunov": 1.5930009638257039, + "grad_norm": 2.1839168134099793, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.1340251233966362e-05, + "time_sec": 177.28521990776062 + }, + { + "epoch": 137, + "train_loss": 5.367833109741211, + "train_acc": 0.01, + "test_loss": 4.850632510375976, + "test_acc": 0.01, + "lyapunov": 1.5938955752745918, + "grad_norm": 2.14228114693839, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.8418716601170932e-05, + "time_sec": 177.32584595680237 + }, + { + "epoch": 138, + "train_loss": 5.378068528137207, + "train_acc": 0.01018, + "test_loss": 4.858175395202637, + "test_acc": 0.01, + "lyapunov": 1.5998802581406615, + "grad_norm": 2.218784068596557, + "grad_max_sv": 0.0014573325868695974, + "grad_min_sv": 0.0, + "grad_condition": 1457332586.8695974, + "lr": 1.570841943568445e-05, + "time_sec": 177.31577253341675 + }, + { + "epoch": 139, + "train_loss": 5.367863772277832, + "train_acc": 0.01034, + "test_loss": 4.8480802886962895, + "test_acc": 0.01, + "lyapunov": 1.5942664253132424, + "grad_norm": 2.2444364897318794, + "grad_max_sv": 0.012257534638047218, + "grad_min_sv": 0.0, + "grad_condition": 12257534638.047218, + "lr": 1.3210548563419845e-05, + "time_sec": 177.30443215370178 + }, + { + "epoch": 140, + "train_loss": 5.366426722717285, + "train_acc": 0.00962, + "test_loss": 4.848219221496582, + "test_acc": 0.01, + "lyapunov": 1.5928701375756422, + "grad_norm": 2.3192997356397203, + "grad_max_sv": 0.006218939693644643, + "grad_min_sv": 0.0, + "grad_condition": 6218939693.644643, + "lr": 1.0926199633097203e-05, + "time_sec": 177.33384609222412 + }, + { + "epoch": 141, + "train_loss": 5.36580462097168, + "train_acc": 0.00986, + "test_loss": 4.850540889739991, + "test_acc": 0.01, + "lyapunov": 1.592248017830617, + "grad_norm": 2.287220965288124, + "grad_max_sv": 0.0013559065759181977, + "grad_min_sv": 0.0, + "grad_condition": 1355906575.9181976, + "lr": 8.856374635655688e-06, + "time_sec": 177.32693576812744 + }, + { + "epoch": 142, + "train_loss": 5.3662375875854496, + "train_acc": 0.01, + "test_loss": 4.853694881439209, + "test_acc": 0.01, + "lyapunov": 1.5927291526209058, + "grad_norm": 2.302468482661773, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.001981464747503e-06, + "time_sec": 177.3142066001892 + }, + { + "epoch": 143, + "train_loss": 5.372984427642822, + "train_acc": 0.01004, + "test_loss": 4.852922064208984, + "test_acc": 0.01, + "lyapunov": 1.597528722889893, + "grad_norm": 2.348373340052694, + "grad_max_sv": 0.0011802260298281908, + "grad_min_sv": 0.0, + "grad_condition": 1180226029.8281908, + "lr": 5.3638335185058295e-06, + "time_sec": 177.3356897830963 + }, + { + "epoch": 144, + "train_loss": 5.368205472106934, + "train_acc": 0.00984, + "test_loss": 4.849281020355225, + "test_acc": 0.01, + "lyapunov": 1.594479467252941, + "grad_norm": 2.312922144804607, + "grad_max_sv": 0.0006380858831107616, + "grad_min_sv": 0.0, + "grad_condition": 638085883.1107616, + "lr": 3.942649342761114e-06, + "time_sec": 177.28971314430237 + }, + { + "epoch": 145, + "train_loss": 5.366419898681641, + "train_acc": 0.01006, + "test_loss": 4.848984435272217, + "test_acc": 0.01, + "lyapunov": 1.592920510360347, + "grad_norm": 2.317195419975272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.7390523158633524e-06, + "time_sec": 177.31689953804016 + }, + { + "epoch": 146, + "train_loss": 5.373454104766846, + "train_acc": 0.01, + "test_loss": 4.849994027709961, + "test_acc": 0.01, + "lyapunov": 1.598964246642559, + "grad_norm": 2.4233925402092833, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.7535703752478133e-06, + "time_sec": 177.32813477516174 + }, + { + "epoch": 147, + "train_loss": 5.3674054251098635, + "train_acc": 0.01, + "test_loss": 4.851546574401856, + "test_acc": 0.01, + "lyapunov": 1.5935643969289481, + "grad_norm": 2.3247951305562196, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642196e-07, + "time_sec": 177.28444719314575 + }, + { + "epoch": 148, + "train_loss": 5.3666025303649905, + "train_acc": 0.01, + "test_loss": 4.8515466201782225, + "test_acc": 0.01, + "lyapunov": 1.5931046256019026, + "grad_norm": 2.3395920546004754, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.38584950570808e-07, + "time_sec": 177.2980020046234 + }, + { + "epoch": 149, + "train_loss": 5.365688817749024, + "train_acc": 0.01, + "test_loss": 4.851546644592285, + "test_acc": 0.01, + "lyapunov": 1.5921499198659912, + "grad_norm": 2.4070679367245766, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.096582625772501e-07, + "time_sec": 177.28436994552612 + }, + { + "epoch": 150, + "train_loss": 5.363941977539063, + "train_acc": 0.01, + "test_loss": 4.851546675109863, + "test_acc": 0.01, + "lyapunov": 1.5903311498329769, + "grad_norm": 2.3202323044197746, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 177.27790570259094 + } + ] + } +}
\ No newline at end of file |
