{ "vanilla": { "4": [ { "epoch": 1, "train_loss": 4.348092296829224, "train_acc": 0.09724, "test_loss": 3.5478567863464354, "test_acc": 0.1787, "lyapunov": null, "grad_norm": 6.316536759043694, "grad_max_sv": 4.902881336212158, "grad_min_sv": 1.1448865706586986e-07, "grad_condition": 88191421.7926497, "lr": 0.0009998903417374227, "time_sec": 17.679682731628418 }, { "epoch": 2, "train_loss": 3.49050922706604, "train_acc": 0.1874, "test_loss": 3.2633129741668703, "test_acc": 0.2305, "lyapunov": null, "grad_norm": 4.4801349556346395, "grad_max_sv": 3.2215479910373688, "grad_min_sv": 8.299195606298326e-08, "grad_condition": 121110274.52327952, "lr": 0.0009995614150494292, "time_sec": 15.735185623168945 }, { "epoch": 3, "train_loss": 3.0170057023620607, "train_acc": 0.25916, "test_loss": 2.9698277725219726, "test_acc": 0.277, "lyapunov": null, "grad_norm": 3.5133664087504743, "grad_max_sv": 2.335329008102417, "grad_min_sv": 6.557634772974552e-08, "grad_condition": 39177377.20397766, "lr": 0.0009990133642141358, "time_sec": 15.478843212127686 }, { "epoch": 4, "train_loss": 2.72460933883667, "train_acc": 0.31376, "test_loss": 2.5551274646759032, "test_acc": 0.3459, "lyapunov": null, "grad_norm": 2.9634417699116904, "grad_max_sv": 1.8090383648872375, "grad_min_sv": 5.484415814827059e-08, "grad_condition": 38079849.47138412, "lr": 0.0009982464296247522, "time_sec": 15.453156232833862 }, { "epoch": 5, "train_loss": 2.490703504867554, "train_acc": 0.35894, "test_loss": 2.7182868785858156, "test_acc": 0.3267, "lyapunov": null, "grad_norm": 2.6429461818460145, "grad_max_sv": 1.5860196590423583, "grad_min_sv": 4.9649662298145714e-08, "grad_condition": 58850970.75600495, "lr": 0.0009972609476841367, "time_sec": 15.466280460357666 }, { "epoch": 6, "train_loss": 2.3172771724700927, "train_acc": 0.39578, "test_loss": 2.39353342666626, "test_acc": 0.3858, "lyapunov": null, "grad_norm": 2.425728150736765, "grad_max_sv": 1.3820528209209442, "grad_min_sv": 4.6181405355394387e-08, "grad_condition": 48644681.68891229, "lr": 0.000996057350657239, "time_sec": 15.472876071929932 }, { "epoch": 7, "train_loss": 2.1795343031311036, "train_acc": 0.42514, "test_loss": 2.5081939483642577, "test_acc": 0.3733, "lyapunov": null, "grad_norm": 2.261531612589412, "grad_max_sv": 1.2684625327587127, "grad_min_sv": 4.360769899069972e-08, "grad_condition": 42250330.837381184, "lr": 0.000994636166481494, "time_sec": 15.466506242752075 }, { "epoch": 8, "train_loss": 2.0688308012390135, "train_acc": 0.44974, "test_loss": 2.4493139656066893, "test_acc": 0.3851, "lyapunov": null, "grad_norm": 2.118981579627668, "grad_max_sv": 1.159741823375225, "grad_min_sv": 4.073619567137449e-08, "grad_condition": 437927531.63442343, "lr": 0.0009929980185352525, "time_sec": 15.472336769104004 }, { "epoch": 9, "train_loss": 1.9493904537963866, "train_acc": 0.47454, "test_loss": 2.441312085723877, "test_acc": 0.389, "lyapunov": null, "grad_norm": 1.9875075491821204, "grad_max_sv": 1.0529514640569686, "grad_min_sv": 3.8403542657050595e-08, "grad_condition": 87931604.40353736, "lr": 0.0009911436253643444, "time_sec": 15.4936044216156 }, { "epoch": 10, "train_loss": 1.858957971572876, "train_acc": 0.4983, "test_loss": 2.183478004837036, "test_acc": 0.4383, "lyapunov": null, "grad_norm": 1.8688341406216382, "grad_max_sv": 0.9524922624230385, "grad_min_sv": 3.567054506770084e-08, "grad_condition": 37551442.84495841, "lr": 0.0009890738003669028, "time_sec": 15.46358847618103 }, { "epoch": 11, "train_loss": 1.7630364864730834, "train_acc": 0.51782, "test_loss": 3.0158682430267336, "test_acc": 0.3359, "lyapunov": null, "grad_norm": 1.7816105917819214, "grad_max_sv": 0.9029998555779457, "grad_min_sv": 3.4386650932249904e-08, "grad_condition": 96253986.02645789, "lr": 0.00098678945143658, "time_sec": 15.461369752883911 }, { "epoch": 12, "train_loss": 1.7038999611282348, "train_acc": 0.52966, "test_loss": 2.345099726104736, "test_acc": 0.4116, "lyapunov": null, "grad_norm": 1.703439920745613, "grad_max_sv": 0.8390393868088722, "grad_min_sv": 3.2384037166287294e-08, "grad_condition": 263062888.07930222, "lr": 0.0009842915805643154, "time_sec": 15.47589898109436 }, { "epoch": 13, "train_loss": 1.6350115670394898, "train_acc": 0.54934, "test_loss": 2.3178677167892454, "test_acc": 0.4258, "lyapunov": null, "grad_norm": 1.627197475633154, "grad_max_sv": 0.7804030522704124, "grad_min_sv": 3.0640796072622935e-08, "grad_condition": 47339680.420034245, "lr": 0.000981581283398829, "time_sec": 15.482157230377197 }, { "epoch": 14, "train_loss": 1.5789134158706666, "train_acc": 0.56262, "test_loss": 3.108631703567505, "test_acc": 0.3341, "lyapunov": null, "grad_norm": 1.5815496416496932, "grad_max_sv": 0.7780330538749695, "grad_min_sv": 3.0241727028840204e-08, "grad_condition": 121072879.52128251, "lr": 0.0009786597487660333, "time_sec": 15.469743490219116 }, { "epoch": 15, "train_loss": 1.5213708932495118, "train_acc": 0.57622, "test_loss": 2.1178235721588137, "test_acc": 0.4665, "lyapunov": null, "grad_norm": 1.5137971406754955, "grad_max_sv": 0.7158914238214493, "grad_min_sv": 2.8684351333074785e-08, "grad_condition": 31997486.936446648, "lr": 0.0009755282581475766, "time_sec": 15.4898362159729 }, { "epoch": 16, "train_loss": 1.466670620689392, "train_acc": 0.58748, "test_loss": 1.9707215017318727, "test_acc": 0.4909, "lyapunov": null, "grad_norm": 1.4598686481318373, "grad_max_sv": 0.6799994811415673, "grad_min_sv": 2.748090726922836e-08, "grad_condition": 67712877.74998799, "lr": 0.0009721881851187403, "time_sec": 15.463284254074097 }, { "epoch": 17, "train_loss": 1.4266776397705079, "train_acc": 0.60022, "test_loss": 1.9578287740707399, "test_acc": 0.496, "lyapunov": null, "grad_norm": 1.4163199382153222, "grad_max_sv": 0.6607045501470565, "grad_min_sv": 2.6701706835885463e-08, "grad_condition": 69925020.646238, "lr": 0.0009686409947459456, "time_sec": 15.465324878692627 }, { "epoch": 18, "train_loss": 1.3868621417999267, "train_acc": 0.61008, "test_loss": 1.8873281810760498, "test_acc": 0.5122, "lyapunov": null, "grad_norm": 1.3780415134056272, "grad_max_sv": 0.6475953251123429, "grad_min_sv": 2.629753427935144e-08, "grad_condition": 71849203.49105962, "lr": 0.0009648882429441254, "time_sec": 15.476778745651245 }, { "epoch": 19, "train_loss": 1.3300997947692872, "train_acc": 0.6208, "test_loss": 1.8625336185455321, "test_acc": 0.5163, "lyapunov": null, "grad_norm": 1.3376016965348547, "grad_max_sv": 0.6296016126871109, "grad_min_sv": 2.534474096427264e-08, "grad_condition": 40912774.4949669, "lr": 0.00096093157579425, "time_sec": 15.47281002998352 }, { "epoch": 20, "train_loss": 1.2915953662490844, "train_acc": 0.6313, "test_loss": 1.88144536113739, "test_acc": 0.5061, "lyapunov": null, "grad_norm": 1.3064427354934414, "grad_max_sv": 0.5868082754313946, "grad_min_sv": 2.44614505123808e-08, "grad_condition": 40190101.53190343, "lr": 0.0009567727288213001, "time_sec": 15.473944902420044 }, { "epoch": 21, "train_loss": 1.2615811933898926, "train_acc": 0.63936, "test_loss": 2.138494786453247, "test_acc": 0.4639, "lyapunov": null, "grad_norm": 1.2742362971746195, "grad_max_sv": 0.577499034255743, "grad_min_sv": 2.428454916880707e-08, "grad_condition": 34685614.15402056, "lr": 0.0009524135262330095, "time_sec": 15.476754188537598 }, { "epoch": 22, "train_loss": 1.2293620531463623, "train_acc": 0.6453, "test_loss": 1.8758944011688232, "test_acc": 0.5147, "lyapunov": null, "grad_norm": 1.252289309007294, "grad_max_sv": 0.570976011455059, "grad_min_sv": 2.3561374129510426e-08, "grad_condition": 48751943.11700691, "lr": 0.0009478558801197061, "time_sec": 15.473217487335205 }, { "epoch": 23, "train_loss": 1.1897959590911866, "train_acc": 0.65626, "test_loss": 1.8954246566772461, "test_acc": 0.5211, "lyapunov": null, "grad_norm": 1.2259155434497018, "grad_max_sv": 0.5599369831383229, "grad_min_sv": 2.2801355227530795e-08, "grad_condition": 52092903.5694242, "lr": 0.000943101789615607, "time_sec": 15.473440170288086 }, { "epoch": 24, "train_loss": 1.1551566465377807, "train_acc": 0.665, "test_loss": 1.896939277267456, "test_acc": 0.5226, "lyapunov": null, "grad_norm": 1.2022612803404449, "grad_max_sv": 0.5331769093871117, "grad_min_sv": 2.2077526620062348e-08, "grad_condition": 154376470.85049906, "lr": 0.0009381533400219313, "time_sec": 15.473422765731812 }, { "epoch": 25, "train_loss": 1.13716111492157, "train_acc": 0.66968, "test_loss": 1.9673876178741454, "test_acc": 0.5073, "lyapunov": null, "grad_norm": 1.1814644477570717, "grad_max_sv": 0.5192016668617725, "grad_min_sv": 2.207178118607267e-08, "grad_condition": 32052263.833083443, "lr": 0.0009330127018922189, "time_sec": 15.463173151016235 }, { "epoch": 26, "train_loss": 1.0986487645339966, "train_acc": 0.6787, "test_loss": 1.7822764610290527, "test_acc": 0.5433, "lyapunov": null, "grad_norm": 1.1543031476624748, "grad_max_sv": 0.5173374325037002, "grad_min_sv": 2.149504294557403e-08, "grad_condition": 47084637.545989394, "lr": 0.000927682130080253, "time_sec": 15.460694313049316 }, { "epoch": 27, "train_loss": 1.0663320102691651, "train_acc": 0.6865, "test_loss": 1.8293514751434325, "test_acc": 0.533, "lyapunov": null, "grad_norm": 1.1345054831803263, "grad_max_sv": 0.4966191992163658, "grad_min_sv": 2.08524984349201e-08, "grad_condition": 45914156.60470325, "lr": 0.0009221639627510072, "time_sec": 15.467730045318604 }, { "epoch": 28, "train_loss": 1.0501069176864624, "train_acc": 0.68934, "test_loss": 2.0238259536743164, "test_acc": 0.5084, "lyapunov": null, "grad_norm": 1.1176238593171397, "grad_max_sv": 0.489936176687479, "grad_min_sv": 2.0258219826652103e-08, "grad_condition": 52549899.42960344, "lr": 0.0009164606203550494, "time_sec": 15.526809692382812 }, { "epoch": 29, "train_loss": 1.0180758087921142, "train_acc": 0.69862, "test_loss": 1.8129717712402345, "test_acc": 0.5511, "lyapunov": null, "grad_norm": 1.0978329669563418, "grad_max_sv": 0.49835110902786256, "grad_min_sv": 2.0405637433853347e-08, "grad_condition": 716037506.8371468, "lr": 0.0009105746045668516, "time_sec": 15.492526054382324 }, { "epoch": 30, "train_loss": 0.9951805596923828, "train_acc": 0.7055, "test_loss": 1.746192921257019, "test_acc": 0.5623, "lyapunov": null, "grad_norm": 1.0796441895567979, "grad_max_sv": 0.47773563787341117, "grad_min_sv": 1.9923237732071692e-08, "grad_condition": 316108467.8828658, "lr": 0.0009045084971874733, "time_sec": 15.470518827438354 }, { "epoch": 31, "train_loss": 0.9780883857536316, "train_acc": 0.70904, "test_loss": 1.7732117160797118, "test_acc": 0.558, "lyapunov": null, "grad_norm": 1.0645091607080823, "grad_max_sv": 0.46556121930480004, "grad_min_sv": 1.9688543108527246e-08, "grad_condition": 174238515.18129045, "lr": 0.0008982649590120977, "time_sec": 15.477237224578857 }, { "epoch": 32, "train_loss": 0.9519822745513916, "train_acc": 0.71686, "test_loss": 1.7432144353866577, "test_acc": 0.5575, "lyapunov": null, "grad_norm": 1.0432923508174365, "grad_max_sv": 0.46001894399523735, "grad_min_sv": 1.928787157004508e-08, "grad_condition": 84996179.20525053, "lr": 0.0008918467286629196, "time_sec": 15.482601881027222 }, { "epoch": 33, "train_loss": 0.9250898433685303, "train_acc": 0.7218, "test_loss": 1.7904945095062257, "test_acc": 0.556, "lyapunov": null, "grad_norm": 1.0314496073989632, "grad_max_sv": 0.45169909074902537, "grad_min_sv": 1.9128463927403638e-08, "grad_condition": 68691111.76926772, "lr": 0.0008852566213878943, "time_sec": 15.519761800765991 }, { "epoch": 34, "train_loss": 0.9152010176086426, "train_acc": 0.72778, "test_loss": 1.835019757270813, "test_acc": 0.5553, "lyapunov": null, "grad_norm": 1.0226948793120243, "grad_max_sv": 0.44521483927965166, "grad_min_sv": 1.8672882064196816e-08, "grad_condition": 72631593.89558022, "lr": 0.000878497527825878, "time_sec": 15.492830753326416 }, { "epoch": 35, "train_loss": 0.8909054629325867, "train_acc": 0.72998, "test_loss": 1.8686577810287475, "test_acc": 0.5431, "lyapunov": null, "grad_norm": 1.0060209353905554, "grad_max_sv": 0.428337212651968, "grad_min_sv": 1.8221278065555514e-08, "grad_condition": 54925799.50217812, "lr": 0.000871572412738697, "time_sec": 15.495248556137085 }, { "epoch": 36, "train_loss": 0.8669569097518921, "train_acc": 0.7396, "test_loss": 1.8778275032043457, "test_acc": 0.5506, "lyapunov": null, "grad_norm": 0.9935254761598353, "grad_max_sv": 0.42610192447900774, "grad_min_sv": 1.789830566673034e-08, "grad_condition": 65521171.05971684, "lr": 0.0008644843137107055, "time_sec": 15.501812219619751 }, { "epoch": 37, "train_loss": 0.8407849538421631, "train_acc": 0.74404, "test_loss": 1.884768021965027, "test_acc": 0.5558, "lyapunov": null, "grad_norm": 0.983358047025113, "grad_max_sv": 0.429234990477562, "grad_min_sv": 1.8252723432699015e-08, "grad_condition": 312919609.17862236, "lr": 0.0008572363398164014, "time_sec": 15.485287427902222 }, { "epoch": 38, "train_loss": 0.8223714313125611, "train_acc": 0.74734, "test_loss": 1.8372897932052612, "test_acc": 0.5581, "lyapunov": null, "grad_norm": 0.9730686293969507, "grad_max_sv": 0.43215164765715597, "grad_min_sv": 1.805779136082597e-08, "grad_condition": 111631952.08398516, "lr": 0.0008498316702566826, "time_sec": 15.495893239974976 }, { "epoch": 39, "train_loss": 0.8224841629219055, "train_acc": 0.7495, "test_loss": 1.8123548791885375, "test_acc": 0.5623, "lyapunov": null, "grad_norm": 0.9689754376402935, "grad_max_sv": 0.41914472356438637, "grad_min_sv": 1.7533556316562392e-08, "grad_condition": 50149472.40203967, "lr": 0.0008422735529643442, "time_sec": 15.51100492477417 }, { "epoch": 40, "train_loss": 0.8005770356750488, "train_acc": 0.75588, "test_loss": 1.9014682191848755, "test_acc": 0.5541, "lyapunov": null, "grad_norm": 0.9508080469971997, "grad_max_sv": 0.42388487085700033, "grad_min_sv": 1.762832624032859e-08, "grad_condition": 346358468.0799734, "lr": 0.0008345653031794289, "time_sec": 15.498661279678345 }, { "epoch": 41, "train_loss": 0.7747948072814942, "train_acc": 0.76342, "test_loss": 1.8567888566970825, "test_acc": 0.5642, "lyapunov": null, "grad_norm": 0.9372391115065106, "grad_max_sv": 0.4081222198903561, "grad_min_sv": 1.7018125511580885e-08, "grad_condition": 61876276.47604829, "lr": 0.0008267103019950526, "time_sec": 15.5028657913208 }, { "epoch": 42, "train_loss": 0.7694620947647095, "train_acc": 0.76502, "test_loss": 1.8408411359786987, "test_acc": 0.5591, "lyapunov": null, "grad_norm": 0.9326717735984488, "grad_max_sv": 0.41085106804966925, "grad_min_sv": 1.7216302598821454e-08, "grad_condition": 43901470.16833824, "lr": 0.0008187119948743447, "time_sec": 15.496897459030151 }, { "epoch": 43, "train_loss": 0.7424543988418579, "train_acc": 0.77306, "test_loss": 1.809230382347107, "test_acc": 0.571, "lyapunov": null, "grad_norm": 0.9131307159835452, "grad_max_sv": 0.40560107976198195, "grad_min_sv": 1.6559755318563962e-08, "grad_condition": 374063353.4207941, "lr": 0.000810573890139155, "time_sec": 15.487475872039795 }, { "epoch": 44, "train_loss": 0.7239759206962585, "train_acc": 0.77538, "test_loss": 1.7808053987503052, "test_acc": 0.5793, "lyapunov": null, "grad_norm": 0.9060005234187932, "grad_max_sv": 0.39045327603816987, "grad_min_sv": 1.6347653778933656e-08, "grad_condition": 175023718.92676198, "lr": 0.0008022995574311873, "time_sec": 15.478513240814209 }, { "epoch": 45, "train_loss": 0.709962793712616, "train_acc": 0.77894, "test_loss": 1.9501771980285645, "test_acc": 0.5602, "lyapunov": null, "grad_norm": 0.8987907360568149, "grad_max_sv": 0.39080821722745895, "grad_min_sv": 1.634847552334229e-08, "grad_condition": 38169444.05614711, "lr": 0.0007938926261462363, "time_sec": 15.49375057220459 }, { "epoch": 46, "train_loss": 0.7000335352516174, "train_acc": 0.78202, "test_loss": 1.9276861065864563, "test_acc": 0.563, "lyapunov": null, "grad_norm": 0.8939654390908522, "grad_max_sv": 0.3900447376072407, "grad_min_sv": 1.6118415283213062e-08, "grad_condition": 201079781.287968, "lr": 0.0007853567838422158, "time_sec": 15.506261825561523 }, { "epoch": 47, "train_loss": 0.6843666355323792, "train_acc": 0.78712, "test_loss": 1.8863512687683106, "test_acc": 0.5648, "lyapunov": null, "grad_norm": 0.8860846821543104, "grad_max_sv": 0.38012751266360284, "grad_min_sv": 1.5984218158706515e-08, "grad_condition": 363331609.5318787, "lr": 0.0007766957746216719, "time_sec": 15.481945991516113 }, { "epoch": 48, "train_loss": 0.6651840719032288, "train_acc": 0.79232, "test_loss": 1.826128447341919, "test_acc": 0.5815, "lyapunov": null, "grad_norm": 0.8702032066364243, "grad_max_sv": 0.37026465982198714, "grad_min_sv": 1.544788876539638e-08, "grad_condition": 1805163796.8757565, "lr": 0.0007679133974894982, "time_sec": 15.52286958694458 }, { "epoch": 49, "train_loss": 0.6528418668937683, "train_acc": 0.79534, "test_loss": 1.8805492639541626, "test_acc": 0.5748, "lyapunov": null, "grad_norm": 0.8668040159369109, "grad_max_sv": 0.3801993615925312, "grad_min_sv": 1.5647269831914333e-08, "grad_condition": 52007972.99755625, "lr": 0.000759013504686565, "time_sec": 15.518036127090454 }, { "epoch": 50, "train_loss": 0.6436834973526001, "train_acc": 0.7997, "test_loss": 1.793442686843872, "test_acc": 0.5833, "lyapunov": null, "grad_norm": 0.8597198609492746, "grad_max_sv": 0.37670152857899664, "grad_min_sv": 1.5507358382387677e-08, "grad_condition": 427721692.1185082, "lr": 0.0007499999999999998, "time_sec": 15.534092426300049 }, { "epoch": 51, "train_loss": 0.6239418637657166, "train_acc": 0.80486, "test_loss": 1.9321050287246704, "test_acc": 0.5702, "lyapunov": null, "grad_norm": 0.8414343547264628, "grad_max_sv": 0.3712430141866207, "grad_min_sv": 1.5363422166663614e-08, "grad_condition": 365943262.8213007, "lr": 0.0007408768370508575, "time_sec": 15.527155876159668 }, { "epoch": 52, "train_loss": 0.6170344979095459, "train_acc": 0.80566, "test_loss": 1.7804856214523315, "test_acc": 0.588, "lyapunov": null, "grad_norm": 0.8457147724415158, "grad_max_sv": 0.36000491231679915, "grad_min_sv": 1.510340268962018e-08, "grad_condition": 55532260.257321715, "lr": 0.0007316480175599307, "time_sec": 15.508218765258789 }, { "epoch": 53, "train_loss": 0.6110373974990845, "train_acc": 0.8104, "test_loss": 2.008984780883789, "test_acc": 0.5633, "lyapunov": null, "grad_norm": 0.8288727311238714, "grad_max_sv": 0.3595147252082825, "grad_min_sv": 1.5030111735758744e-08, "grad_condition": 51249181.30750112, "lr": 0.0007223175895924635, "time_sec": 15.506837129592896 }, { "epoch": 54, "train_loss": 0.5891339810752869, "train_acc": 0.81566, "test_loss": 1.8466287677764892, "test_acc": 0.578, "lyapunov": null, "grad_norm": 0.8213597411734475, "grad_max_sv": 0.3565825395286083, "grad_min_sv": 1.4749719501978495e-08, "grad_condition": 570713779.6923382, "lr": 0.0007128896457825361, "time_sec": 15.501415491104126 }, { "epoch": 55, "train_loss": 0.5801966732025147, "train_acc": 0.81848, "test_loss": 1.8548430694580078, "test_acc": 0.5809, "lyapunov": null, "grad_norm": 0.815116092241223, "grad_max_sv": 0.36071729883551595, "grad_min_sv": 1.4880934259310642e-08, "grad_condition": 334242266.9087108, "lr": 0.0007033683215378998, "time_sec": 15.510899066925049 }, { "epoch": 56, "train_loss": 0.569889211063385, "train_acc": 0.82134, "test_loss": 1.8169442867279053, "test_acc": 0.5857, "lyapunov": null, "grad_norm": 0.8134294920256526, "grad_max_sv": 0.3643924631178379, "grad_min_sv": 1.5098616617734152e-08, "grad_condition": 592439727.9387308, "lr": 0.0006937577932260512, "time_sec": 15.496611595153809 }, { "epoch": 57, "train_loss": 0.5602374402427673, "train_acc": 0.82158, "test_loss": 1.915207731628418, "test_acc": 0.5802, "lyapunov": null, "grad_norm": 0.8103201963167868, "grad_max_sv": 0.3596944443881512, "grad_min_sv": 1.4392631711435122e-08, "grad_condition": 84052786.33799395, "lr": 0.0006840622763423388, "time_sec": 15.500912427902222 }, { "epoch": 58, "train_loss": 0.5363558686447144, "train_acc": 0.83006, "test_loss": 1.9087711734771728, "test_acc": 0.579, "lyapunov": null, "grad_norm": 0.7940934690943876, "grad_max_sv": 0.3485556967556477, "grad_min_sv": 1.4054249935363528e-08, "grad_condition": 99578456.52402398, "lr": 0.0006742860236609073, "time_sec": 15.499320268630981 }, { "epoch": 59, "train_loss": 0.5240596619415283, "train_acc": 0.83386, "test_loss": 1.8847876579284668, "test_acc": 0.5849, "lyapunov": null, "grad_norm": 0.7848942902344976, "grad_max_sv": 0.3444338757544756, "grad_min_sv": 1.4203639615807326e-08, "grad_condition": 1006017198.7685986, "lr": 0.0006644333233692913, "time_sec": 15.51360535621643 }, { "epoch": 60, "train_loss": 0.5250089431381225, "train_acc": 0.83314, "test_loss": 1.8497852947235107, "test_acc": 0.5934, "lyapunov": null, "grad_norm": 0.78894564972248, "grad_max_sv": 0.35073093622922896, "grad_min_sv": 1.3935465524236857e-08, "grad_condition": 88013656.03250492, "lr": 0.0006545084971874734, "time_sec": 15.508491516113281 }, { "epoch": 61, "train_loss": 0.5165614600944519, "train_acc": 0.83506, "test_loss": 1.8630810359954835, "test_acc": 0.5874, "lyapunov": null, "grad_norm": 0.7829768565092297, "grad_max_sv": 0.3336628802120686, "grad_min_sv": 1.3946549117481444e-08, "grad_condition": 180242934.78653836, "lr": 0.0006445158984722354, "time_sec": 15.503038167953491 }, { "epoch": 62, "train_loss": 0.500950801115036, "train_acc": 0.83966, "test_loss": 1.8171254947662354, "test_acc": 0.5999, "lyapunov": null, "grad_norm": 0.7677509624143988, "grad_max_sv": 0.3256234541535378, "grad_min_sv": 1.3750762319075793e-08, "grad_condition": 64445933.52390041, "lr": 0.0006344599103076324, "time_sec": 15.505617618560791 }, { "epoch": 63, "train_loss": 0.48925278188705446, "train_acc": 0.84414, "test_loss": 1.9641206827163695, "test_acc": 0.5824, "lyapunov": null, "grad_norm": 0.7625502199233959, "grad_max_sv": 0.3294233627617359, "grad_min_sv": 1.32725306221243e-08, "grad_condition": 1228963257.7671177, "lr": 0.0006243449435824269, "time_sec": 15.529828071594238 }, { "epoch": 64, "train_loss": 0.48350829057693484, "train_acc": 0.84334, "test_loss": 1.9596610692977905, "test_acc": 0.5774, "lyapunov": null, "grad_norm": 0.7632750006619222, "grad_max_sv": 0.3282707162201405, "grad_min_sv": 1.3222439235009708e-08, "grad_condition": 124220191.9706742, "lr": 0.0006141754350553275, "time_sec": 15.521306037902832 }, { "epoch": 65, "train_loss": 0.4709274704360962, "train_acc": 0.84992, "test_loss": 1.8849371217727662, "test_acc": 0.5929, "lyapunov": null, "grad_norm": 0.7514320426924211, "grad_max_sv": 0.3312883138656616, "grad_min_sv": 1.352077347374636e-08, "grad_condition": 135157839.23060852, "lr": 0.0006039558454088793, "time_sec": 15.500089168548584 }, { "epoch": 66, "train_loss": 0.4579773247909546, "train_acc": 0.85246, "test_loss": 1.9383041584968568, "test_acc": 0.5795, "lyapunov": null, "grad_norm": 0.7398296341112965, "grad_max_sv": 0.32728378027677535, "grad_min_sv": 1.3280565344621006e-08, "grad_condition": 870917269.6899513, "lr": 0.000593690657292862, "time_sec": 15.498245477676392 }, { "epoch": 67, "train_loss": 0.4509772509765625, "train_acc": 0.85632, "test_loss": 1.9290270626068116, "test_acc": 0.5832, "lyapunov": null, "grad_norm": 0.733532607565585, "grad_max_sv": 0.3176191322505474, "grad_min_sv": 1.2820620155827924e-08, "grad_condition": 563528143.6689861, "lr": 0.0005833843733580507, "time_sec": 15.513327360153198 }, { "epoch": 68, "train_loss": 0.44296426357269286, "train_acc": 0.85874, "test_loss": 1.9557575977325439, "test_acc": 0.5895, "lyapunov": null, "grad_norm": 0.7313567414469692, "grad_max_sv": 0.3311334565281868, "grad_min_sv": 1.299003317134506e-08, "grad_condition": 57636313.192167915, "lr": 0.0005730415142812054, "time_sec": 15.521730422973633 }, { "epoch": 69, "train_loss": 0.43896515016555787, "train_acc": 0.85892, "test_loss": 1.960878660583496, "test_acc": 0.5868, "lyapunov": null, "grad_norm": 0.7340093422433535, "grad_max_sv": 0.3193955574184656, "grad_min_sv": 1.2791151784291576e-08, "grad_condition": 100597916.68063782, "lr": 0.0005626666167821517, "time_sec": 15.51311707496643 }, { "epoch": 70, "train_loss": 0.4285468480491638, "train_acc": 0.86298, "test_loss": 1.9584955738067626, "test_acc": 0.591, "lyapunov": null, "grad_norm": 0.7244061253185728, "grad_max_sv": 0.31838734485208986, "grad_min_sv": 1.2623370689458097e-08, "grad_condition": 256671325.86986813, "lr": 0.0005522642316338265, "time_sec": 15.545679569244385 }, { "epoch": 71, "train_loss": 0.4232082028102875, "train_acc": 0.863, "test_loss": 1.9168709438323974, "test_acc": 0.5946, "lyapunov": null, "grad_norm": 0.7235116987420683, "grad_max_sv": 0.3361910209059715, "grad_min_sv": 1.3065330882943912e-08, "grad_condition": 539616293.1861387, "lr": 0.0005418389216661573, "time_sec": 15.529778480529785 }, { "epoch": 72, "train_loss": 0.40893464082717895, "train_acc": 0.8671, "test_loss": 1.9778603734970093, "test_acc": 0.5917, "lyapunov": null, "grad_norm": 0.7120788606908913, "grad_max_sv": 0.3133332245051861, "grad_min_sv": 1.2864244934573943e-08, "grad_condition": 599875620.9980721, "lr": 0.0005313952597646563, "time_sec": 15.501370429992676 }, { "epoch": 73, "train_loss": 0.4073019913864136, "train_acc": 0.86922, "test_loss": 1.8993178993225097, "test_acc": 0.6036, "lyapunov": null, "grad_norm": 0.7054800561985982, "grad_max_sv": 0.32210378982126714, "grad_min_sv": 1.2598049555162874e-08, "grad_condition": 609078116.1228421, "lr": 0.0005209378268645994, "time_sec": 15.514087915420532 }, { "epoch": 74, "train_loss": 0.38610194705963136, "train_acc": 0.87514, "test_loss": 1.9717372917175293, "test_acc": 0.5877, "lyapunov": null, "grad_norm": 0.6876754791376803, "grad_max_sv": 0.30587312653660775, "grad_min_sv": 1.228859272620758e-08, "grad_condition": 287047740.76686746, "lr": 0.0005104712099416781, "time_sec": 15.521286249160767 }, { "epoch": 75, "train_loss": 0.38415311262130736, "train_acc": 0.87532, "test_loss": 1.9978297256469726, "test_acc": 0.5873, "lyapunov": null, "grad_norm": 0.6901352414114731, "grad_max_sv": 0.30640832521021366, "grad_min_sv": 1.2382189768650464e-08, "grad_condition": 89574244.76284985, "lr": 0.0004999999999999996, "time_sec": 15.522554159164429 }, { "epoch": 76, "train_loss": 0.38036803808212283, "train_acc": 0.87676, "test_loss": 1.9114773050308227, "test_acc": 0.5941, "lyapunov": null, "grad_norm": 0.6862042555811976, "grad_max_sv": 0.30668022595345973, "grad_min_sv": 1.2098685775799311e-08, "grad_condition": 79753720.75813168, "lr": 0.0004895287900583212, "time_sec": 15.500049591064453 }, { "epoch": 77, "train_loss": 0.37699529049873354, "train_acc": 0.8755, "test_loss": 1.9144949556350708, "test_acc": 0.6035, "lyapunov": null, "grad_norm": 0.6869175270134545, "grad_max_sv": 0.30233032815158367, "grad_min_sv": 1.210133520196388e-08, "grad_condition": 86138637.5204114, "lr": 0.0004790621731353997, "time_sec": 15.553943395614624 }, { "epoch": 78, "train_loss": 0.3636139490318298, "train_acc": 0.88226, "test_loss": 1.9924920860290527, "test_acc": 0.5927, "lyapunov": null, "grad_norm": 0.6711688569608495, "grad_max_sv": 0.29902654588222505, "grad_min_sv": 1.1863716191731766e-08, "grad_condition": 88817475.8392382, "lr": 0.000468604740235343, "time_sec": 15.530450820922852 }, { "epoch": 79, "train_loss": 0.362152115983963, "train_acc": 0.88426, "test_loss": 1.924188154411316, "test_acc": 0.598, "lyapunov": null, "grad_norm": 0.6714773282743005, "grad_max_sv": 0.29965595006942747, "grad_min_sv": 1.1964831648906583e-08, "grad_condition": 902616195.7149051, "lr": 0.00045816107833384175, "time_sec": 15.498046636581421 }, { "epoch": 80, "train_loss": 0.35668459805488584, "train_acc": 0.88318, "test_loss": 1.9200622287750244, "test_acc": 0.5961, "lyapunov": null, "grad_norm": 0.6691406173146984, "grad_max_sv": 0.30350013412535193, "grad_min_sv": 1.2079031691623194e-08, "grad_condition": 208431932.92374653, "lr": 0.0004477357683661729, "time_sec": 15.500086307525635 }, { "epoch": 81, "train_loss": 0.3465567926597595, "train_acc": 0.88642, "test_loss": 1.9750726140975952, "test_acc": 0.5909, "lyapunov": null, "grad_norm": 0.6600906573823067, "grad_max_sv": 0.3025949317961931, "grad_min_sv": 1.1841972132921319e-08, "grad_condition": 833170767.4888487, "lr": 0.00043733338321784746, "time_sec": 15.528315544128418 }, { "epoch": 82, "train_loss": 0.3412511627674103, "train_acc": 0.88932, "test_loss": 1.9702592422485352, "test_acc": 0.5983, "lyapunov": null, "grad_norm": 0.6534470838362898, "grad_max_sv": 0.281625871360302, "grad_min_sv": 1.1298424867564605e-08, "grad_condition": 245256269.73618746, "lr": 0.0004269584857187939, "time_sec": 15.54018759727478 }, { "epoch": 83, "train_loss": 0.32986866790771485, "train_acc": 0.89278, "test_loss": 1.9833718214035034, "test_acc": 0.5983, "lyapunov": null, "grad_norm": 0.6472964118800569, "grad_max_sv": 0.2898814812302589, "grad_min_sv": 1.1219894397937468e-08, "grad_condition": 67348047.22944725, "lr": 0.0004166156266419484, "time_sec": 15.523268938064575 }, { "epoch": 84, "train_loss": 0.32046857831954956, "train_acc": 0.89464, "test_loss": 1.9931445137023927, "test_acc": 0.5976, "lyapunov": null, "grad_norm": 0.6387491891164032, "grad_max_sv": 0.2859178498387337, "grad_min_sv": 1.1112689026274158e-08, "grad_condition": 532191414.5407898, "lr": 0.0004063093427071373, "time_sec": 15.5046226978302 }, { "epoch": 85, "train_loss": 0.31971281969070436, "train_acc": 0.89616, "test_loss": 1.919898393058777, "test_acc": 0.6034, "lyapunov": null, "grad_norm": 0.6349502290101287, "grad_max_sv": 0.2895286176353693, "grad_min_sv": 1.114760893840749e-08, "grad_condition": 1708507357.4309907, "lr": 0.0003960441545911199, "time_sec": 15.50874662399292 }, { "epoch": 86, "train_loss": 0.314735742893219, "train_acc": 0.89802, "test_loss": 1.9826490537643433, "test_acc": 0.6039, "lyapunov": null, "grad_norm": 0.6374095409599659, "grad_max_sv": 0.29547037966549394, "grad_min_sv": 1.1427597929134642e-08, "grad_condition": 249196257.17434186, "lr": 0.0003858245649446718, "time_sec": 15.518042802810669 }, { "epoch": 87, "train_loss": 0.3056777443599701, "train_acc": 0.90104, "test_loss": 2.015980870628357, "test_acc": 0.5982, "lyapunov": null, "grad_norm": 0.6267239770409858, "grad_max_sv": 0.29190454818308353, "grad_min_sv": 1.1234584110458944e-08, "grad_condition": 1983104332.2605565, "lr": 0.00037565505641757235, "time_sec": 15.49971318244934 }, { "epoch": 88, "train_loss": 0.3044772444725037, "train_acc": 0.90106, "test_loss": 2.005346726799011, "test_acc": 0.6026, "lyapunov": null, "grad_norm": 0.6293105806437898, "grad_max_sv": 0.2927882194519043, "grad_min_sv": 1.12210154674941e-08, "grad_condition": 178904778.3418693, "lr": 0.00036554008969236695, "time_sec": 15.495405673980713 }, { "epoch": 89, "train_loss": 0.30109511434555053, "train_acc": 0.90188, "test_loss": 1.998448072052002, "test_acc": 0.6034, "lyapunov": null, "grad_norm": 0.6266125109308321, "grad_max_sv": 0.29103793352842333, "grad_min_sv": 1.1148633635108679e-08, "grad_condition": 893976917.5132227, "lr": 0.0003554841015277638, "time_sec": 15.50434947013855 }, { "epoch": 90, "train_loss": 0.28917674076080324, "train_acc": 0.90682, "test_loss": 1.9980867877960204, "test_acc": 0.6012, "lyapunov": null, "grad_norm": 0.6127659289231001, "grad_max_sv": 0.29112574011087416, "grad_min_sv": 1.1166155032202307e-08, "grad_condition": 348701496.86000526, "lr": 0.000345491502812526, "time_sec": 15.520820617675781 }, { "epoch": 91, "train_loss": 0.2823534561729431, "train_acc": 0.90822, "test_loss": 1.9809785503387451, "test_acc": 0.6052, "lyapunov": null, "grad_norm": 0.606268342013339, "grad_max_sv": 0.27696173191070556, "grad_min_sv": 1.0846671113454859e-08, "grad_condition": 248996494.78191227, "lr": 0.0003355666766307081, "time_sec": 15.745567321777344 }, { "epoch": 92, "train_loss": 0.28228991139411924, "train_acc": 0.91008, "test_loss": 2.0131442947387694, "test_acc": 0.6001, "lyapunov": null, "grad_norm": 0.6064057382091922, "grad_max_sv": 0.277644307166338, "grad_min_sv": 1.0798128024722132e-08, "grad_condition": 406311701.1258798, "lr": 0.00032571397633909225, "time_sec": 15.527170181274414 }, { "epoch": 93, "train_loss": 0.2772208102607727, "train_acc": 0.91184, "test_loss": 2.0510717596054078, "test_acc": 0.5952, "lyapunov": null, "grad_norm": 0.603398829043512, "grad_max_sv": 0.2785311110317707, "grad_min_sv": 1.0620686785936529e-08, "grad_condition": 159246942.28978306, "lr": 0.00031593772365766094, "time_sec": 15.521395206451416 }, { "epoch": 94, "train_loss": 0.2721544520187378, "train_acc": 0.91266, "test_loss": 2.044207299041748, "test_acc": 0.5963, "lyapunov": null, "grad_norm": 0.597776334868791, "grad_max_sv": 0.2813128184527159, "grad_min_sv": 1.032634765595758e-08, "grad_condition": 320344963.9972409, "lr": 0.0003062422067739483, "time_sec": 15.535969257354736 }, { "epoch": 95, "train_loss": 0.2562399788665771, "train_acc": 0.91636, "test_loss": 2.1072509820938112, "test_acc": 0.5953, "lyapunov": null, "grad_norm": 0.5775561165196347, "grad_max_sv": 0.27824114337563516, "grad_min_sv": 1.0481623234420353e-08, "grad_condition": 474004359.26671135, "lr": 0.00029663167846209965, "time_sec": 15.517311334609985 }, { "epoch": 96, "train_loss": 0.2625131010723114, "train_acc": 0.9142, "test_loss": 2.035417915725708, "test_acc": 0.604, "lyapunov": null, "grad_norm": 0.5877203581399221, "grad_max_sv": 0.28129979483783246, "grad_min_sv": 1.0502568877773787e-08, "grad_condition": 177356414.63757357, "lr": 0.00028711035421746345, "time_sec": 15.521276950836182 }, { "epoch": 97, "train_loss": 0.2552481310462952, "train_acc": 0.9173, "test_loss": 1.9491484304428102, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.5816116237706002, "grad_max_sv": 0.27597419619560243, "grad_min_sv": 1.0369440153409904e-08, "grad_condition": 153072053.30610082, "lr": 0.00027768241040753615, "time_sec": 15.518199920654297 }, { "epoch": 98, "train_loss": 0.2514290081501007, "train_acc": 0.91774, "test_loss": 1.9556513019561768, "test_acc": 0.6144, "lyapunov": null, "grad_norm": 0.5786453355425705, "grad_max_sv": 0.25863444767892363, "grad_min_sv": 9.982682687079137e-09, "grad_condition": 323898207.1043015, "lr": 0.00026835198244006903, "time_sec": 15.518558025360107 }, { "epoch": 99, "train_loss": 0.24542429465293883, "train_acc": 0.92078, "test_loss": 2.0414382596969602, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.5720561260068352, "grad_max_sv": 0.2730622936040163, "grad_min_sv": 1.0236981595745931e-08, "grad_condition": 73009111.50173582, "lr": 0.0002591231629491421, "time_sec": 15.516184568405151 }, { "epoch": 100, "train_loss": 0.2419339677333832, "train_acc": 0.92168, "test_loss": 2.0001620481491087, "test_acc": 0.615, "lyapunov": null, "grad_norm": 0.5656963959074934, "grad_max_sv": 0.2690838035196066, "grad_min_sv": 1.0369351413283546e-08, "grad_condition": 325100290.9819474, "lr": 0.0002499999999999997, "time_sec": 15.516221761703491 }, { "epoch": 101, "train_loss": 0.23517837069511413, "train_acc": 0.92362, "test_loss": 2.0624069427490235, "test_acc": 0.6006, "lyapunov": null, "grad_norm": 0.5588551885657764, "grad_max_sv": 0.26636214926838875, "grad_min_sv": 9.985110372735806e-09, "grad_condition": 152593330.29256034, "lr": 0.00024098649531343477, "time_sec": 15.525659799575806 }, { "epoch": 102, "train_loss": 0.23243571233749388, "train_acc": 0.92494, "test_loss": 2.050922277832031, "test_acc": 0.6071, "lyapunov": null, "grad_norm": 0.555094837720988, "grad_max_sv": 0.2671301085501909, "grad_min_sv": 9.489460735148495e-09, "grad_condition": 975172257.3566437, "lr": 0.0002320866025105016, "time_sec": 15.512139797210693 }, { "epoch": 103, "train_loss": 0.22915385756969453, "train_acc": 0.92618, "test_loss": 2.0090701560974122, "test_acc": 0.6102, "lyapunov": null, "grad_norm": 0.551643622576711, "grad_max_sv": 0.26358814239501954, "grad_min_sv": 9.903819275135706e-09, "grad_condition": 8450881945.308035, "lr": 0.0002233042253783278, "time_sec": 15.51590085029602 }, { "epoch": 104, "train_loss": 0.22301624965667724, "train_acc": 0.929, "test_loss": 2.0414324163436888, "test_acc": 0.6097, "lyapunov": null, "grad_norm": 0.547361757777093, "grad_max_sv": 0.2635317210108042, "grad_min_sv": 9.868235632663237e-09, "grad_condition": 918464158.4766433, "lr": 0.000214643216157784, "time_sec": 15.517698764801025 }, { "epoch": 105, "train_loss": 0.21800282436847687, "train_acc": 0.92888, "test_loss": 2.006334408760071, "test_acc": 0.6108, "lyapunov": null, "grad_norm": 0.5441245707971135, "grad_max_sv": 0.2652390133589506, "grad_min_sv": 9.775255871067018e-09, "grad_condition": 1728037982.0008423, "lr": 0.00020610737385376332, "time_sec": 15.521651268005371 }, { "epoch": 106, "train_loss": 0.22170533905029297, "train_acc": 0.92766, "test_loss": 2.0015246070861816, "test_acc": 0.6151, "lyapunov": null, "grad_norm": 0.5504732473005655, "grad_max_sv": 0.2658932194113731, "grad_min_sv": 9.836566865553675e-09, "grad_condition": 187622343.96039546, "lr": 0.00019770044256881242, "time_sec": 15.52303409576416 }, { "epoch": 107, "train_loss": 0.21625425663948059, "train_acc": 0.92998, "test_loss": 2.0188750885009767, "test_acc": 0.6132, "lyapunov": null, "grad_norm": 0.5416895117176501, "grad_max_sv": 0.25219607427716256, "grad_min_sv": 9.366761803773077e-09, "grad_condition": 260260509.50687146, "lr": 0.0001894261098608447, "time_sec": 15.538499593734741 }, { "epoch": 108, "train_loss": 0.20747127439498902, "train_acc": 0.93344, "test_loss": 1.992410384941101, "test_acc": 0.6181, "lyapunov": null, "grad_norm": 0.5312872760984289, "grad_max_sv": 0.26626099497079847, "grad_min_sv": 9.742697032379816e-09, "grad_condition": 241868081.8815055, "lr": 0.000181288005125655, "time_sec": 15.520596027374268 }, { "epoch": 109, "train_loss": 0.21061437376976014, "train_acc": 0.93212, "test_loss": 2.0430712549209593, "test_acc": 0.6121, "lyapunov": null, "grad_norm": 0.53793437376293, "grad_max_sv": 0.26196735054254533, "grad_min_sv": 9.911649283440849e-09, "grad_condition": 196778424.3729182, "lr": 0.0001732896980049473, "time_sec": 15.514817953109741 }, { "epoch": 110, "train_loss": 0.20801750651359557, "train_acc": 0.93272, "test_loss": 2.0129987867355346, "test_acc": 0.6136, "lyapunov": null, "grad_norm": 0.5345111757966097, "grad_max_sv": 0.2620788164436817, "grad_min_sv": 9.685049608479378e-09, "grad_condition": 442982408.6181739, "lr": 0.00016543469682057076, "time_sec": 15.524093389511108 }, { "epoch": 111, "train_loss": 0.20387941056251527, "train_acc": 0.93432, "test_loss": 2.017576940536499, "test_acc": 0.6171, "lyapunov": null, "grad_norm": 0.5265383831682404, "grad_max_sv": 0.2475517351180315, "grad_min_sv": 9.334722057222771e-09, "grad_condition": 520706944.53767884, "lr": 0.00015772644703565552, "time_sec": 15.520273685455322 }, { "epoch": 112, "train_loss": 0.20065601328372956, "train_acc": 0.93514, "test_loss": 2.0878772733688353, "test_acc": 0.6091, "lyapunov": null, "grad_norm": 0.5235410807678327, "grad_max_sv": 0.2556714225560427, "grad_min_sv": 9.592023909182901e-09, "grad_condition": 295083197.1946956, "lr": 0.00015016832974331713, "time_sec": 15.510764837265015 }, { "epoch": 113, "train_loss": 0.1982079153442383, "train_acc": 0.93612, "test_loss": 2.047266570854187, "test_acc": 0.6181, "lyapunov": null, "grad_norm": 0.5197176578777744, "grad_max_sv": 0.25255175642669203, "grad_min_sv": 9.308845385150311e-09, "grad_condition": 520055211.6428779, "lr": 0.00014276366018359834, "time_sec": 15.705829381942749 }, { "epoch": 114, "train_loss": 0.19655517510414122, "train_acc": 0.93708, "test_loss": 2.0292094760894774, "test_acc": 0.6144, "lyapunov": null, "grad_norm": 0.5181527372855724, "grad_max_sv": 0.25922506861388683, "grad_min_sv": 9.507550523431274e-09, "grad_condition": 332806274.6985155, "lr": 0.00013551568628929425, "time_sec": 15.525954723358154 }, { "epoch": 115, "train_loss": 0.18803977591514587, "train_acc": 0.93928, "test_loss": 2.0187850973129273, "test_acc": 0.6152, "lyapunov": null, "grad_norm": 0.5114058292617459, "grad_max_sv": 0.2462628223001957, "grad_min_sv": 9.353905294090265e-09, "grad_condition": 1483441837.69936, "lr": 0.00012842758726130276, "time_sec": 15.518154859542847 }, { "epoch": 116, "train_loss": 0.18797869988918303, "train_acc": 0.93912, "test_loss": 2.084369885826111, "test_acc": 0.6095, "lyapunov": null, "grad_norm": 0.5077819115434521, "grad_max_sv": 0.25109760873019693, "grad_min_sv": 8.964496494212256e-09, "grad_condition": 298276978.79912215, "lr": 0.0001215024721741218, "time_sec": 15.520355939865112 }, { "epoch": 117, "train_loss": 0.18214592965126036, "train_acc": 0.94196, "test_loss": 2.034072047996521, "test_acc": 0.6169, "lyapunov": null, "grad_norm": 0.49960618612788865, "grad_max_sv": 0.25671581737697124, "grad_min_sv": 9.445877218535077e-09, "grad_condition": 1803107586.0713096, "lr": 0.00011474337861210538, "time_sec": 15.5315523147583 }, { "epoch": 118, "train_loss": 0.18415243848800658, "train_acc": 0.93992, "test_loss": 2.082629474067688, "test_acc": 0.6147, "lyapunov": null, "grad_norm": 0.5036047735021936, "grad_max_sv": 0.24121248573064805, "grad_min_sv": 8.989532489320911e-09, "grad_condition": 1883514828.3661075, "lr": 0.00010815327133708009, "time_sec": 15.565385580062866 }, { "epoch": 119, "train_loss": 0.18069743538856506, "train_acc": 0.94234, "test_loss": 2.0749569414138795, "test_acc": 0.6104, "lyapunov": null, "grad_norm": 0.4967845602516186, "grad_max_sv": 0.24950436390936376, "grad_min_sv": 9.221202780431564e-09, "grad_condition": 275651167.2776666, "lr": 0.00010173504098790182, "time_sec": 15.531636476516724 }, { "epoch": 120, "train_loss": 0.1800184269142151, "train_acc": 0.9418, "test_loss": 2.063923722267151, "test_acc": 0.6149, "lyapunov": null, "grad_norm": 0.5000634640274525, "grad_max_sv": 0.2467968337237835, "grad_min_sv": 9.10186292138633e-09, "grad_condition": 420120780.22859687, "lr": 9.549150281252629e-05, "time_sec": 15.545646905899048 }, { "epoch": 121, "train_loss": 0.1746319353055954, "train_acc": 0.94524, "test_loss": 2.031014646720886, "test_acc": 0.6202, "lyapunov": null, "grad_norm": 0.4894634649372604, "grad_max_sv": 0.24847413785755634, "grad_min_sv": 9.111916768203901e-09, "grad_condition": 529933823.1357336, "lr": 8.942539543314794e-05, "time_sec": 15.525688648223877 }, { "epoch": 122, "train_loss": 0.1720413486146927, "train_acc": 0.94558, "test_loss": 2.0709302186965943, "test_acc": 0.6107, "lyapunov": null, "grad_norm": 0.4872422158802626, "grad_max_sv": 0.25410806462168695, "grad_min_sv": 9.372779969513134e-09, "grad_condition": 129683199.58735898, "lr": 8.353937964495024e-05, "time_sec": 15.53614616394043 }, { "epoch": 123, "train_loss": 0.167387109708786, "train_acc": 0.94716, "test_loss": 2.04781618976593, "test_acc": 0.621, "lyapunov": null, "grad_norm": 0.47867845277837057, "grad_max_sv": 0.24308387711644172, "grad_min_sv": 8.83432009590561e-09, "grad_condition": 446940201.78913987, "lr": 7.783603724899243e-05, "time_sec": 15.534965991973877 }, { "epoch": 124, "train_loss": 0.17369194811820984, "train_acc": 0.9434, "test_loss": 2.080777750968933, "test_acc": 0.6137, "lyapunov": null, "grad_norm": 0.4915299120514337, "grad_max_sv": 0.24491641744971276, "grad_min_sv": 8.973002642667129e-09, "grad_condition": 968560910.7177868, "lr": 7.231786991974666e-05, "time_sec": 15.534366130828857 }, { "epoch": 125, "train_loss": 0.17029917016983032, "train_acc": 0.94574, "test_loss": 2.0687435190200807, "test_acc": 0.6157, "lyapunov": null, "grad_norm": 0.4850020461380622, "grad_max_sv": 0.24593175910413265, "grad_min_sv": 8.810581337420631e-09, "grad_condition": 165938611.54228717, "lr": 6.698729810778072e-05, "time_sec": 15.55061674118042 }, { "epoch": 126, "train_loss": 0.1665445522928238, "train_acc": 0.94674, "test_loss": 2.0515053030014037, "test_acc": 0.6187, "lyapunov": null, "grad_norm": 0.48056912270271285, "grad_max_sv": 0.23969021812081337, "grad_min_sv": 8.827286746693327e-09, "grad_condition": 1743247825.2921212, "lr": 6.184665997806817e-05, "time_sec": 15.531169652938843 }, { "epoch": 127, "train_loss": 0.16487963933944702, "train_acc": 0.94836, "test_loss": 2.033387902641296, "test_acc": 0.6198, "lyapunov": null, "grad_norm": 0.47729941792361885, "grad_max_sv": 0.2343486487865448, "grad_min_sv": 8.995271932876748e-09, "grad_condition": 606828641.3185183, "lr": 5.6898210384392595e-05, "time_sec": 15.539721250534058 }, { "epoch": 128, "train_loss": 0.16376567732810973, "train_acc": 0.94834, "test_loss": 2.0975912773132324, "test_acc": 0.6112, "lyapunov": null, "grad_norm": 0.47555669561822944, "grad_max_sv": 0.2403645869344473, "grad_min_sv": 8.86344721578395e-09, "grad_condition": 1871409158.001809, "lr": 5.214411988029363e-05, "time_sec": 15.523812055587769 }, { "epoch": 129, "train_loss": 0.16381013206005096, "train_acc": 0.94882, "test_loss": 2.0344886224746705, "test_acc": 0.6205, "lyapunov": null, "grad_norm": 0.47811068127125184, "grad_max_sv": 0.2321129973977804, "grad_min_sv": 8.809577021736195e-09, "grad_condition": 674841641.2549579, "lr": 4.7586473766990294e-05, "time_sec": 15.542162656784058 }, { "epoch": 130, "train_loss": 0.1587965604352951, "train_acc": 0.95018, "test_loss": 2.039856211090088, "test_acc": 0.6198, "lyapunov": null, "grad_norm": 0.46996704308372744, "grad_max_sv": 0.24367436692118644, "grad_min_sv": 8.878338260412334e-09, "grad_condition": 3107522776.3953853, "lr": 4.32272711786996e-05, "time_sec": 15.518379926681519 }, { "epoch": 131, "train_loss": 0.16415684640884398, "train_acc": 0.94804, "test_loss": 2.0716621114730835, "test_acc": 0.6177, "lyapunov": null, "grad_norm": 0.477860267933493, "grad_max_sv": 0.23813350014388562, "grad_min_sv": 8.676938825780134e-09, "grad_condition": 186204488.74284863, "lr": 3.906842420574966e-05, "time_sec": 15.52889084815979 }, { "epoch": 132, "train_loss": 0.1586827588367462, "train_acc": 0.94982, "test_loss": 2.053567728805542, "test_acc": 0.6199, "lyapunov": null, "grad_norm": 0.4697672382287586, "grad_max_sv": 0.2426899142563343, "grad_min_sv": 8.828440787385545e-09, "grad_condition": 1012659868.4686158, "lr": 3.5111757055874305e-05, "time_sec": 15.524049282073975 }, { "epoch": 133, "train_loss": 0.15553737973690032, "train_acc": 0.95082, "test_loss": 2.043516174507141, "test_acc": 0.6191, "lyapunov": null, "grad_norm": 0.4649067986135626, "grad_max_sv": 0.24401309713721275, "grad_min_sv": 8.961552855574292e-09, "grad_condition": 1162757970.0586789, "lr": 3.1359005254054254e-05, "time_sec": 15.536059856414795 }, { "epoch": 134, "train_loss": 0.15784678574085237, "train_acc": 0.9499, "test_loss": 2.03684903011322, "test_acc": 0.6189, "lyapunov": null, "grad_norm": 0.4686730421924603, "grad_max_sv": 0.23595759123563767, "grad_min_sv": 8.586731024010303e-09, "grad_condition": 4315274102.848023, "lr": 2.7811814881259484e-05, "time_sec": 15.534076690673828 }, { "epoch": 135, "train_loss": 0.15442110489368438, "train_acc": 0.95192, "test_loss": 2.0882527042388914, "test_acc": 0.6147, "lyapunov": null, "grad_norm": 0.4615131055534514, "grad_max_sv": 0.2321950040757656, "grad_min_sv": 8.617836743177176e-09, "grad_condition": 99470014.62201284, "lr": 2.4471741852423218e-05, "time_sec": 15.554243803024292 }, { "epoch": 136, "train_loss": 0.15938658513069154, "train_acc": 0.95014, "test_loss": 2.0193495433807374, "test_acc": 0.619, "lyapunov": null, "grad_norm": 0.46997706784197274, "grad_max_sv": 0.24588101021945477, "grad_min_sv": 8.594699345537e-09, "grad_condition": 299854790.23102367, "lr": 2.1340251233966362e-05, "time_sec": 15.515581130981445 }, { "epoch": 137, "train_loss": 0.15305941107273102, "train_acc": 0.95102, "test_loss": 2.085107785606384, "test_acc": 0.6178, "lyapunov": null, "grad_norm": 0.4651082031381239, "grad_max_sv": 0.23546294569969178, "grad_min_sv": 8.641280193082048e-09, "grad_condition": 1355468630.1220336, "lr": 1.8418716601170932e-05, "time_sec": 15.523824691772461 }, { "epoch": 138, "train_loss": 0.15521952202796935, "train_acc": 0.95138, "test_loss": 2.05961570148468, "test_acc": 0.621, "lyapunov": null, "grad_norm": 0.4655707979434113, "grad_max_sv": 0.22249948792159557, "grad_min_sv": 8.559314398871517e-09, "grad_condition": 523110775.45855033, "lr": 1.570841943568445e-05, "time_sec": 15.527312755584717 }, { "epoch": 139, "train_loss": 0.15613153836250304, "train_acc": 0.94964, "test_loss": 2.0917256591796876, "test_acc": 0.6145, "lyapunov": null, "grad_norm": 0.4685524417915432, "grad_max_sv": 0.23622551932930946, "grad_min_sv": 8.448936071386512e-09, "grad_condition": 381309760.86173236, "lr": 1.3210548563419845e-05, "time_sec": 15.53156852722168 }, { "epoch": 140, "train_loss": 0.15750930822372436, "train_acc": 0.95076, "test_loss": 2.0336023241043093, "test_acc": 0.6231, "lyapunov": null, "grad_norm": 0.46956356170298885, "grad_max_sv": 0.24571651183068752, "grad_min_sv": 8.880518665268025e-09, "grad_condition": 446576930.15414965, "lr": 1.0926199633097203e-05, "time_sec": 15.513741731643677 }, { "epoch": 141, "train_loss": 0.15634389350891112, "train_acc": 0.95178, "test_loss": 2.0461313623428343, "test_acc": 0.6206, "lyapunov": null, "grad_norm": 0.4667179789960613, "grad_max_sv": 0.2333354063332081, "grad_min_sv": 8.735082636959725e-09, "grad_condition": 2773787337.949284, "lr": 8.856374635655688e-06, "time_sec": 15.527939558029175 }, { "epoch": 142, "train_loss": 0.1522996149158478, "train_acc": 0.95188, "test_loss": 2.036745939064026, "test_acc": 0.6191, "lyapunov": null, "grad_norm": 0.45971196350477606, "grad_max_sv": 0.23409303948283194, "grad_min_sv": 8.654798093845651e-09, "grad_condition": 899766914.5561358, "lr": 7.001981464747503e-06, "time_sec": 15.528279781341553 }, { "epoch": 143, "train_loss": 0.15602009796380997, "train_acc": 0.95086, "test_loss": 2.030546005439758, "test_acc": 0.6179, "lyapunov": null, "grad_norm": 0.46698211747670393, "grad_max_sv": 0.2427021000534296, "grad_min_sv": 8.880018779116672e-09, "grad_condition": 2005668849.0321355, "lr": 5.3638335185058295e-06, "time_sec": 15.519719362258911 }, { "epoch": 144, "train_loss": 0.15405357198238373, "train_acc": 0.95214, "test_loss": 2.0480900999069216, "test_acc": 0.6225, "lyapunov": null, "grad_norm": 0.4619783068969592, "grad_max_sv": 0.24754497669637204, "grad_min_sv": 9.022524723482569e-09, "grad_condition": 472769507.4774891, "lr": 3.942649342761114e-06, "time_sec": 15.538635015487671 }, { "epoch": 145, "train_loss": 0.15324831766605376, "train_acc": 0.95236, "test_loss": 2.0383225648880003, "test_acc": 0.6217, "lyapunov": null, "grad_norm": 0.46106192343039926, "grad_max_sv": 0.23626826107501983, "grad_min_sv": 8.604992432687843e-09, "grad_condition": 1211825093.7054877, "lr": 2.7390523158633524e-06, "time_sec": 15.542897939682007 }, { "epoch": 146, "train_loss": 0.15349729721069336, "train_acc": 0.9521, "test_loss": 2.0096838916778563, "test_acc": 0.6241, "lyapunov": null, "grad_norm": 0.4615822267692517, "grad_max_sv": 0.23966375291347503, "grad_min_sv": 8.838330253866516e-09, "grad_condition": 685922400.3184944, "lr": 1.7535703752478133e-06, "time_sec": 15.519303321838379 }, { "epoch": 147, "train_loss": 0.15039199693679808, "train_acc": 0.95362, "test_loss": 2.0573708726882933, "test_acc": 0.6207, "lyapunov": null, "grad_norm": 0.4572591547952713, "grad_max_sv": 0.2330123759806156, "grad_min_sv": 8.66143673887215e-09, "grad_condition": 1329748658.9084074, "lr": 9.866357858642196e-07, "time_sec": 15.523812532424927 }, { "epoch": 148, "train_loss": 0.15033800620317458, "train_acc": 0.95234, "test_loss": 2.0463861759185793, "test_acc": 0.6186, "lyapunov": null, "grad_norm": 0.45711357740306113, "grad_max_sv": 0.2265869051218033, "grad_min_sv": 8.489472146479878e-09, "grad_condition": 764759274.1337291, "lr": 4.38584950570808e-07, "time_sec": 15.51754641532898 }, { "epoch": 149, "train_loss": 0.15091258768081664, "train_acc": 0.95256, "test_loss": 2.0271072778701784, "test_acc": 0.6188, "lyapunov": null, "grad_norm": 0.4574063447607332, "grad_max_sv": 0.23711176067590714, "grad_min_sv": 8.619700593825432e-09, "grad_condition": 2609529945.0149875, "lr": 1.096582625772501e-07, "time_sec": 15.518434286117554 }, { "epoch": 150, "train_loss": 0.153145382938385, "train_acc": 0.95224, "test_loss": 2.03473729095459, "test_acc": 0.6182, "lyapunov": null, "grad_norm": 0.46046361312569684, "grad_max_sv": 0.22179042883217334, "grad_min_sv": 8.465783018335969e-09, "grad_condition": 1154619433.2746358, "lr": 0.0, "time_sec": 15.527158737182617 } ], "8": [ { "epoch": 1, "train_loss": 4.604280056762695, "train_acc": 0.06204, "test_loss": 4.320657266998291, "test_acc": 0.0698, "lyapunov": null, "grad_norm": 6.299548945029663, "grad_max_sv": 5.383423590660096, "grad_min_sv": 1.0969439819819016e-07, "grad_condition": 135387683.66756994, "lr": 0.0009998903417374227, "time_sec": 32.66659903526306 }, { "epoch": 2, "train_loss": 3.8911869562530517, "train_acc": 0.12252, "test_loss": 3.901215605163574, "test_acc": 0.1102, "lyapunov": null, "grad_norm": 4.7289084274834625, "grad_max_sv": 4.045294773578644, "grad_min_sv": 8.59628614957586e-08, "grad_condition": 54316925.08787592, "lr": 0.0009995614150494292, "time_sec": 32.55902910232544 }, { "epoch": 3, "train_loss": 3.5447918058776855, "train_acc": 0.16864, "test_loss": 3.5751065971374514, "test_acc": 0.1632, "lyapunov": null, "grad_norm": 3.9235192359291027, "grad_max_sv": 3.218869465589523, "grad_min_sv": 7.25899491738069e-08, "grad_condition": 59713400.674747445, "lr": 0.0009990133642141358, "time_sec": 32.56558012962341 }, { "epoch": 4, "train_loss": 3.285915934448242, "train_acc": 0.20564, "test_loss": 3.4154525535583495, "test_acc": 0.1808, "lyapunov": null, "grad_norm": 3.2931939429390655, "grad_max_sv": 2.48674353659153, "grad_min_sv": 6.094367343001394e-08, "grad_condition": 49578785.90593137, "lr": 0.0009982464296247522, "time_sec": 32.57981467247009 }, { "epoch": 5, "train_loss": 3.049801904296875, "train_acc": 0.2475, "test_loss": 3.380838261413574, "test_acc": 0.2067, "lyapunov": null, "grad_norm": 2.7585548587495836, "grad_max_sv": 1.9313260614871979, "grad_min_sv": 5.103909220399716e-08, "grad_condition": 117086071.43576927, "lr": 0.0009972609476841367, "time_sec": 32.564860582351685 }, { "epoch": 6, "train_loss": 2.861402225112915, "train_acc": 0.28052, "test_loss": 3.1182963836669924, "test_acc": 0.2393, "lyapunov": null, "grad_norm": 2.365169286939716, "grad_max_sv": 1.514634570479393, "grad_min_sv": 4.377452151871353e-08, "grad_condition": 42685906.70361744, "lr": 0.000996057350657239, "time_sec": 32.57882595062256 }, { "epoch": 7, "train_loss": 2.683069683303833, "train_acc": 0.31566, "test_loss": 2.857948400115967, "test_acc": 0.2899, "lyapunov": null, "grad_norm": 2.0678830204526424, "grad_max_sv": 1.2104690104722977, "grad_min_sv": 3.849874057187952e-08, "grad_condition": 83742051.18670955, "lr": 0.000994636166481494, "time_sec": 32.585235834121704 }, { "epoch": 8, "train_loss": 2.5299233337402343, "train_acc": 0.34444, "test_loss": 3.000171680831909, "test_acc": 0.2752, "lyapunov": null, "grad_norm": 1.874555701802065, "grad_max_sv": 1.0279113829135895, "grad_min_sv": 3.509024343872902e-08, "grad_condition": 55390142.1353655, "lr": 0.0009929980185352525, "time_sec": 32.69047737121582 }, { "epoch": 9, "train_loss": 2.4147268306732177, "train_acc": 0.3694, "test_loss": 2.543715224456787, "test_acc": 0.3455, "lyapunov": null, "grad_norm": 1.7485138229937156, "grad_max_sv": 0.9131708398461342, "grad_min_sv": 3.287046465294541e-08, "grad_condition": 39656658.27812234, "lr": 0.0009911436253643444, "time_sec": 32.57169961929321 }, { "epoch": 10, "train_loss": 2.2967233794403077, "train_acc": 0.39298, "test_loss": 2.6548849906921386, "test_acc": 0.3353, "lyapunov": null, "grad_norm": 1.6282804367899422, "grad_max_sv": 0.782713083922863, "grad_min_sv": 3.019940961190848e-08, "grad_condition": 36873848.007240444, "lr": 0.0009890738003669028, "time_sec": 32.577866077423096 }, { "epoch": 11, "train_loss": 2.192351549682617, "train_acc": 0.41852, "test_loss": 2.3893451919555666, "test_acc": 0.3824, "lyapunov": null, "grad_norm": 1.5518898048516216, "grad_max_sv": 0.7297310382127762, "grad_min_sv": 2.9274875311402494e-08, "grad_condition": 81724146.83842216, "lr": 0.00098678945143658, "time_sec": 32.599745750427246 }, { "epoch": 12, "train_loss": 2.117909373779297, "train_acc": 0.4337, "test_loss": 2.522136171722412, "test_acc": 0.3587, "lyapunov": null, "grad_norm": 1.4842631514558458, "grad_max_sv": 0.66500775963068, "grad_min_sv": 2.8010595395921988e-08, "grad_condition": 35670339.18143847, "lr": 0.0009842915805643154, "time_sec": 32.62933874130249 }, { "epoch": 13, "train_loss": 2.035253409576416, "train_acc": 0.45344, "test_loss": 2.391997838592529, "test_acc": 0.3805, "lyapunov": null, "grad_norm": 1.4422903854957079, "grad_max_sv": 0.6408356204628944, "grad_min_sv": 2.7295970482510425e-08, "grad_condition": 43720876.000019774, "lr": 0.000981581283398829, "time_sec": 32.557313442230225 }, { "epoch": 14, "train_loss": 1.9614996997451781, "train_acc": 0.46826, "test_loss": 2.3329195419311524, "test_acc": 0.4028, "lyapunov": null, "grad_norm": 1.3741944023253918, "grad_max_sv": 0.6013172835111618, "grad_min_sv": 2.5733794781213072e-08, "grad_condition": 36069642.478253104, "lr": 0.0009786597487660333, "time_sec": 32.58955407142639 }, { "epoch": 15, "train_loss": 1.8944761297988892, "train_acc": 0.48526, "test_loss": 2.2367286880493165, "test_acc": 0.4236, "lyapunov": null, "grad_norm": 1.3219592289498192, "grad_max_sv": 0.5812912411987782, "grad_min_sv": 2.4716666779944773e-08, "grad_condition": 29281331.50836698, "lr": 0.0009755282581475766, "time_sec": 32.56029748916626 }, { "epoch": 16, "train_loss": 1.8379625350189208, "train_acc": 0.49608, "test_loss": 2.1963637313842774, "test_acc": 0.4284, "lyapunov": null, "grad_norm": 1.2908175006695335, "grad_max_sv": 0.5532825239002704, "grad_min_sv": 2.4336655729539913e-08, "grad_condition": 42358304.72716427, "lr": 0.0009721881851187403, "time_sec": 32.54909014701843 }, { "epoch": 17, "train_loss": 1.7670473766326904, "train_acc": 0.51538, "test_loss": 2.1328998752593993, "test_acc": 0.4452, "lyapunov": null, "grad_norm": 1.2440997761596901, "grad_max_sv": 0.5198108039796352, "grad_min_sv": 2.3273317767413813e-08, "grad_condition": 35998824.48422967, "lr": 0.0009686409947459456, "time_sec": 32.55762696266174 }, { "epoch": 18, "train_loss": 1.7253368561553954, "train_acc": 0.52444, "test_loss": 2.245950330352783, "test_acc": 0.4284, "lyapunov": null, "grad_norm": 1.214902512911659, "grad_max_sv": 0.5048692628741265, "grad_min_sv": 2.2689030459988047e-08, "grad_condition": 49317544.599824145, "lr": 0.0009648882429441254, "time_sec": 32.5514817237854 }, { "epoch": 19, "train_loss": 1.6694325649261474, "train_acc": 0.5342, "test_loss": 2.19226961517334, "test_acc": 0.4387, "lyapunov": null, "grad_norm": 1.1750671216974986, "grad_max_sv": 0.4863507993519306, "grad_min_sv": 2.2075054092324244e-08, "grad_condition": 97502207.70501134, "lr": 0.00096093157579425, "time_sec": 32.55115628242493 }, { "epoch": 20, "train_loss": 1.617248278427124, "train_acc": 0.5473, "test_loss": 2.143247143173218, "test_acc": 0.453, "lyapunov": null, "grad_norm": 1.1445750522907119, "grad_max_sv": 0.4708236537873745, "grad_min_sv": 2.1383133666508236e-08, "grad_condition": 30242603.347623855, "lr": 0.0009567727288213001, "time_sec": 32.56135654449463 }, { "epoch": 21, "train_loss": 1.5802922723007202, "train_acc": 0.557, "test_loss": 2.0990093154907226, "test_acc": 0.4651, "lyapunov": null, "grad_norm": 1.1146123139527973, "grad_max_sv": 0.45539517551660535, "grad_min_sv": 2.1216313506045025e-08, "grad_condition": 32120917.787080377, "lr": 0.0009524135262330095, "time_sec": 32.58874869346619 }, { "epoch": 22, "train_loss": 1.540067174949646, "train_acc": 0.56592, "test_loss": 2.0439955375671386, "test_acc": 0.4707, "lyapunov": null, "grad_norm": 1.0888616623198637, "grad_max_sv": 0.43293082937598226, "grad_min_sv": 2.0197447772596356e-08, "grad_condition": 51667507.409315005, "lr": 0.0009478558801197061, "time_sec": 32.57522892951965 }, { "epoch": 23, "train_loss": 1.5045368173980713, "train_acc": 0.57686, "test_loss": 2.0701497230529786, "test_acc": 0.4729, "lyapunov": null, "grad_norm": 1.0823066547637195, "grad_max_sv": 0.4348363593220711, "grad_min_sv": 2.0215574525472847e-08, "grad_condition": 38846769.86075296, "lr": 0.000943101789615607, "time_sec": 32.58562135696411 }, { "epoch": 24, "train_loss": 1.464451589126587, "train_acc": 0.58532, "test_loss": 2.2039865215301515, "test_acc": 0.4486, "lyapunov": null, "grad_norm": 1.0523927832685198, "grad_max_sv": 0.41661558151245115, "grad_min_sv": 1.950878351086871e-08, "grad_condition": 34416119.9412758, "lr": 0.0009381533400219313, "time_sec": 32.563148736953735 }, { "epoch": 25, "train_loss": 1.4205649266052247, "train_acc": 0.59388, "test_loss": 2.1708908073425293, "test_acc": 0.4631, "lyapunov": null, "grad_norm": 1.0237955167104829, "grad_max_sv": 0.41313874199986456, "grad_min_sv": 1.9160673876000846e-08, "grad_condition": 116069222.65926342, "lr": 0.0009330127018922189, "time_sec": 32.58251953125 }, { "epoch": 26, "train_loss": 1.3801667861938476, "train_acc": 0.60904, "test_loss": 2.141048712158203, "test_acc": 0.4804, "lyapunov": null, "grad_norm": 1.003894338084706, "grad_max_sv": 0.39152884259819987, "grad_min_sv": 1.85417132805496e-08, "grad_condition": 149070926.97039393, "lr": 0.000927682130080253, "time_sec": 32.58069562911987 }, { "epoch": 27, "train_loss": 1.3742198986053467, "train_acc": 0.6049, "test_loss": 2.1493278324127196, "test_acc": 0.4766, "lyapunov": null, "grad_norm": 1.0025464883815882, "grad_max_sv": 0.3876075059175491, "grad_min_sv": 1.830616184195222e-08, "grad_condition": 35882215.67392446, "lr": 0.0009221639627510072, "time_sec": 32.56836271286011 }, { "epoch": 28, "train_loss": 1.320306241645813, "train_acc": 0.6196, "test_loss": 2.1034063312530518, "test_acc": 0.4844, "lyapunov": null, "grad_norm": 0.9735499274270826, "grad_max_sv": 0.3877687506377697, "grad_min_sv": 1.8286890105835564e-08, "grad_condition": 335682383.9298244, "lr": 0.0009164606203550494, "time_sec": 32.57155418395996 }, { "epoch": 29, "train_loss": 1.2960155849075317, "train_acc": 0.6256, "test_loss": 2.1984372549057007, "test_acc": 0.4692, "lyapunov": null, "grad_norm": 0.9613960934578316, "grad_max_sv": 0.3829047717154026, "grad_min_sv": 1.7720739411974938e-08, "grad_condition": 36256976.72962162, "lr": 0.0009105746045668516, "time_sec": 32.55882430076599 }, { "epoch": 30, "train_loss": 1.276566519241333, "train_acc": 0.62918, "test_loss": 2.3138665813446044, "test_acc": 0.4615, "lyapunov": null, "grad_norm": 0.9496542327680724, "grad_max_sv": 0.37292894124984743, "grad_min_sv": 1.7765610841463662e-08, "grad_condition": 48990654.53726908, "lr": 0.0009045084971874733, "time_sec": 32.57599472999573 }, { "epoch": 31, "train_loss": 1.2222671955871582, "train_acc": 0.64256, "test_loss": 2.1691656875610352, "test_acc": 0.4809, "lyapunov": null, "grad_norm": 0.9328591067251968, "grad_max_sv": 0.3668631583452225, "grad_min_sv": 1.731717505781827e-08, "grad_condition": 30411660.235134684, "lr": 0.0008982649590120977, "time_sec": 32.56551241874695 }, { "epoch": 32, "train_loss": 1.2110996068191529, "train_acc": 0.64794, "test_loss": 2.214646379852295, "test_acc": 0.4829, "lyapunov": null, "grad_norm": 0.930727366359918, "grad_max_sv": 0.3651597030460835, "grad_min_sv": 1.725773807192965e-08, "grad_condition": 25901528.27644656, "lr": 0.0008918467286629196, "time_sec": 32.56990313529968 }, { "epoch": 33, "train_loss": 1.1722402347946168, "train_acc": 0.6566, "test_loss": 2.2246903633117676, "test_acc": 0.4846, "lyapunov": null, "grad_norm": 0.9124985410949377, "grad_max_sv": 0.35901916325092315, "grad_min_sv": 1.6734816802102536e-08, "grad_condition": 84184024.35994068, "lr": 0.0008852566213878943, "time_sec": 32.58838510513306 }, { "epoch": 34, "train_loss": 1.1472361179351807, "train_acc": 0.66254, "test_loss": 2.1493885478973387, "test_acc": 0.4941, "lyapunov": null, "grad_norm": 0.8981676912068559, "grad_max_sv": 0.34216810315847396, "grad_min_sv": 1.6077876746622975e-08, "grad_condition": 36468768.92296384, "lr": 0.000878497527825878, "time_sec": 32.57939434051514 }, { "epoch": 35, "train_loss": 1.1205655740356446, "train_acc": 0.66956, "test_loss": 2.163042925453186, "test_acc": 0.4954, "lyapunov": null, "grad_norm": 0.8860645128225066, "grad_max_sv": 0.3396616868674755, "grad_min_sv": 1.607423450074308e-08, "grad_condition": 144981538.90034992, "lr": 0.000871572412738697, "time_sec": 32.57995939254761 }, { "epoch": 36, "train_loss": 1.1019499723815918, "train_acc": 0.67338, "test_loss": 2.1101196655273435, "test_acc": 0.508, "lyapunov": null, "grad_norm": 0.8837215741761234, "grad_max_sv": 0.3453404136002064, "grad_min_sv": 1.6300073393815674e-08, "grad_condition": 39609134.3745661, "lr": 0.0008644843137107055, "time_sec": 32.610419511795044 }, { "epoch": 37, "train_loss": 1.0685892918777466, "train_acc": 0.68264, "test_loss": 2.166209588623047, "test_acc": 0.5007, "lyapunov": null, "grad_norm": 0.8688858809651051, "grad_max_sv": 0.3433241851627827, "grad_min_sv": 1.6007609650054573e-08, "grad_condition": 775786281.5340235, "lr": 0.0008572363398164014, "time_sec": 32.565879583358765 }, { "epoch": 38, "train_loss": 1.0574775017929077, "train_acc": 0.68396, "test_loss": 2.222346786689758, "test_acc": 0.5, "lyapunov": null, "grad_norm": 0.8639145605396845, "grad_max_sv": 0.3388586565852165, "grad_min_sv": 1.583358475998331e-08, "grad_condition": 34039562.91252621, "lr": 0.0008498316702566826, "time_sec": 32.57612729072571 }, { "epoch": 39, "train_loss": 1.0226109420394898, "train_acc": 0.69532, "test_loss": 2.190898861312866, "test_acc": 0.502, "lyapunov": null, "grad_norm": 0.8542002974927076, "grad_max_sv": 0.3443542592227459, "grad_min_sv": 1.5959563168244095e-08, "grad_condition": 59986387.77119949, "lr": 0.0008422735529643442, "time_sec": 32.57960486412048 }, { "epoch": 40, "train_loss": 1.0001259584808349, "train_acc": 0.70102, "test_loss": 2.25260383605957, "test_acc": 0.4998, "lyapunov": null, "grad_norm": 0.8465843258509351, "grad_max_sv": 0.33337946608662605, "grad_min_sv": 1.5467166557259216e-08, "grad_condition": 37113133.49315401, "lr": 0.0008345653031794289, "time_sec": 32.61366534233093 }, { "epoch": 41, "train_loss": 0.980431226234436, "train_acc": 0.70476, "test_loss": 2.1930856651306154, "test_acc": 0.5111, "lyapunov": null, "grad_norm": 0.8344894111462177, "grad_max_sv": 0.3344740740954876, "grad_min_sv": 1.5184292248560104e-08, "grad_condition": 42849773.682712145, "lr": 0.0008267103019950526, "time_sec": 32.604257106781006 }, { "epoch": 42, "train_loss": 0.9617984279251098, "train_acc": 0.71146, "test_loss": 2.2299947700500486, "test_acc": 0.506, "lyapunov": null, "grad_norm": 0.8242242603947335, "grad_max_sv": 0.3212660253047943, "grad_min_sv": 1.4864016899610033e-08, "grad_condition": 73401477.5678053, "lr": 0.0008187119948743447, "time_sec": 32.6293363571167 }, { "epoch": 43, "train_loss": 0.9384816081619263, "train_acc": 0.71576, "test_loss": 2.1490371479034422, "test_acc": 0.5197, "lyapunov": null, "grad_norm": 0.8237477937232076, "grad_max_sv": 0.3244126185774803, "grad_min_sv": 1.494453279390906e-08, "grad_condition": 58033299.26618519, "lr": 0.000810573890139155, "time_sec": 32.59305548667908 }, { "epoch": 44, "train_loss": 0.9152639833831787, "train_acc": 0.72254, "test_loss": 2.227645333480835, "test_acc": 0.515, "lyapunov": null, "grad_norm": 0.8114307246954692, "grad_max_sv": 0.32891099974513055, "grad_min_sv": 1.470089587857909e-08, "grad_condition": 187882457.4560508, "lr": 0.0008022995574311873, "time_sec": 32.56365776062012 }, { "epoch": 45, "train_loss": 0.8937730826950073, "train_acc": 0.72926, "test_loss": 2.257075512313843, "test_acc": 0.5171, "lyapunov": null, "grad_norm": 0.7991066773444042, "grad_max_sv": 0.310314255207777, "grad_min_sv": 1.442440034638004e-08, "grad_condition": 67545918.8595486, "lr": 0.0007938926261462363, "time_sec": 32.56998062133789 }, { "epoch": 46, "train_loss": 0.8821200103569031, "train_acc": 0.73168, "test_loss": 2.312848774147034, "test_acc": 0.5052, "lyapunov": null, "grad_norm": 0.7987404367629951, "grad_max_sv": 0.31381460800766947, "grad_min_sv": 1.427665476706752e-08, "grad_condition": 147171178.65022224, "lr": 0.0007853567838422158, "time_sec": 32.57842302322388 }, { "epoch": 47, "train_loss": 0.8545298266983032, "train_acc": 0.73686, "test_loss": 2.2923807540893555, "test_acc": 0.5057, "lyapunov": null, "grad_norm": 0.7859231581178334, "grad_max_sv": 0.31694323718547823, "grad_min_sv": 1.4505229091466009e-08, "grad_condition": 93313806.69758794, "lr": 0.0007766957746216719, "time_sec": 32.56472444534302 }, { "epoch": 48, "train_loss": 0.8375117244720459, "train_acc": 0.74296, "test_loss": 2.350985548019409, "test_acc": 0.5065, "lyapunov": null, "grad_norm": 0.7733144016514287, "grad_max_sv": 0.31536148227751254, "grad_min_sv": 1.3926250694989983e-08, "grad_condition": 138817686.6846688, "lr": 0.0007679133974894982, "time_sec": 32.562721490859985 }, { "epoch": 49, "train_loss": 0.8223947568511963, "train_acc": 0.74656, "test_loss": 2.268610196495056, "test_acc": 0.509, "lyapunov": null, "grad_norm": 0.7708191932209156, "grad_max_sv": 0.3082855362445116, "grad_min_sv": 1.424878183428624e-08, "grad_condition": 48064293.176824205, "lr": 0.000759013504686565, "time_sec": 32.59068489074707 }, { "epoch": 50, "train_loss": 0.8102355616569519, "train_acc": 0.75154, "test_loss": 2.303807855987549, "test_acc": 0.5172, "lyapunov": null, "grad_norm": 0.7678857639968419, "grad_max_sv": 0.30606309957802297, "grad_min_sv": 1.401376939977328e-08, "grad_condition": 66554378.026006415, "lr": 0.0007499999999999998, "time_sec": 32.61594772338867 }, { "epoch": 51, "train_loss": 0.7894559608268737, "train_acc": 0.75788, "test_loss": 2.3806381210327148, "test_acc": 0.5067, "lyapunov": null, "grad_norm": 0.7578995070890107, "grad_max_sv": 0.2958958923816681, "grad_min_sv": 1.3479759735507413e-08, "grad_condition": 59071539.288179755, "lr": 0.0007408768370508575, "time_sec": 32.58355736732483 }, { "epoch": 52, "train_loss": 0.7807610025405883, "train_acc": 0.7587, "test_loss": 2.335085013961792, "test_acc": 0.5175, "lyapunov": null, "grad_norm": 0.7536291786486181, "grad_max_sv": 0.3058082439005375, "grad_min_sv": 1.4062500508851828e-08, "grad_condition": 89488373.11429313, "lr": 0.0007316480175599307, "time_sec": 32.58504581451416 }, { "epoch": 53, "train_loss": 0.7639712882995605, "train_acc": 0.76632, "test_loss": 2.2413758136749267, "test_acc": 0.529, "lyapunov": null, "grad_norm": 0.7437671807956605, "grad_max_sv": 0.2986128095537424, "grad_min_sv": 1.3716437835195604e-08, "grad_condition": 153765004.26652625, "lr": 0.0007223175895924635, "time_sec": 32.599562883377075 }, { "epoch": 54, "train_loss": 0.7342572978401184, "train_acc": 0.77172, "test_loss": 2.3813604881286623, "test_acc": 0.5211, "lyapunov": null, "grad_norm": 0.7415334115465683, "grad_max_sv": 0.2952877823263407, "grad_min_sv": 1.3237078199702934e-08, "grad_condition": 158912190.85988137, "lr": 0.0007128896457825361, "time_sec": 32.58093762397766 }, { "epoch": 55, "train_loss": 0.7243311285591125, "train_acc": 0.77394, "test_loss": 2.5364841087341308, "test_acc": 0.4919, "lyapunov": null, "grad_norm": 0.7336077653545635, "grad_max_sv": 0.30250501483678816, "grad_min_sv": 1.3610404020827915e-08, "grad_condition": 80425531.55629282, "lr": 0.0007033683215378998, "time_sec": 32.64418268203735 }, { "epoch": 56, "train_loss": 0.7082911996078491, "train_acc": 0.77956, "test_loss": 2.494243837738037, "test_acc": 0.5119, "lyapunov": null, "grad_norm": 0.7290174142670145, "grad_max_sv": 0.2945553746074438, "grad_min_sv": 1.3041360513894872e-08, "grad_condition": 131633091.2577754, "lr": 0.0006937577932260512, "time_sec": 32.61989617347717 }, { "epoch": 57, "train_loss": 0.6861382236289978, "train_acc": 0.7852, "test_loss": 2.4704931076049803, "test_acc": 0.518, "lyapunov": null, "grad_norm": 0.7189100733167055, "grad_max_sv": 0.2928345203399658, "grad_min_sv": 1.3202054537260477e-08, "grad_condition": 122301802.04377504, "lr": 0.0006840622763423388, "time_sec": 32.601600885391235 }, { "epoch": 58, "train_loss": 0.6700656919956207, "train_acc": 0.79076, "test_loss": 2.505882039642334, "test_acc": 0.5131, "lyapunov": null, "grad_norm": 0.7086978020515203, "grad_max_sv": 0.28342925757169724, "grad_min_sv": 1.2833174680912385e-08, "grad_condition": 67698817.82937825, "lr": 0.0006742860236609073, "time_sec": 32.58192586898804 }, { "epoch": 59, "train_loss": 0.6577284108161926, "train_acc": 0.79492, "test_loss": 2.491006435775757, "test_acc": 0.5155, "lyapunov": null, "grad_norm": 0.7069652566379913, "grad_max_sv": 0.2849778015166521, "grad_min_sv": 1.2662411319475097e-08, "grad_condition": 54369902.95066987, "lr": 0.0006644333233692913, "time_sec": 32.601956605911255 }, { "epoch": 60, "train_loss": 0.6429468762397766, "train_acc": 0.7985, "test_loss": 2.4342385992050173, "test_acc": 0.5281, "lyapunov": null, "grad_norm": 0.6950269523418225, "grad_max_sv": 0.2759479142725468, "grad_min_sv": 1.2526198570604087e-08, "grad_condition": 1003668275.7453331, "lr": 0.0006545084971874734, "time_sec": 32.593979835510254 }, { "epoch": 61, "train_loss": 0.6316694467926025, "train_acc": 0.80204, "test_loss": 2.572236448669434, "test_acc": 0.5228, "lyapunov": null, "grad_norm": 0.6953930381951806, "grad_max_sv": 0.2823780722916126, "grad_min_sv": 1.2607634538338957e-08, "grad_condition": 910241325.2806966, "lr": 0.0006445158984722354, "time_sec": 32.63531136512756 }, { "epoch": 62, "train_loss": 0.6084016784477234, "train_acc": 0.80756, "test_loss": 2.528528450965881, "test_acc": 0.5249, "lyapunov": null, "grad_norm": 0.6902039343361056, "grad_max_sv": 0.2754691679030657, "grad_min_sv": 1.2385301192095743e-08, "grad_condition": 124171966.43343556, "lr": 0.0006344599103076324, "time_sec": 32.646347761154175 }, { "epoch": 63, "train_loss": 0.6006980142784119, "train_acc": 0.81018, "test_loss": 2.438706118583679, "test_acc": 0.5266, "lyapunov": null, "grad_norm": 0.6822637884805373, "grad_max_sv": 0.276136140525341, "grad_min_sv": 1.2456568440621928e-08, "grad_condition": 41258405.402897015, "lr": 0.0006243449435824269, "time_sec": 32.60796880722046 }, { "epoch": 64, "train_loss": 0.585920947380066, "train_acc": 0.81566, "test_loss": 2.505697784423828, "test_acc": 0.5259, "lyapunov": null, "grad_norm": 0.6743129224923755, "grad_max_sv": 0.26691033616662024, "grad_min_sv": 1.2091218234630552e-08, "grad_condition": 57195642.756296314, "lr": 0.0006141754350553275, "time_sec": 32.621875286102295 }, { "epoch": 65, "train_loss": 0.5716569157028198, "train_acc": 0.81832, "test_loss": 2.488600128173828, "test_acc": 0.5221, "lyapunov": null, "grad_norm": 0.6747582168048405, "grad_max_sv": 0.2778852738440037, "grad_min_sv": 1.2316326589503767e-08, "grad_condition": 66617009.51688242, "lr": 0.0006039558454088793, "time_sec": 32.58805871009827 }, { "epoch": 66, "train_loss": 0.5558187670326233, "train_acc": 0.82442, "test_loss": 2.455172736740112, "test_acc": 0.5327, "lyapunov": null, "grad_norm": 0.6650651562580321, "grad_max_sv": 0.27054035626351836, "grad_min_sv": 1.1980440989180913e-08, "grad_condition": 263553333.63889045, "lr": 0.000593690657292862, "time_sec": 32.61953616142273 }, { "epoch": 67, "train_loss": 0.5372648673820496, "train_acc": 0.82802, "test_loss": 2.5111166515350343, "test_acc": 0.5259, "lyapunov": null, "grad_norm": 0.6598459109898526, "grad_max_sv": 0.26995205879211426, "grad_min_sv": 1.1711705713568498e-08, "grad_condition": 40680262.666348636, "lr": 0.0005833843733580507, "time_sec": 32.596007108688354 }, { "epoch": 68, "train_loss": 0.529928300704956, "train_acc": 0.83184, "test_loss": 2.505376844024658, "test_acc": 0.5324, "lyapunov": null, "grad_norm": 0.6554247710983278, "grad_max_sv": 0.2640453014522791, "grad_min_sv": 1.16465385096437e-08, "grad_condition": 196611022.55457097, "lr": 0.0005730415142812054, "time_sec": 32.589977502822876 }, { "epoch": 69, "train_loss": 0.5270337955570221, "train_acc": 0.83232, "test_loss": 2.6256065521240233, "test_acc": 0.5197, "lyapunov": null, "grad_norm": 0.6567252289857295, "grad_max_sv": 0.2711860008537769, "grad_min_sv": 1.1960956241034368e-08, "grad_condition": 561898784.4199932, "lr": 0.0005626666167821517, "time_sec": 32.5863139629364 }, { "epoch": 70, "train_loss": 0.5109112097549439, "train_acc": 0.8354, "test_loss": 2.5708269050598145, "test_acc": 0.5302, "lyapunov": null, "grad_norm": 0.646381173102848, "grad_max_sv": 0.27013656310737133, "grad_min_sv": 1.1766451666391648e-08, "grad_condition": 259686356.85246676, "lr": 0.0005522642316338265, "time_sec": 32.601078033447266 }, { "epoch": 71, "train_loss": 0.49452698835372927, "train_acc": 0.84226, "test_loss": 2.5480498626708985, "test_acc": 0.5341, "lyapunov": null, "grad_norm": 0.6360062848670928, "grad_max_sv": 0.26699192114174364, "grad_min_sv": 1.1295523278341807e-08, "grad_condition": 5391854944.622183, "lr": 0.0005418389216661573, "time_sec": 32.60187101364136 }, { "epoch": 72, "train_loss": 0.48291658142089844, "train_acc": 0.84586, "test_loss": 2.659250145339966, "test_acc": 0.5273, "lyapunov": null, "grad_norm": 0.6354901528331942, "grad_max_sv": 0.26031049638986586, "grad_min_sv": 1.1230092526043345e-08, "grad_condition": 88239876.70399968, "lr": 0.0005313952597646563, "time_sec": 32.61269569396973 }, { "epoch": 73, "train_loss": 0.4778318354034424, "train_acc": 0.8473, "test_loss": 2.5874798002243042, "test_acc": 0.5314, "lyapunov": null, "grad_norm": 0.6300098949086598, "grad_max_sv": 0.26232460178434847, "grad_min_sv": 1.134239846749957e-08, "grad_condition": 105944680.31289935, "lr": 0.0005209378268645994, "time_sec": 32.613691091537476 }, { "epoch": 74, "train_loss": 0.46288997037887575, "train_acc": 0.85288, "test_loss": 2.5993505474090575, "test_acc": 0.5337, "lyapunov": null, "grad_norm": 0.6215157272690962, "grad_max_sv": 0.26828358359634874, "grad_min_sv": 1.1235708100021391e-08, "grad_condition": 41868662.72964181, "lr": 0.0005104712099416781, "time_sec": 32.61982536315918 }, { "epoch": 75, "train_loss": 0.45871317274093626, "train_acc": 0.85266, "test_loss": 2.6259676776885987, "test_acc": 0.5345, "lyapunov": null, "grad_norm": 0.6170925610226076, "grad_max_sv": 0.2573466833680868, "grad_min_sv": 1.104757565784445e-08, "grad_condition": 212140699.82071534, "lr": 0.0004999999999999996, "time_sec": 32.598039627075195 }, { "epoch": 76, "train_loss": 0.45109452469825745, "train_acc": 0.85454, "test_loss": 2.665439921569824, "test_acc": 0.5303, "lyapunov": null, "grad_norm": 0.6161744946755234, "grad_max_sv": 0.25873752422630786, "grad_min_sv": 1.1002691283393782e-08, "grad_condition": 1052469961.0162939, "lr": 0.0004895287900583212, "time_sec": 32.58305859565735 }, { "epoch": 77, "train_loss": 0.43257994356155394, "train_acc": 0.86046, "test_loss": 2.702251711654663, "test_acc": 0.526, "lyapunov": null, "grad_norm": 0.607726688787837, "grad_max_sv": 0.26136815659701823, "grad_min_sv": 1.0734200759157653e-08, "grad_condition": 189329156.27802238, "lr": 0.0004790621731353997, "time_sec": 32.59784960746765 }, { "epoch": 78, "train_loss": 0.41896025703430173, "train_acc": 0.86472, "test_loss": 2.671762952804565, "test_acc": 0.5336, "lyapunov": null, "grad_norm": 0.5957655893318665, "grad_max_sv": 0.2534705221652985, "grad_min_sv": 1.0711852985699488e-08, "grad_condition": 191261118.43217826, "lr": 0.000468604740235343, "time_sec": 32.62303113937378 }, { "epoch": 79, "train_loss": 0.40766072305679324, "train_acc": 0.86786, "test_loss": 2.584160025596619, "test_acc": 0.5417, "lyapunov": null, "grad_norm": 0.5933439762516267, "grad_max_sv": 0.2529820345342159, "grad_min_sv": 1.1027942445340776e-08, "grad_condition": 38680465.32555069, "lr": 0.00045816107833384175, "time_sec": 32.64057159423828 }, { "epoch": 80, "train_loss": 0.395585339012146, "train_acc": 0.8719, "test_loss": 2.6836016262054443, "test_acc": 0.5338, "lyapunov": null, "grad_norm": 0.5915283577904045, "grad_max_sv": 0.2511633686721325, "grad_min_sv": 1.074133903124913e-08, "grad_condition": 579600714.0219278, "lr": 0.0004477357683661729, "time_sec": 32.63526272773743 }, { "epoch": 81, "train_loss": 0.39450348417282105, "train_acc": 0.87178, "test_loss": 2.5824236192703247, "test_acc": 0.5448, "lyapunov": null, "grad_norm": 0.5885071131780099, "grad_max_sv": 0.25625271871685984, "grad_min_sv": 1.0501880514518502e-08, "grad_condition": 124784334.66343915, "lr": 0.00043733338321784746, "time_sec": 32.604066610336304 }, { "epoch": 82, "train_loss": 0.3872408880805969, "train_acc": 0.87422, "test_loss": 2.6602687486648557, "test_acc": 0.5352, "lyapunov": null, "grad_norm": 0.5833408041873426, "grad_max_sv": 0.2544650699943304, "grad_min_sv": 1.0623962720494873e-08, "grad_condition": 134511278.94006854, "lr": 0.0004269584857187939, "time_sec": 32.63341236114502 }, { "epoch": 83, "train_loss": 0.3692175518798828, "train_acc": 0.8823, "test_loss": 2.6812981620788574, "test_acc": 0.5354, "lyapunov": null, "grad_norm": 0.571242006609448, "grad_max_sv": 0.2509057328104973, "grad_min_sv": 1.0469137029164855e-08, "grad_condition": 133735555.98911181, "lr": 0.0004166156266419484, "time_sec": 32.600364685058594 }, { "epoch": 84, "train_loss": 0.36960686668396, "train_acc": 0.8806, "test_loss": 2.6419603324890137, "test_acc": 0.5453, "lyapunov": null, "grad_norm": 0.5733982210439359, "grad_max_sv": 0.25141631327569486, "grad_min_sv": 1.0406415923511908e-08, "grad_condition": 126933629.16775417, "lr": 0.0004063093427071373, "time_sec": 32.60528612136841 }, { "epoch": 85, "train_loss": 0.3596297464942932, "train_acc": 0.88366, "test_loss": 2.716620068740845, "test_acc": 0.5395, "lyapunov": null, "grad_norm": 0.5676461114412606, "grad_max_sv": 0.24900777079164982, "grad_min_sv": 1.0182381811286654e-08, "grad_condition": 508099869.8504903, "lr": 0.0003960441545911199, "time_sec": 32.61734056472778 }, { "epoch": 86, "train_loss": 0.3471255212688446, "train_acc": 0.88682, "test_loss": 2.6910045627593995, "test_acc": 0.5395, "lyapunov": null, "grad_norm": 0.5548265984779118, "grad_max_sv": 0.23751378245651722, "grad_min_sv": 9.806933828904186e-09, "grad_condition": 127564160.08711353, "lr": 0.0003858245649446718, "time_sec": 32.59777784347534 }, { "epoch": 87, "train_loss": 0.3406936288833618, "train_acc": 0.8891, "test_loss": 2.744849885940552, "test_acc": 0.5429, "lyapunov": null, "grad_norm": 0.5555218429462011, "grad_max_sv": 0.2389649160206318, "grad_min_sv": 9.80964975061914e-09, "grad_condition": 889623886.9749553, "lr": 0.00037565505641757235, "time_sec": 32.603169679641724 }, { "epoch": 88, "train_loss": 0.332358439912796, "train_acc": 0.89152, "test_loss": 2.7001221378326417, "test_acc": 0.5481, "lyapunov": null, "grad_norm": 0.550628932039783, "grad_max_sv": 0.24251497723162174, "grad_min_sv": 9.773675100493983e-09, "grad_condition": 85698012.51102474, "lr": 0.00036554008969236695, "time_sec": 32.60269355773926 }, { "epoch": 89, "train_loss": 0.31770461375236514, "train_acc": 0.89674, "test_loss": 2.826695262527466, "test_acc": 0.5359, "lyapunov": null, "grad_norm": 0.5452633910908743, "grad_max_sv": 0.2457874234765768, "grad_min_sv": 1.0011228396625271e-08, "grad_condition": 115516500.1980664, "lr": 0.0003554841015277638, "time_sec": 32.615172147750854 }, { "epoch": 90, "train_loss": 0.3198126357555389, "train_acc": 0.89686, "test_loss": 2.761284243011475, "test_acc": 0.5383, "lyapunov": null, "grad_norm": 0.5420260505535877, "grad_max_sv": 0.2379120856523514, "grad_min_sv": 9.806707615064857e-09, "grad_condition": 292496720.3714178, "lr": 0.000345491502812526, "time_sec": 32.60730767250061 }, { "epoch": 91, "train_loss": 0.31583098639965057, "train_acc": 0.89624, "test_loss": 2.798471709060669, "test_acc": 0.5389, "lyapunov": null, "grad_norm": 0.541688273995152, "grad_max_sv": 0.2411293275654316, "grad_min_sv": 9.842002349441745e-09, "grad_condition": 859517900.635659, "lr": 0.0003355666766307081, "time_sec": 32.59173631668091 }, { "epoch": 92, "train_loss": 0.30620651626586914, "train_acc": 0.89982, "test_loss": 2.8147284172058105, "test_acc": 0.5372, "lyapunov": null, "grad_norm": 0.534845986324325, "grad_max_sv": 0.2446113031357527, "grad_min_sv": 9.80392773058253e-09, "grad_condition": 318006434.8637026, "lr": 0.00032571397633909225, "time_sec": 32.625818729400635 }, { "epoch": 93, "train_loss": 0.2942564325428009, "train_acc": 0.9027, "test_loss": 2.7974524646759034, "test_acc": 0.5458, "lyapunov": null, "grad_norm": 0.5258623807030809, "grad_max_sv": 0.23323353454470636, "grad_min_sv": 9.338492477830445e-09, "grad_condition": 179043441.62085792, "lr": 0.00031593772365766094, "time_sec": 32.64636468887329 }, { "epoch": 94, "train_loss": 0.29325305396080015, "train_acc": 0.90696, "test_loss": 2.7924257678985596, "test_acc": 0.5399, "lyapunov": null, "grad_norm": 0.5223436049599501, "grad_max_sv": 0.23972665779292585, "grad_min_sv": 9.572742014005153e-09, "grad_condition": 829147220.8115915, "lr": 0.0003062422067739483, "time_sec": 32.63534426689148 }, { "epoch": 95, "train_loss": 0.2819689624214172, "train_acc": 0.90976, "test_loss": 2.925028160858154, "test_acc": 0.5349, "lyapunov": null, "grad_norm": 0.5142202374019095, "grad_max_sv": 0.2272823579609394, "grad_min_sv": 9.26979293529133e-09, "grad_condition": 746493228.5809206, "lr": 0.00029663167846209965, "time_sec": 32.632474184036255 }, { "epoch": 96, "train_loss": 0.2815214267730713, "train_acc": 0.90818, "test_loss": 2.834438822937012, "test_acc": 0.5361, "lyapunov": null, "grad_norm": 0.5120345521537165, "grad_max_sv": 0.23016531057655812, "grad_min_sv": 9.260385527062182e-09, "grad_condition": 233123428.8839547, "lr": 0.00028711035421746345, "time_sec": 32.61351776123047 }, { "epoch": 97, "train_loss": 0.2686532742404938, "train_acc": 0.91288, "test_loss": 2.7868608379364015, "test_acc": 0.5454, "lyapunov": null, "grad_norm": 0.50888083523268, "grad_max_sv": 0.23386715427041055, "grad_min_sv": 9.24353042355136e-09, "grad_condition": 480824699.4459009, "lr": 0.00027768241040753615, "time_sec": 32.597689628601074 }, { "epoch": 98, "train_loss": 0.26857261137008664, "train_acc": 0.9114, "test_loss": 2.8518635543823243, "test_acc": 0.5437, "lyapunov": null, "grad_norm": 0.5090536597227022, "grad_max_sv": 0.22117703258991242, "grad_min_sv": 8.954814682826662e-09, "grad_condition": 523046386.34619534, "lr": 0.00026835198244006903, "time_sec": 32.608073472976685 }, { "epoch": 99, "train_loss": 0.25366373962402344, "train_acc": 0.91882, "test_loss": 2.8721565658569337, "test_acc": 0.543, "lyapunov": null, "grad_norm": 0.49238261306821557, "grad_max_sv": 0.2156506847590208, "grad_min_sv": 8.781873435826509e-09, "grad_condition": 904102693.0135263, "lr": 0.0002591231629491421, "time_sec": 32.61784863471985 }, { "epoch": 100, "train_loss": 0.24887621872901916, "train_acc": 0.91974, "test_loss": 2.921920951461792, "test_acc": 0.5361, "lyapunov": null, "grad_norm": 0.4888254012066189, "grad_max_sv": 0.2262551225721836, "grad_min_sv": 9.07711106217608e-09, "grad_condition": 2378158119.157684, "lr": 0.0002499999999999997, "time_sec": 32.63064646720886 }, { "epoch": 101, "train_loss": 0.2486992248916626, "train_acc": 0.92078, "test_loss": 2.84906298789978, "test_acc": 0.546, "lyapunov": null, "grad_norm": 0.49044990509199843, "grad_max_sv": 0.2249086916446686, "grad_min_sv": 8.942711630455583e-09, "grad_condition": 368518315.458243, "lr": 0.00024098649531343477, "time_sec": 32.61569309234619 }, { "epoch": 102, "train_loss": 0.24084433520317078, "train_acc": 0.92134, "test_loss": 2.8644924999237062, "test_acc": 0.5466, "lyapunov": null, "grad_norm": 0.4835634789382412, "grad_max_sv": 0.22181024961173534, "grad_min_sv": 8.71543736290746e-09, "grad_condition": 729146084.7030591, "lr": 0.0002320866025105016, "time_sec": 32.61780500411987 }, { "epoch": 103, "train_loss": 0.23572091526031494, "train_acc": 0.9245, "test_loss": 2.8849633934020997, "test_acc": 0.5462, "lyapunov": null, "grad_norm": 0.47616360717681877, "grad_max_sv": 0.21196404211223124, "grad_min_sv": 8.353945581216632e-09, "grad_condition": 474656759.6437806, "lr": 0.0002233042253783278, "time_sec": 32.613890647888184 }, { "epoch": 104, "train_loss": 0.2249231512260437, "train_acc": 0.92648, "test_loss": 2.9231421543121336, "test_acc": 0.5417, "lyapunov": null, "grad_norm": 0.47192872655679174, "grad_max_sv": 0.214255590736866, "grad_min_sv": 8.505988313570536e-09, "grad_condition": 289197672.1924402, "lr": 0.000214643216157784, "time_sec": 32.601218938827515 }, { "epoch": 105, "train_loss": 0.22248219745159148, "train_acc": 0.9281, "test_loss": 2.9562902782440186, "test_acc": 0.5427, "lyapunov": null, "grad_norm": 0.4698308403081668, "grad_max_sv": 0.22572967931628227, "grad_min_sv": 8.526192928743314e-09, "grad_condition": 1450261253.9932175, "lr": 0.00020610737385376332, "time_sec": 32.612290382385254 }, { "epoch": 106, "train_loss": 0.21623054056167604, "train_acc": 0.92962, "test_loss": 2.908762315750122, "test_acc": 0.5446, "lyapunov": null, "grad_norm": 0.46340711985172833, "grad_max_sv": 0.21638907827436923, "grad_min_sv": 8.416883249314638e-09, "grad_condition": 255468039.70825052, "lr": 0.00019770044256881242, "time_sec": 32.612945318222046 }, { "epoch": 107, "train_loss": 0.21244655453205108, "train_acc": 0.93246, "test_loss": 2.974463511657715, "test_acc": 0.5384, "lyapunov": null, "grad_norm": 0.4594548274355528, "grad_max_sv": 0.22012278363108634, "grad_min_sv": 8.49774636952922e-09, "grad_condition": 2473361556.8977194, "lr": 0.0001894261098608447, "time_sec": 32.62226438522339 }, { "epoch": 108, "train_loss": 0.2094324759197235, "train_acc": 0.93186, "test_loss": 2.8919307563781738, "test_acc": 0.5468, "lyapunov": null, "grad_norm": 0.4576154748028718, "grad_max_sv": 0.2116704247891903, "grad_min_sv": 8.391172841922153e-09, "grad_condition": 466352424.25916034, "lr": 0.000181288005125655, "time_sec": 32.6186683177948 }, { "epoch": 109, "train_loss": 0.20401785006046294, "train_acc": 0.93418, "test_loss": 2.957660815048218, "test_acc": 0.539, "lyapunov": null, "grad_norm": 0.4546298422322962, "grad_max_sv": 0.21849206127226353, "grad_min_sv": 8.682296616380203e-09, "grad_condition": 191940882.5588118, "lr": 0.0001732896980049473, "time_sec": 32.628432273864746 }, { "epoch": 110, "train_loss": 0.20467783069610596, "train_acc": 0.9347, "test_loss": 2.958277463912964, "test_acc": 0.5437, "lyapunov": null, "grad_norm": 0.4527691780730168, "grad_max_sv": 0.20565569326281546, "grad_min_sv": 8.186116849185146e-09, "grad_condition": 362737702.71097183, "lr": 0.00016543469682057076, "time_sec": 32.61425018310547 }, { "epoch": 111, "train_loss": 0.1963657117843628, "train_acc": 0.93738, "test_loss": 2.912566703796387, "test_acc": 0.5453, "lyapunov": null, "grad_norm": 0.4442740357567778, "grad_max_sv": 0.20528529062867165, "grad_min_sv": 7.897949131502324e-09, "grad_condition": 332879126.46642524, "lr": 0.00015772644703565552, "time_sec": 32.640437841415405 }, { "epoch": 112, "train_loss": 0.19529674465417862, "train_acc": 0.93706, "test_loss": 2.9921934005737305, "test_acc": 0.5439, "lyapunov": null, "grad_norm": 0.4472859282028686, "grad_max_sv": 0.21485005132853985, "grad_min_sv": 8.123189853593854e-09, "grad_condition": 1264491045.958951, "lr": 0.00015016832974331713, "time_sec": 32.62719178199768 }, { "epoch": 113, "train_loss": 0.19033806517124177, "train_acc": 0.93864, "test_loss": 2.982124820327759, "test_acc": 0.5437, "lyapunov": null, "grad_norm": 0.44136667096649934, "grad_max_sv": 0.21058676335960627, "grad_min_sv": 8.165891918036905e-09, "grad_condition": 312331837.29792935, "lr": 0.00014276366018359834, "time_sec": 32.62637948989868 }, { "epoch": 114, "train_loss": 0.1861744700717926, "train_acc": 0.9415, "test_loss": 2.9888067501068116, "test_acc": 0.5439, "lyapunov": null, "grad_norm": 0.4352864374741274, "grad_max_sv": 0.20403808429837228, "grad_min_sv": 7.826812852777115e-09, "grad_condition": 157749511.7241363, "lr": 0.00013551568628929425, "time_sec": 32.61394190788269 }, { "epoch": 115, "train_loss": 0.17919604228019714, "train_acc": 0.94228, "test_loss": 2.9267702087402343, "test_acc": 0.5533, "lyapunov": null, "grad_norm": 0.4303078691865104, "grad_max_sv": 0.21317217014729978, "grad_min_sv": 7.932376714335499e-09, "grad_condition": 130563128.16561177, "lr": 0.00012842758726130276, "time_sec": 32.59867215156555 }, { "epoch": 116, "train_loss": 0.1819922329044342, "train_acc": 0.9421, "test_loss": 2.9711815841674807, "test_acc": 0.5465, "lyapunov": null, "grad_norm": 0.43180962461173705, "grad_max_sv": 0.22204699292778968, "grad_min_sv": 8.152687410540802e-09, "grad_condition": 465179275.152493, "lr": 0.0001215024721741218, "time_sec": 32.63067364692688 }, { "epoch": 117, "train_loss": 0.1775187094783783, "train_acc": 0.94306, "test_loss": 2.9692884788513183, "test_acc": 0.5485, "lyapunov": null, "grad_norm": 0.42535422696695824, "grad_max_sv": 0.20696271434426308, "grad_min_sv": 7.841850190731802e-09, "grad_condition": 340204799.15066475, "lr": 0.00011474337861210538, "time_sec": 32.682225465774536 }, { "epoch": 118, "train_loss": 0.1782768397474289, "train_acc": 0.94228, "test_loss": 2.9190274017333984, "test_acc": 0.5529, "lyapunov": null, "grad_norm": 0.4288690474100953, "grad_max_sv": 0.20459303073585033, "grad_min_sv": 7.852907129212925e-09, "grad_condition": 413565999.92345744, "lr": 0.00010815327133708009, "time_sec": 32.6104941368103 }, { "epoch": 119, "train_loss": 0.17245361244678498, "train_acc": 0.94452, "test_loss": 2.9115855850219727, "test_acc": 0.5518, "lyapunov": null, "grad_norm": 0.42115534183071457, "grad_max_sv": 0.20364198610186576, "grad_min_sv": 7.842290997188895e-09, "grad_condition": 4300198879.021836, "lr": 0.00010173504098790182, "time_sec": 32.599159479141235 }, { "epoch": 120, "train_loss": 0.16841998175621034, "train_acc": 0.9465, "test_loss": 2.9750044021606445, "test_acc": 0.5509, "lyapunov": null, "grad_norm": 0.4139970919760924, "grad_max_sv": 0.21118448078632354, "grad_min_sv": 7.870022611139622e-09, "grad_condition": 588234398.5889165, "lr": 9.549150281252629e-05, "time_sec": 32.60773468017578 }, { "epoch": 121, "train_loss": 0.1674146131658554, "train_acc": 0.94722, "test_loss": 3.043567562866211, "test_acc": 0.5401, "lyapunov": null, "grad_norm": 0.4140688259905283, "grad_max_sv": 0.19524961337447166, "grad_min_sv": 7.740067117572789e-09, "grad_condition": 294042234.42343616, "lr": 8.942539543314794e-05, "time_sec": 32.605161905288696 }, { "epoch": 122, "train_loss": 0.16243593076705934, "train_acc": 0.94846, "test_loss": 2.929161159515381, "test_acc": 0.5544, "lyapunov": null, "grad_norm": 0.4069435316400916, "grad_max_sv": 0.1928358545526862, "grad_min_sv": 7.721300553786966e-09, "grad_condition": 1492464032.2227066, "lr": 8.353937964495024e-05, "time_sec": 32.641791105270386 }, { "epoch": 123, "train_loss": 0.1584806259393692, "train_acc": 0.94938, "test_loss": 3.1013183868408203, "test_acc": 0.5441, "lyapunov": null, "grad_norm": 0.4074794428211969, "grad_max_sv": 0.19953589588403703, "grad_min_sv": 7.50950879795792e-09, "grad_condition": 963926565.1466379, "lr": 7.783603724899243e-05, "time_sec": 32.63674283027649 }, { "epoch": 124, "train_loss": 0.15840048369407653, "train_acc": 0.9494, "test_loss": 3.02653837890625, "test_acc": 0.5519, "lyapunov": null, "grad_norm": 0.4076422491058348, "grad_max_sv": 0.2066960282623768, "grad_min_sv": 7.477964763082447e-09, "grad_condition": 442993334.53740203, "lr": 7.231786991974666e-05, "time_sec": 32.61531352996826 }, { "epoch": 125, "train_loss": 0.15796427134990693, "train_acc": 0.9492, "test_loss": 3.0291555103302, "test_acc": 0.547, "lyapunov": null, "grad_norm": 0.4074327913561712, "grad_max_sv": 0.20506599061191083, "grad_min_sv": 7.742264148888345e-09, "grad_condition": 174320401.78922492, "lr": 6.698729810778072e-05, "time_sec": 32.616377115249634 }, { "epoch": 126, "train_loss": 0.15587055792808532, "train_acc": 0.94994, "test_loss": 3.0593951934814454, "test_acc": 0.5475, "lyapunov": null, "grad_norm": 0.40499205379602254, "grad_max_sv": 0.20328918769955634, "grad_min_sv": 7.676706426616719e-09, "grad_condition": 1609865519.3051925, "lr": 6.184665997806817e-05, "time_sec": 32.61218738555908 }, { "epoch": 127, "train_loss": 0.1515829546546936, "train_acc": 0.95164, "test_loss": 2.997521667098999, "test_acc": 0.5527, "lyapunov": null, "grad_norm": 0.3980720784578974, "grad_max_sv": 0.20609603635966778, "grad_min_sv": 7.607568789811877e-09, "grad_condition": 467148050.5049923, "lr": 5.6898210384392595e-05, "time_sec": 32.59871435165405 }, { "epoch": 128, "train_loss": 0.15070208614826203, "train_acc": 0.95202, "test_loss": 2.989130591583252, "test_acc": 0.5478, "lyapunov": null, "grad_norm": 0.4001034661246295, "grad_max_sv": 0.1990298792719841, "grad_min_sv": 7.700730269807106e-09, "grad_condition": 1087373342.1502237, "lr": 5.214411988029363e-05, "time_sec": 32.64661478996277 }, { "epoch": 129, "train_loss": 0.1532275314569473, "train_acc": 0.95156, "test_loss": 3.076161633300781, "test_acc": 0.5428, "lyapunov": null, "grad_norm": 0.39710317166706477, "grad_max_sv": 0.2050964504480362, "grad_min_sv": 7.753612097250589e-09, "grad_condition": 177848968.01384813, "lr": 4.7586473766990294e-05, "time_sec": 32.619911193847656 }, { "epoch": 130, "train_loss": 0.14840273664474488, "train_acc": 0.95386, "test_loss": 3.0291847702026367, "test_acc": 0.5514, "lyapunov": null, "grad_norm": 0.3943339950090642, "grad_max_sv": 0.20189184583723546, "grad_min_sv": 7.418064280288045e-09, "grad_condition": 225551543.43719563, "lr": 4.32272711786996e-05, "time_sec": 32.61198544502258 }, { "epoch": 131, "train_loss": 0.1431949885225296, "train_acc": 0.95528, "test_loss": 3.027348929977417, "test_acc": 0.5507, "lyapunov": null, "grad_norm": 0.38711994826678314, "grad_max_sv": 0.19673722572624683, "grad_min_sv": 7.518409088564434e-09, "grad_condition": 1146835061.4670472, "lr": 3.906842420574966e-05, "time_sec": 32.61335587501526 }, { "epoch": 132, "train_loss": 0.1487313818216324, "train_acc": 0.95322, "test_loss": 3.0886004333496095, "test_acc": 0.5461, "lyapunov": null, "grad_norm": 0.395507713545241, "grad_max_sv": 0.20544077269732952, "grad_min_sv": 7.573043920433565e-09, "grad_condition": 168877391.5952191, "lr": 3.5111757055874305e-05, "time_sec": 32.5999391078949 }, { "epoch": 133, "train_loss": 0.14615771746635436, "train_acc": 0.95264, "test_loss": 3.000204067611694, "test_acc": 0.5534, "lyapunov": null, "grad_norm": 0.3932909447553781, "grad_max_sv": 0.18928411398082973, "grad_min_sv": 7.371471794906034e-09, "grad_condition": 362753839.3369804, "lr": 3.1359005254054254e-05, "time_sec": 32.6199426651001 }, { "epoch": 134, "train_loss": 0.14433889319181442, "train_acc": 0.95458, "test_loss": 3.007744090270996, "test_acc": 0.5535, "lyapunov": null, "grad_norm": 0.38729299837720393, "grad_max_sv": 0.1966633189469576, "grad_min_sv": 7.389140074115508e-09, "grad_condition": 474683811.0722334, "lr": 2.7811814881259484e-05, "time_sec": 32.66906452178955 }, { "epoch": 135, "train_loss": 0.14040502546787262, "train_acc": 0.95526, "test_loss": 2.9782509716033934, "test_acc": 0.5519, "lyapunov": null, "grad_norm": 0.3837181152764762, "grad_max_sv": 0.19970894865691663, "grad_min_sv": 7.428829410741772e-09, "grad_condition": 568455087.6695989, "lr": 2.4471741852423218e-05, "time_sec": 32.612287521362305 }, { "epoch": 136, "train_loss": 0.14493111051797866, "train_acc": 0.95468, "test_loss": 3.0520059284210204, "test_acc": 0.5481, "lyapunov": null, "grad_norm": 0.39055918813288093, "grad_max_sv": 0.20612289309501647, "grad_min_sv": 7.689209627608634e-09, "grad_condition": 670288720.96072, "lr": 2.1340251233966362e-05, "time_sec": 32.61230111122131 }, { "epoch": 137, "train_loss": 0.1412872414493561, "train_acc": 0.95532, "test_loss": 2.9926007400512695, "test_acc": 0.5538, "lyapunov": null, "grad_norm": 0.3847438191608403, "grad_max_sv": 0.1935590598732233, "grad_min_sv": 7.3988825210688506e-09, "grad_condition": 818122774.676174, "lr": 1.8418716601170932e-05, "time_sec": 32.63673734664917 }, { "epoch": 138, "train_loss": 0.1368464488697052, "train_acc": 0.95786, "test_loss": 3.0026862827301026, "test_acc": 0.5541, "lyapunov": null, "grad_norm": 0.3793276651282968, "grad_max_sv": 0.2012945655733347, "grad_min_sv": 7.351351802645234e-09, "grad_condition": 363599415.4796465, "lr": 1.570841943568445e-05, "time_sec": 32.59603404998779 }, { "epoch": 139, "train_loss": 0.1389853618478775, "train_acc": 0.95644, "test_loss": 3.04127444152832, "test_acc": 0.5497, "lyapunov": null, "grad_norm": 0.38369680042825305, "grad_max_sv": 0.1901318434625864, "grad_min_sv": 7.190909153147098e-09, "grad_condition": 1063192542.6047398, "lr": 1.3210548563419845e-05, "time_sec": 32.623175382614136 }, { "epoch": 140, "train_loss": 0.13792312327384948, "train_acc": 0.95614, "test_loss": 3.004412171936035, "test_acc": 0.5534, "lyapunov": null, "grad_norm": 0.37904522036307264, "grad_max_sv": 0.19201667234301567, "grad_min_sv": 7.376605424202435e-09, "grad_condition": 1234012097.4190845, "lr": 1.0926199633097203e-05, "time_sec": 32.630115270614624 }, { "epoch": 141, "train_loss": 0.1407741106414795, "train_acc": 0.95654, "test_loss": 3.0456832256317137, "test_acc": 0.5511, "lyapunov": null, "grad_norm": 0.38330137862093777, "grad_max_sv": 0.19592518154531718, "grad_min_sv": 7.054394128222507e-09, "grad_condition": 86708521.56413671, "lr": 8.856374635655688e-06, "time_sec": 32.61585021018982 }, { "epoch": 142, "train_loss": 0.1388852431154251, "train_acc": 0.95632, "test_loss": 3.063602409744263, "test_acc": 0.5478, "lyapunov": null, "grad_norm": 0.3828568546417417, "grad_max_sv": 0.1969303483143449, "grad_min_sv": 7.518555048707278e-09, "grad_condition": 678890293.0423553, "lr": 7.001981464747503e-06, "time_sec": 32.630441427230835 }, { "epoch": 143, "train_loss": 0.13581469515800476, "train_acc": 0.9579, "test_loss": 3.0148553092956543, "test_acc": 0.5538, "lyapunov": null, "grad_norm": 0.37580622771801075, "grad_max_sv": 0.18920586220920085, "grad_min_sv": 7.312373946242665e-09, "grad_condition": 360908520.84421337, "lr": 5.3638335185058295e-06, "time_sec": 32.64005398750305 }, { "epoch": 144, "train_loss": 0.1397603491592407, "train_acc": 0.9547, "test_loss": 3.017238700866699, "test_acc": 0.5514, "lyapunov": null, "grad_norm": 0.3851319102923484, "grad_max_sv": 0.19529533758759499, "grad_min_sv": 7.18097194788922e-09, "grad_condition": 274499937.83092636, "lr": 3.942649342761114e-06, "time_sec": 32.60517716407776 }, { "epoch": 145, "train_loss": 0.13670911428451538, "train_acc": 0.95648, "test_loss": 3.0282860946655275, "test_acc": 0.5508, "lyapunov": null, "grad_norm": 0.37783913784420287, "grad_max_sv": 0.19311878457665443, "grad_min_sv": 7.273629627901489e-09, "grad_condition": 2161793817.455667, "lr": 2.7390523158633524e-06, "time_sec": 32.614171266555786 }, { "epoch": 146, "train_loss": 0.1391296845769882, "train_acc": 0.95668, "test_loss": 3.0094220054626466, "test_acc": 0.5501, "lyapunov": null, "grad_norm": 0.37960085678866656, "grad_max_sv": 0.18867351226508616, "grad_min_sv": 7.0429120130072884e-09, "grad_condition": 483257361.70673215, "lr": 1.7535703752478133e-06, "time_sec": 32.59815835952759 }, { "epoch": 147, "train_loss": 0.13715074803590774, "train_acc": 0.95716, "test_loss": 3.018283353805542, "test_acc": 0.5494, "lyapunov": null, "grad_norm": 0.3750663523004214, "grad_max_sv": 0.19733735918998718, "grad_min_sv": 7.336720725349341e-09, "grad_condition": 639022830.9873111, "lr": 9.866357858642196e-07, "time_sec": 32.63532900810242 }, { "epoch": 148, "train_loss": 0.13438899482250213, "train_acc": 0.95838, "test_loss": 3.0480747367858885, "test_acc": 0.5511, "lyapunov": null, "grad_norm": 0.374029090307932, "grad_max_sv": 0.19485083129256964, "grad_min_sv": 7.2787410602915756e-09, "grad_condition": 1280998842.4402964, "lr": 4.38584950570808e-07, "time_sec": 32.61666941642761 }, { "epoch": 149, "train_loss": 0.1355752257716656, "train_acc": 0.95742, "test_loss": 3.020583014678955, "test_acc": 0.5479, "lyapunov": null, "grad_norm": 0.3742080999065961, "grad_max_sv": 0.18681482430547475, "grad_min_sv": 7.387960459213656e-09, "grad_condition": 886872133.6824732, "lr": 1.096582625772501e-07, "time_sec": 32.62542963027954 }, { "epoch": 150, "train_loss": 0.13964056191444396, "train_acc": 0.95646, "test_loss": 3.1249655624389647, "test_acc": 0.5464, "lyapunov": null, "grad_norm": 0.3794352519997707, "grad_max_sv": 0.2051174059510231, "grad_min_sv": 7.552300875884155e-09, "grad_condition": 4688136301.586805, "lr": 0.0, "time_sec": 32.61311602592468 } ], "12": [ { "epoch": 1, "train_loss": 4.857979267883301, "train_acc": 0.03128, "test_loss": 4.8280028671264645, "test_acc": 0.0162, "lyapunov": null, "grad_norm": 5.914070912211268, "grad_max_sv": 5.325387370586395, "grad_min_sv": 9.769405192663893e-08, "grad_condition": 1337497985.1511102, "lr": 0.0009998903417374227, "time_sec": 49.62461066246033 }, { "epoch": 2, "train_loss": 4.336386154098511, "train_acc": 0.05714, "test_loss": 4.968493894958496, "test_acc": 0.0197, "lyapunov": null, "grad_norm": 4.4863167388537235, "grad_max_sv": 3.9469796657562255, "grad_min_sv": 7.601632206477583e-08, "grad_condition": 129963899.4749479, "lr": 0.0009995614150494292, "time_sec": 49.636900901794434 }, { "epoch": 3, "train_loss": 4.062883013763428, "train_acc": 0.08342, "test_loss": 4.448897337341308, "test_acc": 0.037, "lyapunov": null, "grad_norm": 3.6333047310988777, "grad_max_sv": 3.0409141004085543, "grad_min_sv": 6.369543137374478e-08, "grad_condition": 59962043.95176021, "lr": 0.0009990133642141358, "time_sec": 49.63047957420349 }, { "epoch": 4, "train_loss": 3.8605975818634035, "train_acc": 0.10722, "test_loss": 4.516425963592529, "test_acc": 0.0415, "lyapunov": null, "grad_norm": 3.020259734680317, "grad_max_sv": 2.476314604282379, "grad_min_sv": 5.230481114892882e-08, "grad_condition": 51922675.56557977, "lr": 0.0009982464296247522, "time_sec": 49.61615824699402 }, { "epoch": 5, "train_loss": 3.6876567860412597, "train_acc": 0.13404, "test_loss": 4.7616854064941405, "test_acc": 0.0373, "lyapunov": null, "grad_norm": 2.454606191256652, "grad_max_sv": 1.8841783970594406, "grad_min_sv": 4.2170166864030635e-08, "grad_condition": 61784571.5567351, "lr": 0.0009972609476841367, "time_sec": 49.621190309524536 }, { "epoch": 6, "train_loss": 3.5600004296875, "train_acc": 0.15464, "test_loss": 4.541135731506348, "test_acc": 0.0565, "lyapunov": null, "grad_norm": 2.047081522054368, "grad_max_sv": 1.4700775474309922, "grad_min_sv": 3.5812032206372636e-08, "grad_condition": 47166242.58068286, "lr": 0.000996057350657239, "time_sec": 49.63187623023987 }, { "epoch": 7, "train_loss": 3.453279203033447, "train_acc": 0.17224, "test_loss": 4.9032746643066405, "test_acc": 0.0512, "lyapunov": null, "grad_norm": 1.7128403586652834, "grad_max_sv": 1.1189136162400246, "grad_min_sv": 3.018336235394159e-08, "grad_condition": 41920446.3053714, "lr": 0.000994636166481494, "time_sec": 49.60520005226135 }, { "epoch": 8, "train_loss": 3.36041114944458, "train_acc": 0.1888, "test_loss": 4.752816521453857, "test_acc": 0.0648, "lyapunov": null, "grad_norm": 1.4850467477612923, "grad_max_sv": 0.8669481813907624, "grad_min_sv": 2.6475041869922223e-08, "grad_condition": 37599938.73602452, "lr": 0.0009929980185352525, "time_sec": 49.618135929107666 }, { "epoch": 9, "train_loss": 3.286079960784912, "train_acc": 0.20154, "test_loss": 5.178885292053223, "test_acc": 0.0623, "lyapunov": null, "grad_norm": 1.342261473440063, "grad_max_sv": 0.7033843606710434, "grad_min_sv": 2.384479090948577e-08, "grad_condition": 141440858.58776602, "lr": 0.0009911436253643444, "time_sec": 49.62771654129028 }, { "epoch": 10, "train_loss": 3.2129677861022947, "train_acc": 0.2144, "test_loss": 5.0195522842407225, "test_acc": 0.0622, "lyapunov": null, "grad_norm": 1.2503967032062735, "grad_max_sv": 0.6261777065694332, "grad_min_sv": 2.239258505704056e-08, "grad_condition": 118005336.87045276, "lr": 0.0009890738003669028, "time_sec": 49.60965371131897 }, { "epoch": 11, "train_loss": 3.162713228683472, "train_acc": 0.22544, "test_loss": 4.962263533020019, "test_acc": 0.0779, "lyapunov": null, "grad_norm": 1.1906728267056432, "grad_max_sv": 0.5766806580126286, "grad_min_sv": 2.144448115332098e-08, "grad_condition": 68570214.69490463, "lr": 0.00098678945143658, "time_sec": 49.638447284698486 }, { "epoch": 12, "train_loss": 3.107430252532959, "train_acc": 0.23672, "test_loss": 5.273008836364746, "test_acc": 0.0622, "lyapunov": null, "grad_norm": 1.1141405269120466, "grad_max_sv": 0.5137097157537938, "grad_min_sv": 2.047304612853851e-08, "grad_condition": 58656857.58404706, "lr": 0.0009842915805643154, "time_sec": 49.64548635482788 }, { "epoch": 13, "train_loss": 3.054518303833008, "train_acc": 0.24298, "test_loss": 4.751382202148437, "test_acc": 0.0805, "lyapunov": null, "grad_norm": 1.056334374659988, "grad_max_sv": 0.4537819892168045, "grad_min_sv": 1.9099582219961332e-08, "grad_condition": 40473913.58753422, "lr": 0.000981581283398829, "time_sec": 49.62596035003662 }, { "epoch": 14, "train_loss": 3.0128901699066164, "train_acc": 0.2535, "test_loss": 5.3179588119506835, "test_acc": 0.0894, "lyapunov": null, "grad_norm": 1.0060720335526403, "grad_max_sv": 0.4221613615751266, "grad_min_sv": 1.8469374840623944e-08, "grad_condition": 27648316.070058893, "lr": 0.0009786597487660333, "time_sec": 49.63119626045227 }, { "epoch": 15, "train_loss": 2.9737020013427733, "train_acc": 0.26082, "test_loss": 6.165470205688477, "test_acc": 0.0593, "lyapunov": null, "grad_norm": 0.9787012560859192, "grad_max_sv": 0.39918764010071756, "grad_min_sv": 1.789977660815456e-08, "grad_condition": 32066062.312103875, "lr": 0.0009755282581475766, "time_sec": 49.61084794998169 }, { "epoch": 16, "train_loss": 2.9363278299713134, "train_acc": 0.2678, "test_loss": 7.10851273803711, "test_acc": 0.0421, "lyapunov": null, "grad_norm": 0.9372246408127133, "grad_max_sv": 0.38435717970132827, "grad_min_sv": 1.733210386878348e-08, "grad_condition": 24088715.267205216, "lr": 0.0009721881851187403, "time_sec": 49.61706733703613 }, { "epoch": 17, "train_loss": 2.911891692504883, "train_acc": 0.27176, "test_loss": 6.38866512298584, "test_acc": 0.0601, "lyapunov": null, "grad_norm": 0.9126706344355823, "grad_max_sv": 0.3579227849841118, "grad_min_sv": 1.667584251102694e-08, "grad_condition": 47679489.14127077, "lr": 0.0009686409947459456, "time_sec": 49.62139368057251 }, { "epoch": 18, "train_loss": 2.8810440801239015, "train_acc": 0.2804, "test_loss": 6.160967282104492, "test_acc": 0.0718, "lyapunov": null, "grad_norm": 0.8853626149459919, "grad_max_sv": 0.36028596982359884, "grad_min_sv": 1.644115990712125e-08, "grad_condition": 52172419.08719461, "lr": 0.0009648882429441254, "time_sec": 49.61437940597534 }, { "epoch": 19, "train_loss": 2.845276382827759, "train_acc": 0.28578, "test_loss": 5.377824464416504, "test_acc": 0.0852, "lyapunov": null, "grad_norm": 0.859853543351059, "grad_max_sv": 0.33440142646431925, "grad_min_sv": 1.5989740054234146e-08, "grad_condition": 23981566.09987827, "lr": 0.00096093157579425, "time_sec": 49.60141611099243 }, { "epoch": 20, "train_loss": 2.8133937200927734, "train_acc": 0.29282, "test_loss": 6.930623114013672, "test_acc": 0.061, "lyapunov": null, "grad_norm": 0.8428428790749917, "grad_max_sv": 0.3265179105103016, "grad_min_sv": 1.569473392637466e-08, "grad_condition": 52730874.60876007, "lr": 0.0009567727288213001, "time_sec": 49.62118935585022 }, { "epoch": 21, "train_loss": 2.792502545776367, "train_acc": 0.29682, "test_loss": 7.603221396636963, "test_acc": 0.0601, "lyapunov": null, "grad_norm": 0.8301062641843454, "grad_max_sv": 0.3209334272891283, "grad_min_sv": 1.5400497213602372e-08, "grad_condition": 32858821.905855753, "lr": 0.0009524135262330095, "time_sec": 49.61830496788025 }, { "epoch": 22, "train_loss": 2.763432760696411, "train_acc": 0.30106, "test_loss": 7.683717921447754, "test_acc": 0.0632, "lyapunov": null, "grad_norm": 0.8155075807756811, "grad_max_sv": 0.31464248038828374, "grad_min_sv": 1.523456016894187e-08, "grad_condition": 22807354.246203102, "lr": 0.0009478558801197061, "time_sec": 49.62720441818237 }, { "epoch": 23, "train_loss": 2.7460695344543455, "train_acc": 0.3031, "test_loss": 5.747795407867431, "test_acc": 0.0819, "lyapunov": null, "grad_norm": 0.7966165231048401, "grad_max_sv": 0.29990778900682924, "grad_min_sv": 1.4812020640575519e-08, "grad_condition": 26907900.924312055, "lr": 0.000943101789615607, "time_sec": 49.620564699172974 }, { "epoch": 24, "train_loss": 2.713617621231079, "train_acc": 0.31124, "test_loss": 6.716322633361816, "test_acc": 0.08, "lyapunov": null, "grad_norm": 0.7863969132473815, "grad_max_sv": 0.3049128696322441, "grad_min_sv": 1.4714444074304112e-08, "grad_condition": 23621111.366144888, "lr": 0.0009381533400219313, "time_sec": 49.6185462474823 }, { "epoch": 25, "train_loss": 2.692608075027466, "train_acc": 0.3135, "test_loss": 6.315327671813965, "test_acc": 0.0773, "lyapunov": null, "grad_norm": 0.7780809028085155, "grad_max_sv": 0.28820848651230335, "grad_min_sv": 1.4556970873158548e-08, "grad_condition": 22925885.469558023, "lr": 0.0009330127018922189, "time_sec": 49.63029909133911 }, { "epoch": 26, "train_loss": 2.6578130314636232, "train_acc": 0.32226, "test_loss": 7.161731970214844, "test_acc": 0.074, "lyapunov": null, "grad_norm": 0.7600241350813963, "grad_max_sv": 0.27918743565678594, "grad_min_sv": 1.41998530961418e-08, "grad_condition": 24836498.868989673, "lr": 0.000927682130080253, "time_sec": 49.61888551712036 }, { "epoch": 27, "train_loss": 2.6360860138702393, "train_acc": 0.3281, "test_loss": 6.265446292114258, "test_acc": 0.072, "lyapunov": null, "grad_norm": 0.7503860366874832, "grad_max_sv": 0.27820607759058474, "grad_min_sv": 1.403503115116056e-08, "grad_condition": 43704568.438496746, "lr": 0.0009221639627510072, "time_sec": 49.6322455406189 }, { "epoch": 28, "train_loss": 2.621903458404541, "train_acc": 0.33094, "test_loss": 8.008352018737792, "test_acc": 0.0635, "lyapunov": null, "grad_norm": 0.7411508249278186, "grad_max_sv": 0.276602141186595, "grad_min_sv": 1.3749510615473914e-08, "grad_condition": 48846366.407403715, "lr": 0.0009164606203550494, "time_sec": 49.62464737892151 }, { "epoch": 29, "train_loss": 2.6009712726593017, "train_acc": 0.33356, "test_loss": 6.3420821472167965, "test_acc": 0.0871, "lyapunov": null, "grad_norm": 0.7392237108014773, "grad_max_sv": 0.2745568320155144, "grad_min_sv": 1.3796570551283249e-08, "grad_condition": 31273171.49927681, "lr": 0.0009105746045668516, "time_sec": 49.654367446899414 }, { "epoch": 30, "train_loss": 2.5890472722625733, "train_acc": 0.33498, "test_loss": 6.483042420959473, "test_acc": 0.0746, "lyapunov": null, "grad_norm": 0.7254213710143503, "grad_max_sv": 0.2663456965237856, "grad_min_sv": 1.3537345176783955e-08, "grad_condition": 33323808.90351194, "lr": 0.0009045084971874733, "time_sec": 49.62457275390625 }, { "epoch": 31, "train_loss": 2.5546424687194826, "train_acc": 0.3411, "test_loss": 5.880196138000488, "test_acc": 0.0666, "lyapunov": null, "grad_norm": 0.7170650074645288, "grad_max_sv": 0.2706871546804905, "grad_min_sv": 1.3557976122346993e-08, "grad_condition": 55625831.471463725, "lr": 0.0008982649590120977, "time_sec": 49.625417709350586 }, { "epoch": 32, "train_loss": 2.5356599130249022, "train_acc": 0.3476, "test_loss": 6.206172892761231, "test_acc": 0.0935, "lyapunov": null, "grad_norm": 0.7148263297514528, "grad_max_sv": 0.2631382804363966, "grad_min_sv": 1.335368298993611e-08, "grad_condition": 27919253.234171998, "lr": 0.0008918467286629196, "time_sec": 49.64267349243164 }, { "epoch": 33, "train_loss": 2.520495999908447, "train_acc": 0.34764, "test_loss": 6.414087007141113, "test_acc": 0.0819, "lyapunov": null, "grad_norm": 0.7096693517368512, "grad_max_sv": 0.2555254019796848, "grad_min_sv": 1.326168482251866e-08, "grad_condition": 30057889.81326326, "lr": 0.0008852566213878943, "time_sec": 49.633198976516724 }, { "epoch": 34, "train_loss": 2.4981268305206297, "train_acc": 0.35368, "test_loss": 7.161307034301758, "test_acc": 0.0753, "lyapunov": null, "grad_norm": 0.6981273416861422, "grad_max_sv": 0.25148845836520195, "grad_min_sv": 1.3116743149965693e-08, "grad_condition": 25097258.440184355, "lr": 0.000878497527825878, "time_sec": 49.629374980926514 }, { "epoch": 35, "train_loss": 2.4812187934875487, "train_acc": 0.35656, "test_loss": 6.375511972045898, "test_acc": 0.0787, "lyapunov": null, "grad_norm": 0.693256631694674, "grad_max_sv": 0.24989120960235595, "grad_min_sv": 1.3051334765701306e-08, "grad_condition": 22699406.58897232, "lr": 0.000871572412738697, "time_sec": 49.620848655700684 }, { "epoch": 36, "train_loss": 2.4649569733428955, "train_acc": 0.3595, "test_loss": 5.7549407691955565, "test_acc": 0.1002, "lyapunov": null, "grad_norm": 0.6880223056040339, "grad_max_sv": 0.2544675827026367, "grad_min_sv": 1.2971388471672008e-08, "grad_condition": 27090819.46416967, "lr": 0.0008644843137107055, "time_sec": 49.639307498931885 }, { "epoch": 37, "train_loss": 2.4404139349365233, "train_acc": 0.36276, "test_loss": 6.19379566192627, "test_acc": 0.0843, "lyapunov": null, "grad_norm": 0.6915322266205055, "grad_max_sv": 0.25557893700897694, "grad_min_sv": 1.3099128221005785e-08, "grad_condition": 22396412.415633548, "lr": 0.0008572363398164014, "time_sec": 49.65658497810364 }, { "epoch": 38, "train_loss": 2.4350104721832277, "train_acc": 0.36944, "test_loss": 6.483997691345214, "test_acc": 0.0947, "lyapunov": null, "grad_norm": 0.6860817508888643, "grad_max_sv": 0.24186794832348824, "grad_min_sv": 1.2734190080188058e-08, "grad_condition": 24245161.640245236, "lr": 0.0008498316702566826, "time_sec": 49.636590003967285 }, { "epoch": 39, "train_loss": 2.4035986038970947, "train_acc": 0.37506, "test_loss": 7.426128985595703, "test_acc": 0.0633, "lyapunov": null, "grad_norm": 0.6768284631491337, "grad_max_sv": 0.23978918939828872, "grad_min_sv": 1.2544681339196617e-08, "grad_condition": 58875883.49556484, "lr": 0.0008422735529643442, "time_sec": 49.6271595954895 }, { "epoch": 40, "train_loss": 2.396695173187256, "train_acc": 0.37446, "test_loss": 6.887982989501953, "test_acc": 0.0659, "lyapunov": null, "grad_norm": 0.6758452994499082, "grad_max_sv": 0.23218532651662827, "grad_min_sv": 1.2284334864609559e-08, "grad_condition": 27825244.741001748, "lr": 0.0008345653031794289, "time_sec": 49.6188850402832 }, { "epoch": 41, "train_loss": 2.3766202754211427, "train_acc": 0.38084, "test_loss": 7.051847720336914, "test_acc": 0.061, "lyapunov": null, "grad_norm": 0.6727252530320494, "grad_max_sv": 0.2428621307015419, "grad_min_sv": 1.2773543862920622e-08, "grad_condition": 27042190.577230137, "lr": 0.0008267103019950526, "time_sec": 49.63360857963562 }, { "epoch": 42, "train_loss": 2.3670169010925295, "train_acc": 0.38192, "test_loss": 6.82649090423584, "test_acc": 0.0753, "lyapunov": null, "grad_norm": 0.6702600637325808, "grad_max_sv": 0.23488462790846826, "grad_min_sv": 1.2701740556564367e-08, "grad_condition": 22978134.483096853, "lr": 0.0008187119948743447, "time_sec": 49.626428842544556 }, { "epoch": 43, "train_loss": 2.34640893951416, "train_acc": 0.38418, "test_loss": 7.456131955718994, "test_acc": 0.0764, "lyapunov": null, "grad_norm": 0.6673821071425099, "grad_max_sv": 0.2304955620318651, "grad_min_sv": 1.2439765384453239e-08, "grad_condition": 31820388.99010671, "lr": 0.000810573890139155, "time_sec": 49.62021851539612 }, { "epoch": 44, "train_loss": 2.3332527070617677, "train_acc": 0.38834, "test_loss": 6.233900453186036, "test_acc": 0.0882, "lyapunov": null, "grad_norm": 0.6619434612787911, "grad_max_sv": 0.23275020457804202, "grad_min_sv": 1.2357255231576491e-08, "grad_condition": 41092001.19472371, "lr": 0.0008022995574311873, "time_sec": 49.632553815841675 }, { "epoch": 45, "train_loss": 2.319253850402832, "train_acc": 0.3902, "test_loss": 7.539175698852539, "test_acc": 0.0652, "lyapunov": null, "grad_norm": 0.6606380867238602, "grad_max_sv": 0.2288034502416849, "grad_min_sv": 1.234043749409608e-08, "grad_condition": 23995474.740780547, "lr": 0.0007938926261462363, "time_sec": 49.638259410858154 }, { "epoch": 46, "train_loss": 2.308006600112915, "train_acc": 0.39154, "test_loss": 7.362489430999756, "test_acc": 0.0558, "lyapunov": null, "grad_norm": 0.660045345704197, "grad_max_sv": 0.2337587408721447, "grad_min_sv": 1.2529785493875512e-08, "grad_condition": 24243355.610875387, "lr": 0.0007853567838422158, "time_sec": 49.64337158203125 }, { "epoch": 47, "train_loss": 2.287512142944336, "train_acc": 0.39698, "test_loss": 7.659019016265869, "test_acc": 0.0729, "lyapunov": null, "grad_norm": 0.6552491008893353, "grad_max_sv": 0.2252129375934601, "grad_min_sv": 1.2101228903660389e-08, "grad_condition": 37944286.39668895, "lr": 0.0007766957746216719, "time_sec": 49.610002756118774 }, { "epoch": 48, "train_loss": 2.2750962590026855, "train_acc": 0.39712, "test_loss": 6.906008920288086, "test_acc": 0.085, "lyapunov": null, "grad_norm": 0.6572787443040576, "grad_max_sv": 0.23201882764697074, "grad_min_sv": 1.233105519499178e-08, "grad_condition": 27571588.322845332, "lr": 0.0007679133974894982, "time_sec": 49.65186142921448 }, { "epoch": 49, "train_loss": 2.2525532193756104, "train_acc": 0.40456, "test_loss": 7.617325218963623, "test_acc": 0.074, "lyapunov": null, "grad_norm": 0.6492386918943517, "grad_max_sv": 0.2307146478444338, "grad_min_sv": 1.229703296403914e-08, "grad_condition": 211540506.258676, "lr": 0.000759013504686565, "time_sec": 49.6446647644043 }, { "epoch": 50, "train_loss": 2.237634787826538, "train_acc": 0.40684, "test_loss": 6.678198162841797, "test_acc": 0.0633, "lyapunov": null, "grad_norm": 0.6565102133805185, "grad_max_sv": 0.2293539997190237, "grad_min_sv": 1.2340318197856526e-08, "grad_condition": 27740724.758145083, "lr": 0.0007499999999999998, "time_sec": 49.653481006622314 }, { "epoch": 51, "train_loss": 2.209577166748047, "train_acc": 0.40976, "test_loss": 6.840425001525879, "test_acc": 0.0718, "lyapunov": null, "grad_norm": 0.6547461235382159, "grad_max_sv": 0.22949806824326516, "grad_min_sv": 1.2320622985728668e-08, "grad_condition": 23307963.55905198, "lr": 0.0007408768370508575, "time_sec": 49.61805582046509 }, { "epoch": 52, "train_loss": 2.200788235549927, "train_acc": 0.41432, "test_loss": 7.2077490463256835, "test_acc": 0.0756, "lyapunov": null, "grad_norm": 0.6510213685672233, "grad_max_sv": 0.23402363583445548, "grad_min_sv": 1.2258231881986937e-08, "grad_condition": 75476519.13664213, "lr": 0.0007316480175599307, "time_sec": 49.646629095077515 }, { "epoch": 53, "train_loss": 2.184033504333496, "train_acc": 0.41906, "test_loss": 6.790815046691894, "test_acc": 0.0761, "lyapunov": null, "grad_norm": 0.6498948423513097, "grad_max_sv": 0.2297774288803339, "grad_min_sv": 1.2289613515736875e-08, "grad_condition": 25175002.986691862, "lr": 0.0007223175895924635, "time_sec": 49.616777181625366 }, { "epoch": 54, "train_loss": 2.1751246100616455, "train_acc": 0.4209, "test_loss": 7.843894770812988, "test_acc": 0.0728, "lyapunov": null, "grad_norm": 0.6502026955560598, "grad_max_sv": 0.22432956397533416, "grad_min_sv": 1.2058743079079725e-08, "grad_condition": 27210725.454316296, "lr": 0.0007128896457825361, "time_sec": 49.63462972640991 }, { "epoch": 55, "train_loss": 2.1508761085510253, "train_acc": 0.42416, "test_loss": 7.085880072784424, "test_acc": 0.0952, "lyapunov": null, "grad_norm": 0.6487356152863625, "grad_max_sv": 0.22850245125591756, "grad_min_sv": 1.2312155951710312e-08, "grad_condition": 41183718.923533805, "lr": 0.0007033683215378998, "time_sec": 49.64608693122864 }, { "epoch": 56, "train_loss": 2.141602848587036, "train_acc": 0.42634, "test_loss": 6.250551121520996, "test_acc": 0.0971, "lyapunov": null, "grad_norm": 0.6410808562446506, "grad_max_sv": 0.2151340998709202, "grad_min_sv": 1.176430176191845e-08, "grad_condition": 30604181.986327033, "lr": 0.0006937577932260512, "time_sec": 49.70740008354187 }, { "epoch": 57, "train_loss": 2.14431159286499, "train_acc": 0.42548, "test_loss": 6.846168923950195, "test_acc": 0.0958, "lyapunov": null, "grad_norm": 0.6444720385859491, "grad_max_sv": 0.2224727988243103, "grad_min_sv": 1.2025717233132837e-08, "grad_condition": 23924517.448539954, "lr": 0.0006840622763423388, "time_sec": 49.63225722312927 }, { "epoch": 58, "train_loss": 2.10916792388916, "train_acc": 0.43432, "test_loss": 6.8249847625732425, "test_acc": 0.1066, "lyapunov": null, "grad_norm": 0.6502634467633226, "grad_max_sv": 0.22863934263587, "grad_min_sv": 1.218627998234023e-08, "grad_condition": 28771962.702913057, "lr": 0.0006742860236609073, "time_sec": 49.63661074638367 }, { "epoch": 59, "train_loss": 2.100633440322876, "train_acc": 0.43724, "test_loss": 7.080769053649902, "test_acc": 0.097, "lyapunov": null, "grad_norm": 0.6514345540301675, "grad_max_sv": 0.23131897561252118, "grad_min_sv": 1.2473222341102818e-08, "grad_condition": 23428156.69088362, "lr": 0.0006644333233692913, "time_sec": 49.631585359573364 }, { "epoch": 60, "train_loss": 2.0753550579452513, "train_acc": 0.44222, "test_loss": 7.097881182861328, "test_acc": 0.0782, "lyapunov": null, "grad_norm": 0.642048459758103, "grad_max_sv": 0.21754480227828027, "grad_min_sv": 1.2038245155582273e-08, "grad_condition": 35173118.59205349, "lr": 0.0006545084971874734, "time_sec": 49.642804861068726 }, { "epoch": 61, "train_loss": 2.060260758514404, "train_acc": 0.4465, "test_loss": 6.766320790863037, "test_acc": 0.0839, "lyapunov": null, "grad_norm": 0.6459643627424662, "grad_max_sv": 0.223102143406868, "grad_min_sv": 1.22261165164117e-08, "grad_condition": 22073921.720915027, "lr": 0.0006445158984722354, "time_sec": 49.64657950401306 }, { "epoch": 62, "train_loss": 2.0472131072998048, "train_acc": 0.4486, "test_loss": 6.881848452758789, "test_acc": 0.0976, "lyapunov": null, "grad_norm": 0.6461433133831308, "grad_max_sv": 0.22962211742997168, "grad_min_sv": 1.2113809159074174e-08, "grad_condition": 324038818.4677658, "lr": 0.0006344599103076324, "time_sec": 49.627341747283936 }, { "epoch": 63, "train_loss": 2.035955301361084, "train_acc": 0.44882, "test_loss": 7.18960142211914, "test_acc": 0.0878, "lyapunov": null, "grad_norm": 0.6422783690964438, "grad_max_sv": 0.2209172960370779, "grad_min_sv": 1.2127595816480152e-08, "grad_condition": 21910433.389134284, "lr": 0.0006243449435824269, "time_sec": 49.64501976966858 }, { "epoch": 64, "train_loss": 2.036686828079224, "train_acc": 0.45056, "test_loss": 7.650535336303711, "test_acc": 0.0924, "lyapunov": null, "grad_norm": 0.641718667248247, "grad_max_sv": 0.22157798074185847, "grad_min_sv": 1.1966991517176062e-08, "grad_condition": 25321432.686805125, "lr": 0.0006141754350553275, "time_sec": 49.63518667221069 }, { "epoch": 65, "train_loss": 2.0039944877624514, "train_acc": 0.45574, "test_loss": 7.262261317443848, "test_acc": 0.114, "lyapunov": null, "grad_norm": 0.6509729656164255, "grad_max_sv": 0.2328164666891098, "grad_min_sv": 1.2227686406116046e-08, "grad_condition": 78588688.09864715, "lr": 0.0006039558454088793, "time_sec": 49.62892246246338 }, { "epoch": 66, "train_loss": 1.9934623148345947, "train_acc": 0.4604, "test_loss": 6.735845774841309, "test_acc": 0.0988, "lyapunov": null, "grad_norm": 0.6428090636861153, "grad_max_sv": 0.22018610946834088, "grad_min_sv": 1.2050285417425366e-08, "grad_condition": 33987345.003156364, "lr": 0.000593690657292862, "time_sec": 49.634801626205444 }, { "epoch": 67, "train_loss": 1.968681404800415, "train_acc": 0.46364, "test_loss": 7.602304705810547, "test_acc": 0.0987, "lyapunov": null, "grad_norm": 0.6457740641454927, "grad_max_sv": 0.2279145259410143, "grad_min_sv": 1.2256968678903136e-08, "grad_condition": 23591230.853540566, "lr": 0.0005833843733580507, "time_sec": 49.640379190444946 }, { "epoch": 68, "train_loss": 1.9723771545791626, "train_acc": 0.46456, "test_loss": 7.501553115844726, "test_acc": 0.0743, "lyapunov": null, "grad_norm": 0.6345718818470338, "grad_max_sv": 0.21636971682310105, "grad_min_sv": 1.1871784413863828e-08, "grad_condition": 21468624.440050583, "lr": 0.0005730415142812054, "time_sec": 49.618358850479126 }, { "epoch": 69, "train_loss": 1.950169172744751, "train_acc": 0.46892, "test_loss": 7.0990902679443355, "test_acc": 0.0888, "lyapunov": null, "grad_norm": 0.6406229801466465, "grad_max_sv": 0.2206659872084856, "grad_min_sv": 1.1992476682196051e-08, "grad_condition": 56593916.45522114, "lr": 0.0005626666167821517, "time_sec": 49.63790965080261 }, { "epoch": 70, "train_loss": 1.939907547531128, "train_acc": 0.4716, "test_loss": 7.282066575622559, "test_acc": 0.0983, "lyapunov": null, "grad_norm": 0.6459981596212524, "grad_max_sv": 0.23004377372562884, "grad_min_sv": 1.2037511798457245e-08, "grad_condition": 28235857.849722397, "lr": 0.0005522642316338265, "time_sec": 49.62828755378723 }, { "epoch": 71, "train_loss": 1.929073366470337, "train_acc": 0.47462, "test_loss": 6.812109463500977, "test_acc": 0.1063, "lyapunov": null, "grad_norm": 0.6476540219610287, "grad_max_sv": 0.22166885659098626, "grad_min_sv": 1.2136537663048897e-08, "grad_condition": 51677369.32839097, "lr": 0.0005418389216661573, "time_sec": 49.61943817138672 }, { "epoch": 72, "train_loss": 1.919623097305298, "train_acc": 0.47576, "test_loss": 6.68877933883667, "test_acc": 0.0798, "lyapunov": null, "grad_norm": 0.638990192022336, "grad_max_sv": 0.2177750900387764, "grad_min_sv": 1.1837285757154703e-08, "grad_condition": 30448032.105450857, "lr": 0.0005313952597646563, "time_sec": 49.63543653488159 }, { "epoch": 73, "train_loss": 1.8911805786514282, "train_acc": 0.4813, "test_loss": 7.259025004577636, "test_acc": 0.1017, "lyapunov": null, "grad_norm": 0.6388927531170105, "grad_max_sv": 0.2268439143896103, "grad_min_sv": 1.2116396552741548e-08, "grad_condition": 25828769.58088143, "lr": 0.0005209378268645994, "time_sec": 49.63246250152588 }, { "epoch": 74, "train_loss": 1.87730663772583, "train_acc": 0.4856, "test_loss": 6.621179290771485, "test_acc": 0.1118, "lyapunov": null, "grad_norm": 0.6382424632105009, "grad_max_sv": 0.22017028257250787, "grad_min_sv": 1.1917627623647676e-08, "grad_condition": 36459230.544282585, "lr": 0.0005104712099416781, "time_sec": 49.63705110549927 }, { "epoch": 75, "train_loss": 1.8676763352966308, "train_acc": 0.4867, "test_loss": 6.639352639770507, "test_acc": 0.1035, "lyapunov": null, "grad_norm": 0.6471776484855016, "grad_max_sv": 0.22313491702079774, "grad_min_sv": 1.2076539387256834e-08, "grad_condition": 168096640.34612545, "lr": 0.0004999999999999996, "time_sec": 49.62802839279175 }, { "epoch": 76, "train_loss": 1.8601240715026854, "train_acc": 0.48752, "test_loss": 7.69632975769043, "test_acc": 0.093, "lyapunov": null, "grad_norm": 0.6373532537157988, "grad_max_sv": 0.21818222440779209, "grad_min_sv": 1.1897569247160123e-08, "grad_condition": 49575276.624648556, "lr": 0.0004895287900583212, "time_sec": 49.61473488807678 }, { "epoch": 77, "train_loss": 1.844694657020569, "train_acc": 0.49, "test_loss": 7.673219400024414, "test_acc": 0.0971, "lyapunov": null, "grad_norm": 0.6357429485708425, "grad_max_sv": 0.21753050275146962, "grad_min_sv": 1.1727277435258366e-08, "grad_condition": 25108982.07055033, "lr": 0.0004790621731353997, "time_sec": 49.61942458152771 }, { "epoch": 78, "train_loss": 1.8382536688232423, "train_acc": 0.49426, "test_loss": 8.053473236083985, "test_acc": 0.0877, "lyapunov": null, "grad_norm": 0.6413732546621618, "grad_max_sv": 0.22126910798251628, "grad_min_sv": 1.217776433408424e-08, "grad_condition": 50630196.79387429, "lr": 0.000468604740235343, "time_sec": 49.620675802230835 }, { "epoch": 79, "train_loss": 1.8119768780899048, "train_acc": 0.50004, "test_loss": 7.10159133605957, "test_acc": 0.103, "lyapunov": null, "grad_norm": 0.64075038803741, "grad_max_sv": 0.22004345506429673, "grad_min_sv": 1.179401228554311e-08, "grad_condition": 39644724.18434289, "lr": 0.00045816107833384175, "time_sec": 49.65424633026123 }, { "epoch": 80, "train_loss": 1.805297444114685, "train_acc": 0.50122, "test_loss": 7.127357855224609, "test_acc": 0.1076, "lyapunov": null, "grad_norm": 0.6452326753546996, "grad_max_sv": 0.2212912131100893, "grad_min_sv": 1.2059882024961777e-08, "grad_condition": 29968320.229064513, "lr": 0.0004477357683661729, "time_sec": 49.62116003036499 }, { "epoch": 81, "train_loss": 1.792769065246582, "train_acc": 0.50348, "test_loss": 7.439458018493652, "test_acc": 0.0985, "lyapunov": null, "grad_norm": 0.6408257507786687, "grad_max_sv": 0.22126449905335904, "grad_min_sv": 1.1952658901526191e-08, "grad_condition": 23156470.62447612, "lr": 0.00043733338321784746, "time_sec": 49.64424705505371 }, { "epoch": 82, "train_loss": 1.770621812400818, "train_acc": 0.51052, "test_loss": 7.155345419311524, "test_acc": 0.1127, "lyapunov": null, "grad_norm": 0.6446017522348026, "grad_max_sv": 0.22318419590592384, "grad_min_sv": 1.1969205995082665e-08, "grad_condition": 88594611.75801164, "lr": 0.0004269584857187939, "time_sec": 49.622429847717285 }, { "epoch": 83, "train_loss": 1.769109418029785, "train_acc": 0.50846, "test_loss": 7.010694668579101, "test_acc": 0.1057, "lyapunov": null, "grad_norm": 0.6502891030839932, "grad_max_sv": 0.2263760395348072, "grad_min_sv": 1.2018579030603772e-08, "grad_condition": 29299643.5314746, "lr": 0.0004166156266419484, "time_sec": 49.614967584609985 }, { "epoch": 84, "train_loss": 1.7552229693222046, "train_acc": 0.51318, "test_loss": 7.019638833618164, "test_acc": 0.1006, "lyapunov": null, "grad_norm": 0.6441122145546607, "grad_max_sv": 0.21587914675474168, "grad_min_sv": 1.1914460645509606e-08, "grad_condition": 54331112.96990696, "lr": 0.0004063093427071373, "time_sec": 49.63624048233032 }, { "epoch": 85, "train_loss": 1.7453889175796509, "train_acc": 0.5142, "test_loss": 6.935272999572754, "test_acc": 0.0772, "lyapunov": null, "grad_norm": 0.6354119534548792, "grad_max_sv": 0.22349480539560318, "grad_min_sv": 1.188125494724912e-08, "grad_condition": 54450146.559093714, "lr": 0.0003960441545911199, "time_sec": 49.63727903366089 }, { "epoch": 86, "train_loss": 1.7361508292388916, "train_acc": 0.51694, "test_loss": 6.903331332397461, "test_acc": 0.0874, "lyapunov": null, "grad_norm": 0.6433396686482765, "grad_max_sv": 0.2229986496269703, "grad_min_sv": 1.2302347957016124e-08, "grad_condition": 20829684.95092944, "lr": 0.0003858245649446718, "time_sec": 49.620397329330444 }, { "epoch": 87, "train_loss": 1.7140229907989502, "train_acc": 0.52362, "test_loss": 6.144080555725098, "test_acc": 0.0973, "lyapunov": null, "grad_norm": 0.6397281329733326, "grad_max_sv": 0.2236575834453106, "grad_min_sv": 1.2130321444536741e-08, "grad_condition": 24582093.327500105, "lr": 0.00037565505641757235, "time_sec": 49.63749957084656 }, { "epoch": 88, "train_loss": 1.698942677230835, "train_acc": 0.52702, "test_loss": 6.329557989501953, "test_acc": 0.1043, "lyapunov": null, "grad_norm": 0.6429735672215783, "grad_max_sv": 0.22443199381232262, "grad_min_sv": 1.2242971281217762e-08, "grad_condition": 21997184.984676402, "lr": 0.00036554008969236695, "time_sec": 49.64341187477112 }, { "epoch": 89, "train_loss": 1.6915926089859008, "train_acc": 0.52672, "test_loss": 6.97091061706543, "test_acc": 0.1064, "lyapunov": null, "grad_norm": 0.6396443107842517, "grad_max_sv": 0.21398231349885463, "grad_min_sv": 1.1860397219898289e-08, "grad_condition": 25819116.390227333, "lr": 0.0003554841015277638, "time_sec": 49.61740279197693 }, { "epoch": 90, "train_loss": 1.6705048236846924, "train_acc": 0.53226, "test_loss": 6.474410656738281, "test_acc": 0.1104, "lyapunov": null, "grad_norm": 0.6447874278631877, "grad_max_sv": 0.22352466247975827, "grad_min_sv": 1.1839073051078675e-08, "grad_condition": 194632597.18194634, "lr": 0.000345491502812526, "time_sec": 49.63944673538208 }, { "epoch": 91, "train_loss": 1.6604324224090576, "train_acc": 0.53478, "test_loss": 7.210493100738526, "test_acc": 0.1186, "lyapunov": null, "grad_norm": 0.6483901695782636, "grad_max_sv": 0.23147397823631763, "grad_min_sv": 1.2240159032281435e-08, "grad_condition": 833122995.4080375, "lr": 0.0003355666766307081, "time_sec": 49.65723490715027 }, { "epoch": 92, "train_loss": 1.655436181564331, "train_acc": 0.53562, "test_loss": 6.41819879989624, "test_acc": 0.1099, "lyapunov": null, "grad_norm": 0.6422800867205569, "grad_max_sv": 0.22188753299415112, "grad_min_sv": 1.1910704758588687e-08, "grad_condition": 31454971.248209517, "lr": 0.00032571397633909225, "time_sec": 49.62359666824341 }, { "epoch": 93, "train_loss": 1.6418727423477173, "train_acc": 0.53886, "test_loss": 6.5647822364807125, "test_acc": 0.1078, "lyapunov": null, "grad_norm": 0.6425002000385331, "grad_max_sv": 0.22996555864810944, "grad_min_sv": 1.214085261491693e-08, "grad_condition": 23136414.278494585, "lr": 0.00031593772365766094, "time_sec": 49.648432970047 }, { "epoch": 94, "train_loss": 1.6380917670822144, "train_acc": 0.54016, "test_loss": 6.60304995880127, "test_acc": 0.1013, "lyapunov": null, "grad_norm": 0.6435715746993702, "grad_max_sv": 0.22394425868988038, "grad_min_sv": 1.1969105850884176e-08, "grad_condition": 22813937.74993243, "lr": 0.0003062422067739483, "time_sec": 49.62917709350586 }, { "epoch": 95, "train_loss": 1.6159375607681274, "train_acc": 0.54468, "test_loss": 7.4295039352417, "test_acc": 0.1043, "lyapunov": null, "grad_norm": 0.6459265748151144, "grad_max_sv": 0.2222417715936899, "grad_min_sv": 1.2084532810541226e-08, "grad_condition": 23228929.65699155, "lr": 0.00029663167846209965, "time_sec": 49.633803606033325 }, { "epoch": 96, "train_loss": 1.6130770600128175, "train_acc": 0.54918, "test_loss": 7.755695833587646, "test_acc": 0.103, "lyapunov": null, "grad_norm": 0.6373845581356181, "grad_max_sv": 0.2166528631001711, "grad_min_sv": 1.1723080543812881e-08, "grad_condition": 61573060.408652686, "lr": 0.00028711035421746345, "time_sec": 49.63398790359497 }, { "epoch": 97, "train_loss": 1.5942238623046876, "train_acc": 0.55338, "test_loss": 7.366734781646729, "test_acc": 0.0942, "lyapunov": null, "grad_norm": 0.645954709653033, "grad_max_sv": 0.23344604782760142, "grad_min_sv": 1.211216281021832e-08, "grad_condition": 28920253.40686954, "lr": 0.00027768241040753615, "time_sec": 49.63687562942505 }, { "epoch": 98, "train_loss": 1.5829193838119506, "train_acc": 0.55468, "test_loss": 7.60546820526123, "test_acc": 0.0996, "lyapunov": null, "grad_norm": 0.6414940955031293, "grad_max_sv": 0.22326541543006898, "grad_min_sv": 1.18154431003048e-08, "grad_condition": 27850671.690087616, "lr": 0.00026835198244006903, "time_sec": 49.60518288612366 }, { "epoch": 99, "train_loss": 1.5702915887451172, "train_acc": 0.55388, "test_loss": 7.25171710357666, "test_acc": 0.0857, "lyapunov": null, "grad_norm": 0.6448707164382114, "grad_max_sv": 0.22703963220119477, "grad_min_sv": 1.2078747084476315e-08, "grad_condition": 30695848.89590156, "lr": 0.0002591231629491421, "time_sec": 49.6348443031311 }, { "epoch": 100, "train_loss": 1.563120531387329, "train_acc": 0.5575, "test_loss": 7.321073220062256, "test_acc": 0.0975, "lyapunov": null, "grad_norm": 0.6501432324709732, "grad_max_sv": 0.22466112971305846, "grad_min_sv": 1.1973627836447952e-08, "grad_condition": 23144250.2743996, "lr": 0.0002499999999999997, "time_sec": 49.639625549316406 }, { "epoch": 101, "train_loss": 1.5544149493026733, "train_acc": 0.562, "test_loss": 8.2606175201416, "test_acc": 0.0986, "lyapunov": null, "grad_norm": 0.6383634384668164, "grad_max_sv": 0.22597188949584962, "grad_min_sv": 1.1897128555232727e-08, "grad_condition": 42860913.99555977, "lr": 0.00024098649531343477, "time_sec": 49.64992117881775 }, { "epoch": 102, "train_loss": 1.547795528869629, "train_acc": 0.5621, "test_loss": 7.994213732910156, "test_acc": 0.1009, "lyapunov": null, "grad_norm": 0.6440457566084322, "grad_max_sv": 0.22605536915361882, "grad_min_sv": 1.21044593875963e-08, "grad_condition": 23222249.12666279, "lr": 0.0002320866025105016, "time_sec": 49.638099670410156 }, { "epoch": 103, "train_loss": 1.5383813903045653, "train_acc": 0.56598, "test_loss": 8.507730350494384, "test_acc": 0.0971, "lyapunov": null, "grad_norm": 0.6412277700079685, "grad_max_sv": 0.2286630392074585, "grad_min_sv": 1.1935943896451695e-08, "grad_condition": 61496117.17851217, "lr": 0.0002233042253783278, "time_sec": 49.624167919158936 }, { "epoch": 104, "train_loss": 1.5296855780792236, "train_acc": 0.56802, "test_loss": 7.766149099731446, "test_acc": 0.1005, "lyapunov": null, "grad_norm": 0.6402323929530521, "grad_max_sv": 0.2234394859522581, "grad_min_sv": 1.1708301472790339e-08, "grad_condition": 51957414.29232074, "lr": 0.000214643216157784, "time_sec": 49.62683367729187 }, { "epoch": 105, "train_loss": 1.515010786781311, "train_acc": 0.5704, "test_loss": 7.568338539123535, "test_acc": 0.1172, "lyapunov": null, "grad_norm": 0.6478082803296404, "grad_max_sv": 0.23342282325029373, "grad_min_sv": 1.216084826727304e-08, "grad_condition": 26048714.73020513, "lr": 0.00020610737385376332, "time_sec": 49.63592481613159 }, { "epoch": 106, "train_loss": 1.512930496749878, "train_acc": 0.56978, "test_loss": 7.760108979797363, "test_acc": 0.1047, "lyapunov": null, "grad_norm": 0.6453652740846443, "grad_max_sv": 0.22414597682654858, "grad_min_sv": 1.1973005337173603e-08, "grad_condition": 26272467.73653502, "lr": 0.00019770044256881242, "time_sec": 49.61698055267334 }, { "epoch": 107, "train_loss": 1.4956118043899536, "train_acc": 0.57444, "test_loss": 8.33652488708496, "test_acc": 0.1011, "lyapunov": null, "grad_norm": 0.6438260578925417, "grad_max_sv": 0.2238406077027321, "grad_min_sv": 1.1764498750177488e-08, "grad_condition": 28981818.37375744, "lr": 0.0001894261098608447, "time_sec": 49.63762021064758 }, { "epoch": 108, "train_loss": 1.491361379776001, "train_acc": 0.57876, "test_loss": 8.52306475906372, "test_acc": 0.1029, "lyapunov": null, "grad_norm": 0.6413105894442734, "grad_max_sv": 0.22412343323230743, "grad_min_sv": 1.2146300558402157e-08, "grad_condition": 34732320.931619205, "lr": 0.000181288005125655, "time_sec": 49.6246235370636 }, { "epoch": 109, "train_loss": 1.4785979221343994, "train_acc": 0.5778, "test_loss": 7.686713803100586, "test_acc": 0.0994, "lyapunov": null, "grad_norm": 0.6419467845001164, "grad_max_sv": 0.22575648352503777, "grad_min_sv": 1.1847785963414737e-08, "grad_condition": 32480603.86279717, "lr": 0.0001732896980049473, "time_sec": 49.628063678741455 }, { "epoch": 110, "train_loss": 1.4723126147842407, "train_acc": 0.57888, "test_loss": 8.482755671691894, "test_acc": 0.1053, "lyapunov": null, "grad_norm": 0.6427405399098718, "grad_max_sv": 0.2258045580238104, "grad_min_sv": 1.177179903347203e-08, "grad_condition": 55737890.93326217, "lr": 0.00016543469682057076, "time_sec": 49.82239508628845 }, { "epoch": 111, "train_loss": 1.4714193873977661, "train_acc": 0.5821, "test_loss": 8.059153175354004, "test_acc": 0.1095, "lyapunov": null, "grad_norm": 0.643358384906005, "grad_max_sv": 0.2271666146814823, "grad_min_sv": 1.1828724497814358e-08, "grad_condition": 53541240.65537085, "lr": 0.00015772644703565552, "time_sec": 49.64692163467407 }, { "epoch": 112, "train_loss": 1.4565179361724854, "train_acc": 0.58618, "test_loss": 8.070704318237304, "test_acc": 0.0989, "lyapunov": null, "grad_norm": 0.6414562113271406, "grad_max_sv": 0.22715382017195224, "grad_min_sv": 1.2078682694316445e-08, "grad_condition": 27450211.87146064, "lr": 0.00015016832974331713, "time_sec": 49.634828329086304 }, { "epoch": 113, "train_loss": 1.445754097442627, "train_acc": 0.58848, "test_loss": 8.390233863830566, "test_acc": 0.1078, "lyapunov": null, "grad_norm": 0.6411801061752302, "grad_max_sv": 0.2343009330332279, "grad_min_sv": 1.2054243894374373e-08, "grad_condition": 73622071.21411385, "lr": 0.00014276366018359834, "time_sec": 49.62168598175049 }, { "epoch": 114, "train_loss": 1.4396562029647828, "train_acc": 0.59112, "test_loss": 7.990397840881347, "test_acc": 0.1207, "lyapunov": null, "grad_norm": 0.6446675700592518, "grad_max_sv": 0.22858907766640185, "grad_min_sv": 1.2150255043752444e-08, "grad_condition": 23031763.367673956, "lr": 0.00013551568628929425, "time_sec": 49.621737480163574 }, { "epoch": 115, "train_loss": 1.4295790006256104, "train_acc": 0.5919, "test_loss": 7.907929286956787, "test_acc": 0.1088, "lyapunov": null, "grad_norm": 0.6414787996170513, "grad_max_sv": 0.22259003035724162, "grad_min_sv": 1.1937235663839196e-08, "grad_condition": 26925988.130458646, "lr": 0.00012842758726130276, "time_sec": 49.702799558639526 }, { "epoch": 116, "train_loss": 1.419941686477661, "train_acc": 0.59402, "test_loss": 7.794718334197998, "test_acc": 0.118, "lyapunov": null, "grad_norm": 0.6403562503796186, "grad_max_sv": 0.23044625744223596, "grad_min_sv": 1.1990111638271461e-08, "grad_condition": 86324103.75912428, "lr": 0.0001215024721741218, "time_sec": 49.6519889831543 }, { "epoch": 117, "train_loss": 1.4125151259613038, "train_acc": 0.59724, "test_loss": 8.082193556976318, "test_acc": 0.1093, "lyapunov": null, "grad_norm": 0.6390276536629967, "grad_max_sv": 0.22913259454071522, "grad_min_sv": 1.1846856870501021e-08, "grad_condition": 38051050.155520104, "lr": 0.00011474337861210538, "time_sec": 49.67843008041382 }, { "epoch": 118, "train_loss": 1.4061624579238892, "train_acc": 0.59848, "test_loss": 7.994955434417725, "test_acc": 0.1217, "lyapunov": null, "grad_norm": 0.6431427525608711, "grad_max_sv": 0.22681293152272702, "grad_min_sv": 1.2012494199353796e-08, "grad_condition": 22440692.932778567, "lr": 0.00010815327133708009, "time_sec": 49.65889072418213 }, { "epoch": 119, "train_loss": 1.4033130680847168, "train_acc": 0.59806, "test_loss": 7.7351758087158204, "test_acc": 0.1159, "lyapunov": null, "grad_norm": 0.6393512801434791, "grad_max_sv": 0.22470695674419403, "grad_min_sv": 1.173807711446484e-08, "grad_condition": 33523113.628067147, "lr": 0.00010173504098790182, "time_sec": 49.65284276008606 }, { "epoch": 120, "train_loss": 1.3988560864257813, "train_acc": 0.59928, "test_loss": 8.596598931121827, "test_acc": 0.104, "lyapunov": null, "grad_norm": 0.6430512338238313, "grad_max_sv": 0.23124604262411594, "grad_min_sv": 1.2035057309067731e-08, "grad_condition": 27263284.07382477, "lr": 9.549150281252629e-05, "time_sec": 49.64090633392334 }, { "epoch": 121, "train_loss": 1.3857270031356812, "train_acc": 0.60484, "test_loss": 7.9892033752441405, "test_acc": 0.1183, "lyapunov": null, "grad_norm": 0.6395461283787793, "grad_max_sv": 0.22570451460778712, "grad_min_sv": 1.2030840006518884e-08, "grad_condition": 53181043.26539834, "lr": 8.942539543314794e-05, "time_sec": 49.60771918296814 }, { "epoch": 122, "train_loss": 1.3880330154037475, "train_acc": 0.60376, "test_loss": 8.22642307357788, "test_acc": 0.115, "lyapunov": null, "grad_norm": 0.6427946655580464, "grad_max_sv": 0.22782764062285424, "grad_min_sv": 1.1785313203116487e-08, "grad_condition": 24787267.408791415, "lr": 8.353937964495024e-05, "time_sec": 49.64048886299133 }, { "epoch": 123, "train_loss": 1.377012547569275, "train_acc": 0.60464, "test_loss": 7.7657553009033204, "test_acc": 0.114, "lyapunov": null, "grad_norm": 0.6396634441881897, "grad_max_sv": 0.23086622469127177, "grad_min_sv": 1.198922548739656e-08, "grad_condition": 23123320.372294467, "lr": 7.783603724899243e-05, "time_sec": 49.63312888145447 }, { "epoch": 124, "train_loss": 1.376011091003418, "train_acc": 0.60928, "test_loss": 7.944722248840332, "test_acc": 0.1039, "lyapunov": null, "grad_norm": 0.6321494808563242, "grad_max_sv": 0.22378434427082539, "grad_min_sv": 1.1604401764855887e-08, "grad_condition": 58244211.34800786, "lr": 7.231786991974666e-05, "time_sec": 49.64424800872803 }, { "epoch": 125, "train_loss": 1.368886891708374, "train_acc": 0.60824, "test_loss": 8.258360435485839, "test_acc": 0.1147, "lyapunov": null, "grad_norm": 0.6400148651728099, "grad_max_sv": 0.22423702478408813, "grad_min_sv": 1.175346897655527e-08, "grad_condition": 47951723.35743973, "lr": 6.698729810778072e-05, "time_sec": 49.635197162628174 }, { "epoch": 126, "train_loss": 1.368887268447876, "train_acc": 0.60784, "test_loss": 8.00912710647583, "test_acc": 0.1098, "lyapunov": null, "grad_norm": 0.6414620945866057, "grad_max_sv": 0.22984928116202355, "grad_min_sv": 1.1862470802870284e-08, "grad_condition": 27488218.9085432, "lr": 6.184665997806817e-05, "time_sec": 49.63115334510803 }, { "epoch": 127, "train_loss": 1.3691972059631348, "train_acc": 0.60894, "test_loss": 8.099956825256347, "test_acc": 0.1137, "lyapunov": null, "grad_norm": 0.6379342286587659, "grad_max_sv": 0.22721209563314915, "grad_min_sv": 1.1842124452571268e-08, "grad_condition": 66054597.76675473, "lr": 5.6898210384392595e-05, "time_sec": 49.64264273643494 }, { "epoch": 128, "train_loss": 1.3585320538711547, "train_acc": 0.61176, "test_loss": 8.168904312896728, "test_acc": 0.1178, "lyapunov": null, "grad_norm": 0.6384779111033096, "grad_max_sv": 0.2258748199790716, "grad_min_sv": 1.1702591148909925e-08, "grad_condition": 121211424.44652918, "lr": 5.214411988029363e-05, "time_sec": 49.62958645820618 }, { "epoch": 129, "train_loss": 1.3585711254501343, "train_acc": 0.6101, "test_loss": 7.90961298828125, "test_acc": 0.1095, "lyapunov": null, "grad_norm": 0.6412738082737135, "grad_max_sv": 0.22799600511789322, "grad_min_sv": 1.2047476663501478e-08, "grad_condition": 44984170.42448841, "lr": 4.7586473766990294e-05, "time_sec": 49.62019920349121 }, { "epoch": 130, "train_loss": 1.3606473222351074, "train_acc": 0.60866, "test_loss": 7.8885728500366215, "test_acc": 0.1165, "lyapunov": null, "grad_norm": 0.6429377341506345, "grad_max_sv": 0.22763566635549068, "grad_min_sv": 1.1949406383826578e-08, "grad_condition": 23238593.216242827, "lr": 4.32272711786996e-05, "time_sec": 49.60610270500183 }, { "epoch": 131, "train_loss": 1.340769683189392, "train_acc": 0.61422, "test_loss": 7.97282382888794, "test_acc": 0.1176, "lyapunov": null, "grad_norm": 0.6365898965081005, "grad_max_sv": 0.22698684968054295, "grad_min_sv": 1.1841301903944835e-08, "grad_condition": 57050057.91630666, "lr": 3.906842420574966e-05, "time_sec": 49.639729738235474 }, { "epoch": 132, "train_loss": 1.3506625385284423, "train_acc": 0.61254, "test_loss": 8.237340574645996, "test_acc": 0.1112, "lyapunov": null, "grad_norm": 0.6405822016126281, "grad_max_sv": 0.2313113920390606, "grad_min_sv": 1.1943680751358432e-08, "grad_condition": 32855860.000038534, "lr": 3.5111757055874305e-05, "time_sec": 49.62140464782715 }, { "epoch": 133, "train_loss": 1.3537355774307251, "train_acc": 0.60946, "test_loss": 8.220967332458496, "test_acc": 0.1107, "lyapunov": null, "grad_norm": 0.6424071935223469, "grad_max_sv": 0.2330889504402876, "grad_min_sv": 1.1997084857148787e-08, "grad_condition": 44613447.03937371, "lr": 3.1359005254054254e-05, "time_sec": 49.62578868865967 }, { "epoch": 134, "train_loss": 1.33552843044281, "train_acc": 0.61362, "test_loss": 8.059291929626465, "test_acc": 0.1019, "lyapunov": null, "grad_norm": 0.6408761914883747, "grad_max_sv": 0.2316820841282606, "grad_min_sv": 1.1778968132813982e-08, "grad_condition": 105523171.68805893, "lr": 2.7811814881259484e-05, "time_sec": 49.62417006492615 }, { "epoch": 135, "train_loss": 1.3386833112335206, "train_acc": 0.61374, "test_loss": 7.973577444458008, "test_acc": 0.1097, "lyapunov": null, "grad_norm": 0.6388300432658766, "grad_max_sv": 0.22841673195362092, "grad_min_sv": 1.1936609616361448e-08, "grad_condition": 69324765.09964362, "lr": 2.4471741852423218e-05, "time_sec": 49.65416145324707 }, { "epoch": 136, "train_loss": 1.3311992990112305, "train_acc": 0.618, "test_loss": 8.200102568817139, "test_acc": 0.1214, "lyapunov": null, "grad_norm": 0.638950694855791, "grad_max_sv": 0.2365179505199194, "grad_min_sv": 1.1939427453644402e-08, "grad_condition": 27475716.41514334, "lr": 2.1340251233966362e-05, "time_sec": 49.64095640182495 }, { "epoch": 137, "train_loss": 1.3340746058273316, "train_acc": 0.61812, "test_loss": 7.946666102600098, "test_acc": 0.1106, "lyapunov": null, "grad_norm": 0.6352812169452327, "grad_max_sv": 0.22020692974328995, "grad_min_sv": 1.1623311241271139e-08, "grad_condition": 29930613.060724013, "lr": 1.8418716601170932e-05, "time_sec": 49.633143186569214 }, { "epoch": 138, "train_loss": 1.336420276031494, "train_acc": 0.61512, "test_loss": 8.25653330230713, "test_acc": 0.112, "lyapunov": null, "grad_norm": 0.6397251204580275, "grad_max_sv": 0.23347726799547672, "grad_min_sv": 1.1918404803357152e-08, "grad_condition": 81456104.36957063, "lr": 1.570841943568445e-05, "time_sec": 49.639748334884644 }, { "epoch": 139, "train_loss": 1.3220760538482665, "train_acc": 0.61838, "test_loss": 8.026485778808594, "test_acc": 0.1138, "lyapunov": null, "grad_norm": 0.6398193491025633, "grad_max_sv": 0.2238193929195404, "grad_min_sv": 1.1681687835801702e-08, "grad_condition": 38144371.645152286, "lr": 1.3210548563419845e-05, "time_sec": 49.63212180137634 }, { "epoch": 140, "train_loss": 1.3198553924942016, "train_acc": 0.61854, "test_loss": 8.029016185760499, "test_acc": 0.1179, "lyapunov": null, "grad_norm": 0.639466602267434, "grad_max_sv": 0.22324420213699342, "grad_min_sv": 1.1702349164699477e-08, "grad_condition": 28474783.149248235, "lr": 1.0926199633097203e-05, "time_sec": 49.65198302268982 }, { "epoch": 141, "train_loss": 1.3253049739837646, "train_acc": 0.62014, "test_loss": 8.258732906341553, "test_acc": 0.1086, "lyapunov": null, "grad_norm": 0.6377969869493302, "grad_max_sv": 0.23066396303474904, "grad_min_sv": 1.1955105984340354e-08, "grad_condition": 28290681.03527581, "lr": 8.856374635655688e-06, "time_sec": 49.712565183639526 }, { "epoch": 142, "train_loss": 1.3294593518066407, "train_acc": 0.6165, "test_loss": 8.097643237304688, "test_acc": 0.1079, "lyapunov": null, "grad_norm": 0.6416721044495594, "grad_max_sv": 0.22946001626551152, "grad_min_sv": 1.1918349693273988e-08, "grad_condition": 33830275.99348913, "lr": 7.001981464747503e-06, "time_sec": 49.62647032737732 }, { "epoch": 143, "train_loss": 1.3246013949203492, "train_acc": 0.619, "test_loss": 8.003326276397704, "test_acc": 0.1093, "lyapunov": null, "grad_norm": 0.6406658358506779, "grad_max_sv": 0.22979442439973355, "grad_min_sv": 1.1885957310075503e-08, "grad_condition": 1265929967.3983974, "lr": 5.3638335185058295e-06, "time_sec": 49.64323043823242 }, { "epoch": 144, "train_loss": 1.3237170028686522, "train_acc": 0.61912, "test_loss": 8.245773946380615, "test_acc": 0.1116, "lyapunov": null, "grad_norm": 0.640154182788332, "grad_max_sv": 0.22960694395005704, "grad_min_sv": 1.1789325913159205e-08, "grad_condition": 220785020.05461937, "lr": 3.942649342761114e-06, "time_sec": 49.62677884101868 }, { "epoch": 145, "train_loss": 1.323034522781372, "train_acc": 0.61748, "test_loss": 8.367132460784912, "test_acc": 0.1101, "lyapunov": null, "grad_norm": 0.6399875505077857, "grad_max_sv": 0.2292648758739233, "grad_min_sv": 1.1756407276852787e-08, "grad_condition": 46749240.33218758, "lr": 2.7390523158633524e-06, "time_sec": 49.61358666419983 }, { "epoch": 146, "train_loss": 1.3221456618118286, "train_acc": 0.61958, "test_loss": 8.256616510772705, "test_acc": 0.1088, "lyapunov": null, "grad_norm": 0.6401843350865242, "grad_max_sv": 0.23075628280639648, "grad_min_sv": 1.1929567545268527e-08, "grad_condition": 56821403.658394314, "lr": 1.7535703752478133e-06, "time_sec": 49.62871527671814 }, { "epoch": 147, "train_loss": 1.32188304227829, "train_acc": 0.62262, "test_loss": 7.983602857208252, "test_acc": 0.115, "lyapunov": null, "grad_norm": 0.6377455957871468, "grad_max_sv": 0.2265624139457941, "grad_min_sv": 1.1661963828825395e-08, "grad_condition": 178436067.44761798, "lr": 9.866357858642196e-07, "time_sec": 49.63710594177246 }, { "epoch": 148, "train_loss": 1.3234341220855712, "train_acc": 0.61708, "test_loss": 8.329111752319337, "test_acc": 0.1046, "lyapunov": null, "grad_norm": 0.6428801038701755, "grad_max_sv": 0.2313603863120079, "grad_min_sv": 1.1845945344264585e-08, "grad_condition": 144408842.21709472, "lr": 4.38584950570808e-07, "time_sec": 49.63905072212219 }, { "epoch": 149, "train_loss": 1.3202154207611083, "train_acc": 0.61986, "test_loss": 8.021684009552002, "test_acc": 0.1127, "lyapunov": null, "grad_norm": 0.6406912156142667, "grad_max_sv": 0.2288107428699732, "grad_min_sv": 1.181119294590971e-08, "grad_condition": 65688308.80478315, "lr": 1.096582625772501e-07, "time_sec": 49.61029553413391 }, { "epoch": 150, "train_loss": 1.3158636585235595, "train_acc": 0.62006, "test_loss": 8.094485763549805, "test_acc": 0.1123, "lyapunov": null, "grad_norm": 0.6406489877650078, "grad_max_sv": 0.23017469234764576, "grad_min_sv": 1.1906818318807578e-08, "grad_condition": 37789807.4961655, "lr": 0.0, "time_sec": 49.65584897994995 } ], "16": [ { "epoch": 1, "train_loss": 5.089254416656495, "train_acc": 0.01344, "test_loss": 4.870831555175781, "test_acc": 0.01, "lyapunov": null, "grad_norm": 5.582063459208639, "grad_max_sv": 5.0306542873382565, "grad_min_sv": 8.441757832766683e-08, "grad_condition": 74707534.78681344, "lr": 0.0009998903417374227, "time_sec": 66.70097637176514 }, { "epoch": 2, "train_loss": 4.736304296569824, "train_acc": 0.02172, "test_loss": 4.92340059890747, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.087296772772229, "grad_max_sv": 3.672157108783722, "grad_min_sv": 6.109624839933935e-08, "grad_condition": 230714811.36310124, "lr": 0.0009995614150494292, "time_sec": 66.83215641975403 }, { "epoch": 3, "train_loss": 4.52685978515625, "train_acc": 0.03204, "test_loss": 5.045831031799317, "test_acc": 0.0094, "lyapunov": null, "grad_norm": 3.1470044543912175, "grad_max_sv": 2.6447540044784548, "grad_min_sv": 4.639755384339139e-08, "grad_condition": 65625701.84585605, "lr": 0.0009990133642141358, "time_sec": 66.70765495300293 }, { "epoch": 4, "train_loss": 4.371717319641113, "train_acc": 0.04112, "test_loss": 4.993129699707032, "test_acc": 0.0115, "lyapunov": null, "grad_norm": 2.5123688948843395, "grad_max_sv": 2.1027904629707335, "grad_min_sv": 3.615837387664633e-08, "grad_condition": 418817692.03399765, "lr": 0.0009982464296247522, "time_sec": 66.70319509506226 }, { "epoch": 5, "train_loss": 4.27407361251831, "train_acc": 0.0488, "test_loss": 5.161634465789795, "test_acc": 0.0119, "lyapunov": null, "grad_norm": 1.9573801826064445, "grad_max_sv": 1.613087645173073, "grad_min_sv": 2.8529539808364034e-08, "grad_condition": 62747668.20627429, "lr": 0.0009972609476841367, "time_sec": 66.74726390838623 }, { "epoch": 6, "train_loss": 4.183251854553222, "train_acc": 0.05812, "test_loss": 5.447854755401611, "test_acc": 0.0093, "lyapunov": null, "grad_norm": 1.436449079599314, "grad_max_sv": 1.0459295481443405, "grad_min_sv": 2.0654144772258576e-08, "grad_condition": 94732574.16372415, "lr": 0.000996057350657239, "time_sec": 66.68073081970215 }, { "epoch": 7, "train_loss": 4.103355536193848, "train_acc": 0.06872, "test_loss": 5.544150679016114, "test_acc": 0.0124, "lyapunov": null, "grad_norm": 1.082624040556548, "grad_max_sv": 0.678101472556591, "grad_min_sv": 1.6660088839048904e-08, "grad_condition": 49338508.46283151, "lr": 0.000994636166481494, "time_sec": 66.77410340309143 }, { "epoch": 8, "train_loss": 4.040529095458984, "train_acc": 0.07876, "test_loss": 5.577163777160645, "test_acc": 0.0172, "lyapunov": null, "grad_norm": 0.963869121683512, "grad_max_sv": 0.5578698106110096, "grad_min_sv": 1.4817374840991882e-08, "grad_condition": 46172185.25999212, "lr": 0.0009929980185352525, "time_sec": 66.7442455291748 }, { "epoch": 9, "train_loss": 3.999490645446777, "train_acc": 0.0856, "test_loss": 5.472281336975097, "test_acc": 0.0116, "lyapunov": null, "grad_norm": 0.9198022107734598, "grad_max_sv": 0.5003849364817142, "grad_min_sv": 1.3862486752946878e-08, "grad_condition": 137028895.09887612, "lr": 0.0009911436253643444, "time_sec": 66.71199488639832 }, { "epoch": 10, "train_loss": 3.9641557629394533, "train_acc": 0.09124, "test_loss": 5.43024553604126, "test_acc": 0.0112, "lyapunov": null, "grad_norm": 0.8539816540258655, "grad_max_sv": 0.4397390566766262, "grad_min_sv": 1.3177782898221579e-08, "grad_condition": 50953468.3517745, "lr": 0.0009890738003669028, "time_sec": 66.71694684028625 }, { "epoch": 11, "train_loss": 3.9142907052612306, "train_acc": 0.09788, "test_loss": 5.24972756652832, "test_acc": 0.0174, "lyapunov": null, "grad_norm": 0.8303589651826888, "grad_max_sv": 0.4246540553867817, "grad_min_sv": 1.288730961390705e-08, "grad_condition": 88294678.08247125, "lr": 0.00098678945143658, "time_sec": 66.70689487457275 }, { "epoch": 12, "train_loss": 3.881778168411255, "train_acc": 0.1037, "test_loss": 5.765969756317139, "test_acc": 0.0186, "lyapunov": null, "grad_norm": 0.7855031029198277, "grad_max_sv": 0.3756070680916309, "grad_min_sv": 1.2611303298881715e-08, "grad_condition": 36786532.210794725, "lr": 0.0009842915805643154, "time_sec": 66.73540306091309 }, { "epoch": 13, "train_loss": 3.8490214154815674, "train_acc": 0.1068, "test_loss": 5.832162282562256, "test_acc": 0.0138, "lyapunov": null, "grad_norm": 0.7681061932199776, "grad_max_sv": 0.3604050487279892, "grad_min_sv": 1.2243067453593382e-08, "grad_condition": 131143000.26933214, "lr": 0.000981581283398829, "time_sec": 66.73431468009949 }, { "epoch": 14, "train_loss": 3.828877674636841, "train_acc": 0.11234, "test_loss": 6.293205305480957, "test_acc": 0.0134, "lyapunov": null, "grad_norm": 0.7460407539013362, "grad_max_sv": 0.34510768875479697, "grad_min_sv": 1.1813573212726692e-08, "grad_condition": 49629148.15911349, "lr": 0.0009786597487660333, "time_sec": 66.77479386329651 }, { "epoch": 15, "train_loss": 3.803487832107544, "train_acc": 0.1159, "test_loss": 6.4087516273498535, "test_acc": 0.013, "lyapunov": null, "grad_norm": 0.716379034773642, "grad_max_sv": 0.3261814657598734, "grad_min_sv": 1.1572917107960378e-08, "grad_condition": 31644703.4401185, "lr": 0.0009755282581475766, "time_sec": 66.73083448410034 }, { "epoch": 16, "train_loss": 3.7821172668457033, "train_acc": 0.11904, "test_loss": 6.406122239685058, "test_acc": 0.0123, "lyapunov": null, "grad_norm": 0.697749546532161, "grad_max_sv": 0.31582852490246294, "grad_min_sv": 1.1393312793206434e-08, "grad_condition": 39132519.74005551, "lr": 0.0009721881851187403, "time_sec": 66.74327826499939 }, { "epoch": 17, "train_loss": 3.7480180199432374, "train_acc": 0.12526, "test_loss": 6.8633532814025875, "test_acc": 0.0132, "lyapunov": null, "grad_norm": 0.6758633251362415, "grad_max_sv": 0.2994280070066452, "grad_min_sv": 1.1069095015581176e-08, "grad_condition": 36563832.03358241, "lr": 0.0009686409947459456, "time_sec": 66.76521873474121 }, { "epoch": 18, "train_loss": 3.730831000213623, "train_acc": 0.12792, "test_loss": 6.246407075500488, "test_acc": 0.0177, "lyapunov": null, "grad_norm": 0.664831990265232, "grad_max_sv": 0.2994547080248594, "grad_min_sv": 1.0997234457625626e-08, "grad_condition": 122736750.78260681, "lr": 0.0009648882429441254, "time_sec": 66.71729445457458 }, { "epoch": 19, "train_loss": 3.716553072052002, "train_acc": 0.12942, "test_loss": 5.873876965332031, "test_acc": 0.0149, "lyapunov": null, "grad_norm": 0.6518241757841252, "grad_max_sv": 0.29539270177483556, "grad_min_sv": 1.0741561572852331e-08, "grad_condition": 49669322.25294405, "lr": 0.00096093157579425, "time_sec": 66.81875944137573 }, { "epoch": 20, "train_loss": 3.6975706172180174, "train_acc": 0.13298, "test_loss": 6.400744886779785, "test_acc": 0.0155, "lyapunov": null, "grad_norm": 0.6347864002121714, "grad_max_sv": 0.28284979946911337, "grad_min_sv": 1.0701284272607303e-08, "grad_condition": 30013146.4819826, "lr": 0.0009567727288213001, "time_sec": 66.8477098941803 }, { "epoch": 21, "train_loss": 3.673498316040039, "train_acc": 0.13564, "test_loss": 6.160238801574707, "test_acc": 0.0204, "lyapunov": null, "grad_norm": 0.6252581472584972, "grad_max_sv": 0.27260397262871267, "grad_min_sv": 1.0594542484282377e-08, "grad_condition": 46350413.24314589, "lr": 0.0009524135262330095, "time_sec": 66.72814178466797 }, { "epoch": 22, "train_loss": 3.654527678833008, "train_acc": 0.1393, "test_loss": 6.9474281982421875, "test_acc": 0.0176, "lyapunov": null, "grad_norm": 0.6149063083720292, "grad_max_sv": 0.26224171184003353, "grad_min_sv": 1.035294387718988e-08, "grad_condition": 32282705.350815333, "lr": 0.0009478558801197061, "time_sec": 66.82811260223389 }, { "epoch": 23, "train_loss": 3.6450364729309084, "train_acc": 0.14028, "test_loss": 7.2393467880249025, "test_acc": 0.0127, "lyapunov": null, "grad_norm": 0.6067467053692205, "grad_max_sv": 0.26614573895931243, "grad_min_sv": 1.0267544686692886e-08, "grad_condition": 28213061.075003404, "lr": 0.000943101789615607, "time_sec": 66.74721336364746 }, { "epoch": 24, "train_loss": 3.623104200592041, "train_acc": 0.14594, "test_loss": 6.526107063293457, "test_acc": 0.0187, "lyapunov": null, "grad_norm": 0.5980858749774747, "grad_max_sv": 0.25203392654657364, "grad_min_sv": 1.0098680717357534e-08, "grad_condition": 50563247.00258337, "lr": 0.0009381533400219313, "time_sec": 66.77076554298401 }, { "epoch": 25, "train_loss": 3.6136645338439943, "train_acc": 0.14728, "test_loss": 7.030907647705078, "test_acc": 0.0182, "lyapunov": null, "grad_norm": 0.594016587561951, "grad_max_sv": 0.25378315448760985, "grad_min_sv": 9.976338428627219e-09, "grad_condition": 72065195.62747766, "lr": 0.0009330127018922189, "time_sec": 66.78083634376526 }, { "epoch": 26, "train_loss": 3.5951533477020265, "train_acc": 0.15, "test_loss": 6.8098891067504885, "test_acc": 0.0193, "lyapunov": null, "grad_norm": 0.5888833643522708, "grad_max_sv": 0.24365438856184482, "grad_min_sv": 9.933017187935267e-09, "grad_condition": 44149369.91233202, "lr": 0.000927682130080253, "time_sec": 66.72774887084961 }, { "epoch": 27, "train_loss": 3.5870719739532473, "train_acc": 0.15012, "test_loss": 6.188968405151368, "test_acc": 0.0198, "lyapunov": null, "grad_norm": 0.5778870286561091, "grad_max_sv": 0.23904258161783218, "grad_min_sv": 9.864321945385335e-09, "grad_condition": 29413784.94482057, "lr": 0.0009221639627510072, "time_sec": 66.7466390132904 }, { "epoch": 28, "train_loss": 3.5677108099365236, "train_acc": 0.15438, "test_loss": 7.111977198028565, "test_acc": 0.0186, "lyapunov": null, "grad_norm": 0.565332521044754, "grad_max_sv": 0.22653766870498657, "grad_min_sv": 9.587734812674387e-09, "grad_condition": 61781100.03898337, "lr": 0.0009164606203550494, "time_sec": 66.74424004554749 }, { "epoch": 29, "train_loss": 3.5525446216583254, "train_acc": 0.1561, "test_loss": 6.844758932495117, "test_acc": 0.0209, "lyapunov": null, "grad_norm": 0.5709459777275144, "grad_max_sv": 0.22716681994497775, "grad_min_sv": 9.63618568827762e-09, "grad_condition": 26044218.51829529, "lr": 0.0009105746045668516, "time_sec": 66.73790216445923 }, { "epoch": 30, "train_loss": 3.5511199297332765, "train_acc": 0.15632, "test_loss": 6.829617092895508, "test_acc": 0.0179, "lyapunov": null, "grad_norm": 0.5599177583176913, "grad_max_sv": 0.22315906584262848, "grad_min_sv": 9.481845958392298e-09, "grad_condition": 31696446.039096247, "lr": 0.0009045084971874733, "time_sec": 66.74309277534485 }, { "epoch": 31, "train_loss": 3.5346223778533936, "train_acc": 0.15964, "test_loss": 7.171929656982422, "test_acc": 0.0181, "lyapunov": null, "grad_norm": 0.5560980115082016, "grad_max_sv": 0.22190811820328235, "grad_min_sv": 9.472099816998369e-09, "grad_condition": 65999783.19253375, "lr": 0.0008982649590120977, "time_sec": 66.72736811637878 }, { "epoch": 32, "train_loss": 3.523619603424072, "train_acc": 0.16298, "test_loss": 7.11264291381836, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.5484008571230936, "grad_max_sv": 0.21031202785670758, "grad_min_sv": 9.324677128358382e-09, "grad_condition": 59831756.702754, "lr": 0.0008918467286629196, "time_sec": 66.70681715011597 }, { "epoch": 33, "train_loss": 3.503953924026489, "train_acc": 0.1662, "test_loss": 6.848249008178711, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5416204323895276, "grad_max_sv": 0.2181798741221428, "grad_min_sv": 9.399793365156769e-09, "grad_condition": 389136802.1825175, "lr": 0.0008852566213878943, "time_sec": 66.73786091804504 }, { "epoch": 34, "train_loss": 3.505652629928589, "train_acc": 0.16502, "test_loss": 6.877189469909668, "test_acc": 0.02, "lyapunov": null, "grad_norm": 0.5355113980631458, "grad_max_sv": 0.20969012342393398, "grad_min_sv": 9.270577998321538e-09, "grad_condition": 31525454.84069126, "lr": 0.000878497527825878, "time_sec": 66.72686457633972 }, { "epoch": 35, "train_loss": 3.486978895339966, "train_acc": 0.16714, "test_loss": 7.1552359481811525, "test_acc": 0.0172, "lyapunov": null, "grad_norm": 0.5346080374847578, "grad_max_sv": 0.20298720821738242, "grad_min_sv": 9.306896420202548e-09, "grad_condition": 25441508.50613912, "lr": 0.000871572412738697, "time_sec": 66.75551271438599 }, { "epoch": 36, "train_loss": 3.479604592208862, "train_acc": 0.16902, "test_loss": 6.844674809265137, "test_acc": 0.0223, "lyapunov": null, "grad_norm": 0.5311517334543933, "grad_max_sv": 0.20205551721155643, "grad_min_sv": 9.200601613218452e-09, "grad_condition": 45450108.39040236, "lr": 0.0008644843137107055, "time_sec": 66.7082417011261 }, { "epoch": 37, "train_loss": 3.4750630870819093, "train_acc": 0.16898, "test_loss": 7.165343771362305, "test_acc": 0.0171, "lyapunov": null, "grad_norm": 0.5255800840531358, "grad_max_sv": 0.19590781554579734, "grad_min_sv": 9.155419039910683e-09, "grad_condition": 108339245.17679186, "lr": 0.0008572363398164014, "time_sec": 66.71217584609985 }, { "epoch": 38, "train_loss": 3.461921478424072, "train_acc": 0.17176, "test_loss": 7.6983903167724606, "test_acc": 0.0204, "lyapunov": null, "grad_norm": 0.5291599359124736, "grad_max_sv": 0.19806304536759853, "grad_min_sv": 9.252919158653227e-09, "grad_condition": 26129114.857841287, "lr": 0.0008498316702566826, "time_sec": 66.83607125282288 }, { "epoch": 39, "train_loss": 3.4502412219238283, "train_acc": 0.1729, "test_loss": 6.8047522277832035, "test_acc": 0.0213, "lyapunov": null, "grad_norm": 0.5281639901017625, "grad_max_sv": 0.20096433460712432, "grad_min_sv": 9.085016680621116e-09, "grad_condition": 33958186.51443162, "lr": 0.0008422735529643442, "time_sec": 66.73851490020752 }, { "epoch": 40, "train_loss": 3.4376924714660646, "train_acc": 0.17616, "test_loss": 7.263092966461182, "test_acc": 0.0182, "lyapunov": null, "grad_norm": 0.5216932066323713, "grad_max_sv": 0.19504240863025188, "grad_min_sv": 9.154586153026223e-09, "grad_condition": 25458573.387380652, "lr": 0.0008345653031794289, "time_sec": 66.7052755355835 }, { "epoch": 41, "train_loss": 3.4279933405303957, "train_acc": 0.17836, "test_loss": 6.396369320678711, "test_acc": 0.0195, "lyapunov": null, "grad_norm": 0.5194410647845549, "grad_max_sv": 0.19078941717743875, "grad_min_sv": 9.012956635884306e-09, "grad_condition": 42363604.716461524, "lr": 0.0008267103019950526, "time_sec": 66.72479486465454 }, { "epoch": 42, "train_loss": 3.4256856929016113, "train_acc": 0.17732, "test_loss": 6.679870991516113, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 0.5198265520764738, "grad_max_sv": 0.19169757179915906, "grad_min_sv": 9.036233127035497e-09, "grad_condition": 51260505.579239644, "lr": 0.0008187119948743447, "time_sec": 66.75225281715393 }, { "epoch": 43, "train_loss": 3.411117221832275, "train_acc": 0.18158, "test_loss": 7.357481904602051, "test_acc": 0.0185, "lyapunov": null, "grad_norm": 0.5156740849780826, "grad_max_sv": 0.19417562745511532, "grad_min_sv": 9.037307471815303e-09, "grad_condition": 35283510.30299447, "lr": 0.000810573890139155, "time_sec": 66.72709918022156 }, { "epoch": 44, "train_loss": 3.4085953338623045, "train_acc": 0.18096, "test_loss": 7.635249890899658, "test_acc": 0.0161, "lyapunov": null, "grad_norm": 0.5119612982206426, "grad_max_sv": 0.18738919235765933, "grad_min_sv": 8.878314214366689e-09, "grad_condition": 31365951.59678828, "lr": 0.0008022995574311873, "time_sec": 66.72823333740234 }, { "epoch": 45, "train_loss": 3.391282188873291, "train_acc": 0.18358, "test_loss": 7.057773623657226, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.512636753960722, "grad_max_sv": 0.18591308295726777, "grad_min_sv": 8.905265155845221e-09, "grad_condition": 34037092.10974729, "lr": 0.0007938926261462363, "time_sec": 66.75207853317261 }, { "epoch": 46, "train_loss": 3.385137359466553, "train_acc": 0.18694, "test_loss": 7.400888244628907, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 0.5082656505289807, "grad_max_sv": 0.18733446709811688, "grad_min_sv": 8.893193696474926e-09, "grad_condition": 125851280.80010274, "lr": 0.0007853567838422158, "time_sec": 66.7163679599762 }, { "epoch": 47, "train_loss": 3.376342626800537, "train_acc": 0.18838, "test_loss": 7.475112818908691, "test_acc": 0.0175, "lyapunov": null, "grad_norm": 0.5045706953392911, "grad_max_sv": 0.18063193671405314, "grad_min_sv": 8.950101182403359e-09, "grad_condition": 22625503.611506984, "lr": 0.0007766957746216719, "time_sec": 66.7100522518158 }, { "epoch": 48, "train_loss": 3.3649324946594237, "train_acc": 0.18694, "test_loss": 8.045938752746583, "test_acc": 0.0189, "lyapunov": null, "grad_norm": 0.5007866825544302, "grad_max_sv": 0.1830794021487236, "grad_min_sv": 8.805358707453248e-09, "grad_condition": 27558131.426934887, "lr": 0.0007679133974894982, "time_sec": 66.70468735694885 }, { "epoch": 49, "train_loss": 3.3610028453063965, "train_acc": 0.1888, "test_loss": 7.112044483947754, "test_acc": 0.0233, "lyapunov": null, "grad_norm": 0.5007184914478864, "grad_max_sv": 0.18336209803819656, "grad_min_sv": 9.024269038288013e-09, "grad_condition": 33518235.006607275, "lr": 0.000759013504686565, "time_sec": 66.7611026763916 }, { "epoch": 50, "train_loss": 3.3484571326446533, "train_acc": 0.1906, "test_loss": 7.519181715393066, "test_acc": 0.0209, "lyapunov": null, "grad_norm": 0.5018491559425493, "grad_max_sv": 0.18028105311095716, "grad_min_sv": 8.925991949043643e-09, "grad_condition": 33524852.83647134, "lr": 0.0007499999999999998, "time_sec": 66.76505136489868 }, { "epoch": 51, "train_loss": 3.3410891053009033, "train_acc": 0.1921, "test_loss": 7.056560147094727, "test_acc": 0.0249, "lyapunov": null, "grad_norm": 0.4996656726107064, "grad_max_sv": 0.17895969636738301, "grad_min_sv": 8.92833956489536e-09, "grad_condition": 30339744.194165338, "lr": 0.0007408768370508575, "time_sec": 66.76679730415344 }, { "epoch": 52, "train_loss": 3.329959710845947, "train_acc": 0.19464, "test_loss": 7.733986283874512, "test_acc": 0.02, "lyapunov": null, "grad_norm": 0.49662871046839857, "grad_max_sv": 0.17035150155425072, "grad_min_sv": 8.920055267341853e-09, "grad_condition": 39560292.40680326, "lr": 0.0007316480175599307, "time_sec": 66.73509478569031 }, { "epoch": 53, "train_loss": 3.328139169998169, "train_acc": 0.1964, "test_loss": 8.010476211547852, "test_acc": 0.0211, "lyapunov": null, "grad_norm": 0.4958475219811756, "grad_max_sv": 0.17490845173597336, "grad_min_sv": 8.784460091802727e-09, "grad_condition": 71860322.54887062, "lr": 0.0007223175895924635, "time_sec": 66.72841596603394 }, { "epoch": 54, "train_loss": 3.3162127281188964, "train_acc": 0.19728, "test_loss": 7.010640211486816, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.4961833449463003, "grad_max_sv": 0.17223588079214097, "grad_min_sv": 8.753281316442596e-09, "grad_condition": 22715187.33107339, "lr": 0.0007128896457825361, "time_sec": 66.72108912467957 }, { "epoch": 55, "train_loss": 3.3105887175750732, "train_acc": 0.1977, "test_loss": 8.294336575317383, "test_acc": 0.0177, "lyapunov": null, "grad_norm": 0.4959871213831781, "grad_max_sv": 0.17211879640817643, "grad_min_sv": 8.85512002890554e-09, "grad_condition": 22832904.69554911, "lr": 0.0007033683215378998, "time_sec": 66.77683353424072 }, { "epoch": 56, "train_loss": 3.3091206261444093, "train_acc": 0.19822, "test_loss": 6.872190827941894, "test_acc": 0.0233, "lyapunov": null, "grad_norm": 0.4968424527269832, "grad_max_sv": 0.16929374635219574, "grad_min_sv": 8.852659438840504e-09, "grad_condition": 21482011.311691545, "lr": 0.0006937577932260512, "time_sec": 66.7394802570343 }, { "epoch": 57, "train_loss": 3.2911807606506347, "train_acc": 0.20104, "test_loss": 6.781019482421875, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.49806961864225907, "grad_max_sv": 0.17269197143614293, "grad_min_sv": 9.028358619045385e-09, "grad_condition": 21860182.81813491, "lr": 0.0006840622763423388, "time_sec": 66.74213409423828 }, { "epoch": 58, "train_loss": 3.28923882019043, "train_acc": 0.2009, "test_loss": 7.48718016204834, "test_acc": 0.0233, "lyapunov": null, "grad_norm": 0.497037583502488, "grad_max_sv": 0.17720941305160523, "grad_min_sv": 8.923951845540844e-09, "grad_condition": 25638959.340645056, "lr": 0.0006742860236609073, "time_sec": 66.70864987373352 }, { "epoch": 59, "train_loss": 3.288974278411865, "train_acc": 0.2022, "test_loss": 6.711775099182129, "test_acc": 0.0288, "lyapunov": null, "grad_norm": 0.5006739014854031, "grad_max_sv": 0.1799727737903595, "grad_min_sv": 8.922615390982714e-09, "grad_condition": 22962596.945499133, "lr": 0.0006644333233692913, "time_sec": 66.72898769378662 }, { "epoch": 60, "train_loss": 3.283515991897583, "train_acc": 0.20374, "test_loss": 7.436810195922852, "test_acc": 0.0217, "lyapunov": null, "grad_norm": 0.4970314759637393, "grad_max_sv": 0.1713873755186796, "grad_min_sv": 8.852956717708694e-09, "grad_condition": 21460924.515540235, "lr": 0.0006545084971874734, "time_sec": 66.77793312072754 }, { "epoch": 61, "train_loss": 3.2660218312072753, "train_acc": 0.2052, "test_loss": 7.1023060356140135, "test_acc": 0.0237, "lyapunov": null, "grad_norm": 0.49642283106124174, "grad_max_sv": 0.17171172685921193, "grad_min_sv": 9.03237155625014e-09, "grad_condition": 23554914.711565603, "lr": 0.0006445158984722354, "time_sec": 66.71418523788452 }, { "epoch": 62, "train_loss": 3.254552359466553, "train_acc": 0.2084, "test_loss": 7.483150309753418, "test_acc": 0.0225, "lyapunov": null, "grad_norm": 0.4960786681631791, "grad_max_sv": 0.1668458305299282, "grad_min_sv": 8.818685695577421e-09, "grad_condition": 74094011.9951904, "lr": 0.0006344599103076324, "time_sec": 66.70579290390015 }, { "epoch": 63, "train_loss": 3.2479764625549317, "train_acc": 0.20702, "test_loss": 7.495381002807617, "test_acc": 0.0243, "lyapunov": null, "grad_norm": 0.4917077399114027, "grad_max_sv": 0.16495948433876037, "grad_min_sv": 8.864074795694732e-09, "grad_condition": 30857102.41845674, "lr": 0.0006243449435824269, "time_sec": 66.72497200965881 }, { "epoch": 64, "train_loss": 3.245808661117554, "train_acc": 0.20704, "test_loss": 6.5149994140625, "test_acc": 0.0299, "lyapunov": null, "grad_norm": 0.4942308484852371, "grad_max_sv": 0.16808778569102287, "grad_min_sv": 8.905879750331636e-09, "grad_condition": 21297665.020826895, "lr": 0.0006141754350553275, "time_sec": 66.71531987190247 }, { "epoch": 65, "train_loss": 3.2359812786102293, "train_acc": 0.20964, "test_loss": 6.7083621681213375, "test_acc": 0.0257, "lyapunov": null, "grad_norm": 0.4924300564127143, "grad_max_sv": 0.1668924294412136, "grad_min_sv": 8.814785660855167e-09, "grad_condition": 387068362.7974197, "lr": 0.0006039558454088793, "time_sec": 66.739919424057 }, { "epoch": 66, "train_loss": 3.2231747630310057, "train_acc": 0.21288, "test_loss": 6.6462861267089846, "test_acc": 0.0258, "lyapunov": null, "grad_norm": 0.49278283649554394, "grad_max_sv": 0.16672560423612595, "grad_min_sv": 8.910612160628607e-09, "grad_condition": 23460863.699399397, "lr": 0.000593690657292862, "time_sec": 66.73168134689331 }, { "epoch": 67, "train_loss": 3.2156623792266847, "train_acc": 0.21342, "test_loss": 7.029375877380371, "test_acc": 0.0223, "lyapunov": null, "grad_norm": 0.4909443834963243, "grad_max_sv": 0.16597550213336945, "grad_min_sv": 8.912085689566362e-09, "grad_condition": 31291994.15683285, "lr": 0.0005833843733580507, "time_sec": 66.72268962860107 }, { "epoch": 68, "train_loss": 3.2102099297332765, "train_acc": 0.21536, "test_loss": 6.8582941429138184, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.49321037808878027, "grad_max_sv": 0.16992229372262954, "grad_min_sv": 8.80631389199582e-09, "grad_condition": 129842817.14263825, "lr": 0.0005730415142812054, "time_sec": 66.73015308380127 }, { "epoch": 69, "train_loss": 3.2087192346191404, "train_acc": 0.21692, "test_loss": 6.703964881134033, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.4884522648005531, "grad_max_sv": 0.16176489181816578, "grad_min_sv": 8.772693779746099e-09, "grad_condition": 26469955.870484192, "lr": 0.0005626666167821517, "time_sec": 66.71746468544006 }, { "epoch": 70, "train_loss": 3.195241547088623, "train_acc": 0.21844, "test_loss": 6.542587074279785, "test_acc": 0.0284, "lyapunov": null, "grad_norm": 0.49091657002079947, "grad_max_sv": 0.16242207810282708, "grad_min_sv": 9.02578579792257e-09, "grad_condition": 23591537.371170804, "lr": 0.0005522642316338265, "time_sec": 66.72597932815552 }, { "epoch": 71, "train_loss": 3.1896180830383303, "train_acc": 0.21886, "test_loss": 6.82057219543457, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.4892216781222015, "grad_max_sv": 0.1621775720268488, "grad_min_sv": 8.926039651857565e-09, "grad_condition": 20890687.882442366, "lr": 0.0005418389216661573, "time_sec": 66.7145037651062 }, { "epoch": 72, "train_loss": 3.18413442276001, "train_acc": 0.21908, "test_loss": 7.1544591903686525, "test_acc": 0.0243, "lyapunov": null, "grad_norm": 0.48870515357132727, "grad_max_sv": 0.16475776992738247, "grad_min_sv": 8.91442188816205e-09, "grad_condition": 35365218.5794013, "lr": 0.0005313952597646563, "time_sec": 66.72212243080139 }, { "epoch": 73, "train_loss": 3.1829597901153566, "train_acc": 0.21974, "test_loss": 7.2174785011291505, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.4892142900976219, "grad_max_sv": 0.16382574513554574, "grad_min_sv": 8.810792702352264e-09, "grad_condition": 2088135479.3673325, "lr": 0.0005209378268645994, "time_sec": 66.73431754112244 }, { "epoch": 74, "train_loss": 3.172711128463745, "train_acc": 0.22268, "test_loss": 7.406581823730469, "test_acc": 0.0232, "lyapunov": null, "grad_norm": 0.48885933422631656, "grad_max_sv": 0.1622017789632082, "grad_min_sv": 8.900176362569568e-09, "grad_condition": 22065867.848713316, "lr": 0.0005104712099416781, "time_sec": 66.76118803024292 }, { "epoch": 75, "train_loss": 3.1605979063415526, "train_acc": 0.22268, "test_loss": 7.909864106750488, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.4864315646638775, "grad_max_sv": 0.16106058210134505, "grad_min_sv": 8.83298489941231e-09, "grad_condition": 46212562.907684386, "lr": 0.0004999999999999996, "time_sec": 66.70442318916321 }, { "epoch": 76, "train_loss": 3.1487682283020018, "train_acc": 0.22692, "test_loss": 7.801919015502929, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.49432790922941905, "grad_max_sv": 0.1653361301869154, "grad_min_sv": 9.004006756851979e-09, "grad_condition": 21481137.43510855, "lr": 0.0004895287900583212, "time_sec": 66.72583270072937 }, { "epoch": 77, "train_loss": 3.150441154251099, "train_acc": 0.22298, "test_loss": 7.5658083923339845, "test_acc": 0.0206, "lyapunov": null, "grad_norm": 0.4905609551233629, "grad_max_sv": 0.16559089235961438, "grad_min_sv": 9.02131503666137e-09, "grad_condition": 20767700.255871035, "lr": 0.0004790621731353997, "time_sec": 66.69700527191162 }, { "epoch": 78, "train_loss": 3.1500933878326416, "train_acc": 0.22786, "test_loss": 7.626110935974121, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.4905443897236645, "grad_max_sv": 0.16319101713597775, "grad_min_sv": 8.856467318546501e-09, "grad_condition": 30384641.86177106, "lr": 0.000468604740235343, "time_sec": 66.70938420295715 }, { "epoch": 79, "train_loss": 3.1403994177246095, "train_acc": 0.22896, "test_loss": 7.712996089172363, "test_acc": 0.0224, "lyapunov": null, "grad_norm": 0.4915245764953966, "grad_max_sv": 0.16383215487003328, "grad_min_sv": 9.000386157198559e-09, "grad_condition": 24292562.845880195, "lr": 0.00045816107833384175, "time_sec": 66.70869493484497 }, { "epoch": 80, "train_loss": 3.135038282623291, "train_acc": 0.22664, "test_loss": 7.267129122161865, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.49111047918715733, "grad_max_sv": 0.1639216773211956, "grad_min_sv": 8.921349751783367e-09, "grad_condition": 420151306.09404176, "lr": 0.0004477357683661729, "time_sec": 66.7166097164154 }, { "epoch": 81, "train_loss": 3.1244947747802736, "train_acc": 0.22956, "test_loss": 7.662328411865234, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.49289166159918185, "grad_max_sv": 0.16057575568556787, "grad_min_sv": 9.007528779803043e-09, "grad_condition": 25322164.642992593, "lr": 0.00043733338321784746, "time_sec": 66.70411825180054 }, { "epoch": 82, "train_loss": 3.1161900270080567, "train_acc": 0.23102, "test_loss": 6.92779616394043, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.49270870414948964, "grad_max_sv": 0.1599017258733511, "grad_min_sv": 9.11951086590701e-09, "grad_condition": 20698906.206454754, "lr": 0.0004269584857187939, "time_sec": 66.70752501487732 }, { "epoch": 83, "train_loss": 3.117374754104614, "train_acc": 0.23338, "test_loss": 7.148474893188476, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.4925974195490984, "grad_max_sv": 0.16150497682392598, "grad_min_sv": 8.971566273219267e-09, "grad_condition": 20007661.368726093, "lr": 0.0004166156266419484, "time_sec": 66.70796918869019 }, { "epoch": 84, "train_loss": 3.1047154219055177, "train_acc": 0.23342, "test_loss": 7.627574306488037, "test_acc": 0.0234, "lyapunov": null, "grad_norm": 0.4921892080867045, "grad_max_sv": 0.16364577710628508, "grad_min_sv": 8.967278117277822e-09, "grad_condition": 20465428.39487014, "lr": 0.0004063093427071373, "time_sec": 66.70926451683044 }, { "epoch": 85, "train_loss": 3.0953226109313965, "train_acc": 0.23356, "test_loss": 7.637861351776123, "test_acc": 0.0254, "lyapunov": null, "grad_norm": 0.49401889904765806, "grad_max_sv": 0.16418364495038987, "grad_min_sv": 8.915860015990679e-09, "grad_condition": 203043858.99741915, "lr": 0.0003960441545911199, "time_sec": 66.6929943561554 }, { "epoch": 86, "train_loss": 3.0932106770324705, "train_acc": 0.23452, "test_loss": 7.435467148590088, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.4934388084197917, "grad_max_sv": 0.16211238466203212, "grad_min_sv": 9.0381108895643e-09, "grad_condition": 38210459.14289879, "lr": 0.0003858245649446718, "time_sec": 66.71461033821106 }, { "epoch": 87, "train_loss": 3.091542336883545, "train_acc": 0.23574, "test_loss": 7.27965379486084, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.49327307505927953, "grad_max_sv": 0.1624306257814169, "grad_min_sv": 9.051206378840603e-09, "grad_condition": 19977131.887911893, "lr": 0.00037565505641757235, "time_sec": 66.7017343044281 }, { "epoch": 88, "train_loss": 3.0846370722961427, "train_acc": 0.2367, "test_loss": 7.714011827087402, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.49521950469943726, "grad_max_sv": 0.16350008510053157, "grad_min_sv": 9.132233064201855e-09, "grad_condition": 20496153.697574906, "lr": 0.00036554008969236695, "time_sec": 66.80735445022583 }, { "epoch": 89, "train_loss": 3.067184111480713, "train_acc": 0.23956, "test_loss": 7.469543979644776, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.49450885750587337, "grad_max_sv": 0.16215350292623043, "grad_min_sv": 9.075074243122815e-09, "grad_condition": 63145499.63971396, "lr": 0.0003554841015277638, "time_sec": 66.7019522190094 }, { "epoch": 90, "train_loss": 3.0696119786071776, "train_acc": 0.23776, "test_loss": 7.227960666656494, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.49496033151417024, "grad_max_sv": 0.15985839106142521, "grad_min_sv": 9.114914140302688e-09, "grad_condition": 88232236.67419389, "lr": 0.000345491502812526, "time_sec": 66.71336770057678 }, { "epoch": 91, "train_loss": 3.0570466086578367, "train_acc": 0.24112, "test_loss": 7.087581924438476, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.49532470616490887, "grad_max_sv": 0.16271125935018063, "grad_min_sv": 9.14848334726548e-09, "grad_condition": 28858228.725753903, "lr": 0.0003355666766307081, "time_sec": 66.71155142784119 }, { "epoch": 92, "train_loss": 3.060674235687256, "train_acc": 0.24284, "test_loss": 7.354493684387207, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.49422169257384346, "grad_max_sv": 0.16212479658424855, "grad_min_sv": 9.094859150515777e-09, "grad_condition": 27013716.07646851, "lr": 0.00032571397633909225, "time_sec": 66.73360872268677 }, { "epoch": 93, "train_loss": 3.045851851577759, "train_acc": 0.24666, "test_loss": 6.961697528839111, "test_acc": 0.0257, "lyapunov": null, "grad_norm": 0.4943781413484412, "grad_max_sv": 0.15829392597079278, "grad_min_sv": 9.1174124181026e-09, "grad_condition": 24719922.26471028, "lr": 0.00031593772365766094, "time_sec": 66.72647047042847 }, { "epoch": 94, "train_loss": 3.0384512644958495, "train_acc": 0.24492, "test_loss": 7.376283264160156, "test_acc": 0.028, "lyapunov": null, "grad_norm": 0.49582915049730736, "grad_max_sv": 0.1624866124242544, "grad_min_sv": 9.118276048341972e-09, "grad_condition": 727643917.2657491, "lr": 0.0003062422067739483, "time_sec": 66.70089149475098 }, { "epoch": 95, "train_loss": 3.039133260345459, "train_acc": 0.24476, "test_loss": 7.406265617370606, "test_acc": 0.0298, "lyapunov": null, "grad_norm": 0.4964727526376002, "grad_max_sv": 0.15984426029026508, "grad_min_sv": 9.0936182872009e-09, "grad_condition": 53822276.22529755, "lr": 0.00029663167846209965, "time_sec": 66.71791744232178 }, { "epoch": 96, "train_loss": 3.0375169485473634, "train_acc": 0.24388, "test_loss": 7.3450915855407715, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.4980105941759735, "grad_max_sv": 0.1639113176614046, "grad_min_sv": 9.174823172204694e-09, "grad_condition": 75847501.33547327, "lr": 0.00028711035421746345, "time_sec": 66.74349761009216 }, { "epoch": 97, "train_loss": 3.036133956604004, "train_acc": 0.2481, "test_loss": 7.577465545654297, "test_acc": 0.0264, "lyapunov": null, "grad_norm": 0.4958252185119339, "grad_max_sv": 0.16029710061848162, "grad_min_sv": 8.978423951533366e-09, "grad_condition": 19961795.980553128, "lr": 0.00027768241040753615, "time_sec": 66.72821807861328 }, { "epoch": 98, "train_loss": 3.021324711227417, "train_acc": 0.25076, "test_loss": 7.219669580841065, "test_acc": 0.0303, "lyapunov": null, "grad_norm": 0.4970296963841891, "grad_max_sv": 0.16001575216650962, "grad_min_sv": 9.067042531715752e-09, "grad_condition": 41223693.265652105, "lr": 0.00026835198244006903, "time_sec": 66.74218535423279 }, { "epoch": 99, "train_loss": 3.0151924266815184, "train_acc": 0.25042, "test_loss": 7.808471519470215, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.497912540335549, "grad_max_sv": 0.1632791668176651, "grad_min_sv": 9.184349171464934e-09, "grad_condition": 23400737.365473915, "lr": 0.0002591231629491421, "time_sec": 66.70754623413086 }, { "epoch": 100, "train_loss": 3.0173143773651123, "train_acc": 0.24922, "test_loss": 7.265430112457276, "test_acc": 0.028, "lyapunov": null, "grad_norm": 0.49818870466542803, "grad_max_sv": 0.16289953589439393, "grad_min_sv": 9.281307221387091e-09, "grad_condition": 23108793.760435097, "lr": 0.0002499999999999997, "time_sec": 66.74620199203491 }, { "epoch": 101, "train_loss": 3.0063516328430175, "train_acc": 0.25068, "test_loss": 7.405182618713379, "test_acc": 0.0321, "lyapunov": null, "grad_norm": 0.4980158759477165, "grad_max_sv": 0.16276963874697686, "grad_min_sv": 9.112035989633505e-09, "grad_condition": 21414811.754604597, "lr": 0.00024098649531343477, "time_sec": 66.74015522003174 }, { "epoch": 102, "train_loss": 3.004280758743286, "train_acc": 0.25098, "test_loss": 7.399062448120117, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.500738337792044, "grad_max_sv": 0.1635062240064144, "grad_min_sv": 9.288643754157277e-09, "grad_condition": 21845553.2838238, "lr": 0.0002320866025105016, "time_sec": 66.69196605682373 }, { "epoch": 103, "train_loss": 2.9984512678527833, "train_acc": 0.2512, "test_loss": 7.320097260284424, "test_acc": 0.0284, "lyapunov": null, "grad_norm": 0.4980454163272628, "grad_max_sv": 0.1580117117613554, "grad_min_sv": 9.07426482149587e-09, "grad_condition": 30985957.899948187, "lr": 0.0002233042253783278, "time_sec": 66.74033546447754 }, { "epoch": 104, "train_loss": 2.99728506942749, "train_acc": 0.25086, "test_loss": 7.463210521697998, "test_acc": 0.0329, "lyapunov": null, "grad_norm": 0.5009998323620124, "grad_max_sv": 0.16469128727912902, "grad_min_sv": 9.2030743081839e-09, "grad_condition": 22045083.846339237, "lr": 0.000214643216157784, "time_sec": 66.72671890258789 }, { "epoch": 105, "train_loss": 2.9898451292419432, "train_acc": 0.25504, "test_loss": 7.531641695404053, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.5022636847492568, "grad_max_sv": 0.16528656147420406, "grad_min_sv": 9.158518983476415e-09, "grad_condition": 24732730.3300323, "lr": 0.00020610737385376332, "time_sec": 66.72895193099976 }, { "epoch": 106, "train_loss": 2.984173779754639, "train_acc": 0.25438, "test_loss": 7.581431744384766, "test_acc": 0.0273, "lyapunov": null, "grad_norm": 0.5028431980176926, "grad_max_sv": 0.1630011171102524, "grad_min_sv": 9.238039688774791e-09, "grad_condition": 20675234.791328143, "lr": 0.00019770044256881242, "time_sec": 66.73670959472656 }, { "epoch": 107, "train_loss": 2.974853392868042, "train_acc": 0.25748, "test_loss": 7.1432702926635745, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 0.49959385619284613, "grad_max_sv": 0.16204869262874128, "grad_min_sv": 9.195193381716926e-09, "grad_condition": 21149671.894155927, "lr": 0.0001894261098608447, "time_sec": 66.74563598632812 }, { "epoch": 108, "train_loss": 2.9721791679382323, "train_acc": 0.25728, "test_loss": 7.795809649658203, "test_acc": 0.0298, "lyapunov": null, "grad_norm": 0.4995722502777866, "grad_max_sv": 0.15964266508817673, "grad_min_sv": 9.203898770904218e-09, "grad_condition": 20323974.743836712, "lr": 0.000181288005125655, "time_sec": 66.73793625831604 }, { "epoch": 109, "train_loss": 2.970719254760742, "train_acc": 0.25944, "test_loss": 7.365542489624024, "test_acc": 0.0299, "lyapunov": null, "grad_norm": 0.500757198933526, "grad_max_sv": 0.16609507314860822, "grad_min_sv": 9.356035884922065e-09, "grad_condition": 20439457.080971286, "lr": 0.0001732896980049473, "time_sec": 66.7298583984375 }, { "epoch": 110, "train_loss": 2.972525007095337, "train_acc": 0.25712, "test_loss": 7.133980830383301, "test_acc": 0.0312, "lyapunov": null, "grad_norm": 0.5042334021436244, "grad_max_sv": 0.15981336012482644, "grad_min_sv": 9.288604266299849e-09, "grad_condition": 21280953.98530178, "lr": 0.00016543469682057076, "time_sec": 66.76267719268799 }, { "epoch": 111, "train_loss": 2.9631910160827637, "train_acc": 0.25998, "test_loss": 7.417809590148925, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.5014056320574171, "grad_max_sv": 0.16821228563785554, "grad_min_sv": 9.333871581716779e-09, "grad_condition": 101661462.28679642, "lr": 0.00015772644703565552, "time_sec": 66.72111940383911 }, { "epoch": 112, "train_loss": 2.9575250452423094, "train_acc": 0.26008, "test_loss": 7.389129028320313, "test_acc": 0.0277, "lyapunov": null, "grad_norm": 0.5007918938537274, "grad_max_sv": 0.16079586669802665, "grad_min_sv": 9.307818968351534e-09, "grad_condition": 20753238.25422468, "lr": 0.00015016832974331713, "time_sec": 66.72973942756653 }, { "epoch": 113, "train_loss": 2.952999960632324, "train_acc": 0.26198, "test_loss": 7.37722262878418, "test_acc": 0.0287, "lyapunov": null, "grad_norm": 0.5013173930748581, "grad_max_sv": 0.16444203816354275, "grad_min_sv": 9.318139330971587e-09, "grad_condition": 26788166.113831718, "lr": 0.00014276366018359834, "time_sec": 66.83487486839294 }, { "epoch": 114, "train_loss": 2.948192635574341, "train_acc": 0.26038, "test_loss": 7.436811110687255, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.5032371113955786, "grad_max_sv": 0.1634738527238369, "grad_min_sv": 9.2874662635219e-09, "grad_condition": 319138381.19418097, "lr": 0.00013551568628929425, "time_sec": 66.70622992515564 }, { "epoch": 115, "train_loss": 2.9517051191711428, "train_acc": 0.26036, "test_loss": 7.19214797668457, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.5054472421665304, "grad_max_sv": 0.16728437952697278, "grad_min_sv": 9.324679213496e-09, "grad_condition": 26191438.542866766, "lr": 0.00012842758726130276, "time_sec": 66.71952223777771 }, { "epoch": 116, "train_loss": 2.9479563136291502, "train_acc": 0.25988, "test_loss": 7.865117324829102, "test_acc": 0.0272, "lyapunov": null, "grad_norm": 0.501425656974135, "grad_max_sv": 0.16254092417657376, "grad_min_sv": 9.171186369366646e-09, "grad_condition": 43416689.99828492, "lr": 0.0001215024721741218, "time_sec": 66.74095702171326 }, { "epoch": 117, "train_loss": 2.9373822256469726, "train_acc": 0.26326, "test_loss": 7.544526052856446, "test_acc": 0.0288, "lyapunov": null, "grad_norm": 0.5031467536307935, "grad_max_sv": 0.16549900099635123, "grad_min_sv": 9.4188400051598e-09, "grad_condition": 19833315.44179687, "lr": 0.00011474337861210538, "time_sec": 66.72034072875977 }, { "epoch": 118, "train_loss": 2.9374622593688966, "train_acc": 0.26362, "test_loss": 7.940575238037109, "test_acc": 0.0276, "lyapunov": null, "grad_norm": 0.502189701036258, "grad_max_sv": 0.1663150992244482, "grad_min_sv": 9.337868267511595e-09, "grad_condition": 22055002.57718137, "lr": 0.00010815327133708009, "time_sec": 66.71819615364075 }, { "epoch": 119, "train_loss": 2.9290069982910154, "train_acc": 0.26682, "test_loss": 8.381109976196289, "test_acc": 0.0245, "lyapunov": null, "grad_norm": 0.5022580399945052, "grad_max_sv": 0.16189948543906213, "grad_min_sv": 9.334797540505591e-09, "grad_condition": 53795996.97598307, "lr": 0.00010173504098790182, "time_sec": 66.73639011383057 }, { "epoch": 120, "train_loss": 2.927497018890381, "train_acc": 0.26494, "test_loss": 8.134235343933106, "test_acc": 0.0268, "lyapunov": null, "grad_norm": 0.5044191934677914, "grad_max_sv": 0.1647841826081276, "grad_min_sv": 9.31749464250231e-09, "grad_condition": 21075801.592136864, "lr": 9.549150281252629e-05, "time_sec": 66.71619915962219 }, { "epoch": 121, "train_loss": 2.9210917962646485, "train_acc": 0.2676, "test_loss": 7.665898156738281, "test_acc": 0.0284, "lyapunov": null, "grad_norm": 0.505046124945648, "grad_max_sv": 0.16069133542478084, "grad_min_sv": 9.383237816254498e-09, "grad_condition": 53773449.70699586, "lr": 8.942539543314794e-05, "time_sec": 66.7949550151825 }, { "epoch": 122, "train_loss": 2.9300759950256348, "train_acc": 0.26686, "test_loss": 7.947439320373535, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.5039924043792687, "grad_max_sv": 0.16329768523573876, "grad_min_sv": 9.309516596847645e-09, "grad_condition": 105483269.53547074, "lr": 8.353937964495024e-05, "time_sec": 66.70848250389099 }, { "epoch": 123, "train_loss": 2.91971375289917, "train_acc": 0.26734, "test_loss": 7.80317967376709, "test_acc": 0.0286, "lyapunov": null, "grad_norm": 0.5061715705620777, "grad_max_sv": 0.16143706440925598, "grad_min_sv": 9.3223205665377e-09, "grad_condition": 44714095.26064149, "lr": 7.783603724899243e-05, "time_sec": 66.75235438346863 }, { "epoch": 124, "train_loss": 2.920988783569336, "train_acc": 0.2672, "test_loss": 7.688530905151367, "test_acc": 0.0267, "lyapunov": null, "grad_norm": 0.5036561383144873, "grad_max_sv": 0.16541591919958593, "grad_min_sv": 9.339689868714807e-09, "grad_condition": 21082674.48603835, "lr": 7.231786991974666e-05, "time_sec": 66.7428572177887 }, { "epoch": 125, "train_loss": 2.9158429930877685, "train_acc": 0.26972, "test_loss": 7.870475231933594, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.5050163715028828, "grad_max_sv": 0.16450283974409102, "grad_min_sv": 9.300618648844239e-09, "grad_condition": 22745467.54728716, "lr": 6.698729810778072e-05, "time_sec": 66.70153951644897 }, { "epoch": 126, "train_loss": 2.9174345250701905, "train_acc": 0.26804, "test_loss": 7.7597047775268555, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.5054786147107485, "grad_max_sv": 0.16298311799764634, "grad_min_sv": 9.272562198105183e-09, "grad_condition": 355815933.8318427, "lr": 6.184665997806817e-05, "time_sec": 66.70234727859497 }, { "epoch": 127, "train_loss": 2.9025824697875975, "train_acc": 0.26988, "test_loss": 7.446964788818359, "test_acc": 0.0276, "lyapunov": null, "grad_norm": 0.5066198768830174, "grad_max_sv": 0.1645387414842844, "grad_min_sv": 9.428870359484698e-09, "grad_condition": 20208395.537682876, "lr": 5.6898210384392595e-05, "time_sec": 66.714515209198 }, { "epoch": 128, "train_loss": 2.915607092437744, "train_acc": 0.26734, "test_loss": 7.931312725830078, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.5071889354627791, "grad_max_sv": 0.16293769851326942, "grad_min_sv": 9.389047653241001e-09, "grad_condition": 19442274.807418514, "lr": 5.214411988029363e-05, "time_sec": 66.77645683288574 }, { "epoch": 129, "train_loss": 2.9043918053436277, "train_acc": 0.27058, "test_loss": 7.705898820495605, "test_acc": 0.0294, "lyapunov": null, "grad_norm": 0.5061548650342338, "grad_max_sv": 0.1668264877051115, "grad_min_sv": 9.293020419853803e-09, "grad_condition": 22634656.7147369, "lr": 4.7586473766990294e-05, "time_sec": 66.68853044509888 }, { "epoch": 130, "train_loss": 2.9112479612731934, "train_acc": 0.2704, "test_loss": 7.656457232666016, "test_acc": 0.0278, "lyapunov": null, "grad_norm": 0.5055330426804672, "grad_max_sv": 0.162294964119792, "grad_min_sv": 9.291567426572556e-09, "grad_condition": 22558154.425069276, "lr": 4.32272711786996e-05, "time_sec": 66.69644737243652 }, { "epoch": 131, "train_loss": 2.9026712393951417, "train_acc": 0.26934, "test_loss": 7.7139065521240235, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.5078534676699445, "grad_max_sv": 0.16336566992104054, "grad_min_sv": 9.403588141498886e-09, "grad_condition": 20579658.983666856, "lr": 3.906842420574966e-05, "time_sec": 66.69969606399536 }, { "epoch": 132, "train_loss": 2.8976589154815673, "train_acc": 0.27122, "test_loss": 7.718105026245118, "test_acc": 0.026, "lyapunov": null, "grad_norm": 0.5077215533015317, "grad_max_sv": 0.16301583163440228, "grad_min_sv": 9.312006112038862e-09, "grad_condition": 27087738.24954634, "lr": 3.5111757055874305e-05, "time_sec": 66.74734258651733 }, { "epoch": 133, "train_loss": 2.9053258415222167, "train_acc": 0.26974, "test_loss": 7.773404074859619, "test_acc": 0.029, "lyapunov": null, "grad_norm": 0.5077078460971154, "grad_max_sv": 0.16176522485911846, "grad_min_sv": 9.38179235271397e-09, "grad_condition": 22801102.593637146, "lr": 3.1359005254054254e-05, "time_sec": 66.71020007133484 }, { "epoch": 134, "train_loss": 2.90214939994812, "train_acc": 0.2685, "test_loss": 7.735068745422363, "test_acc": 0.0283, "lyapunov": null, "grad_norm": 0.5056827916750407, "grad_max_sv": 0.16394426934421064, "grad_min_sv": 9.382484492375525e-09, "grad_condition": 273849135.71961355, "lr": 2.7811814881259484e-05, "time_sec": 66.72329211235046 }, { "epoch": 135, "train_loss": 2.8955694792175293, "train_acc": 0.27204, "test_loss": 8.074042736816406, "test_acc": 0.0263, "lyapunov": null, "grad_norm": 0.5072891279476816, "grad_max_sv": 0.1647134818136692, "grad_min_sv": 9.274373982681716e-09, "grad_condition": 20878941.234711803, "lr": 2.4471741852423218e-05, "time_sec": 66.69911003112793 }, { "epoch": 136, "train_loss": 2.901527007369995, "train_acc": 0.272, "test_loss": 7.88837564239502, "test_acc": 0.0256, "lyapunov": null, "grad_norm": 0.5069997382716037, "grad_max_sv": 0.16248776540160179, "grad_min_sv": 9.28558460677742e-09, "grad_condition": 26142069.423716225, "lr": 2.1340251233966362e-05, "time_sec": 66.73573279380798 }, { "epoch": 137, "train_loss": 2.8907382415008547, "train_acc": 0.2728, "test_loss": 8.04134146270752, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.506922138474151, "grad_max_sv": 0.16456650160253047, "grad_min_sv": 9.394744830693025e-09, "grad_condition": 22952282.106423754, "lr": 1.8418716601170932e-05, "time_sec": 66.72893476486206 }, { "epoch": 138, "train_loss": 2.8925764886474608, "train_acc": 0.27096, "test_loss": 7.848298292541504, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.5070877996969257, "grad_max_sv": 0.16335688717663288, "grad_min_sv": 9.458600758183167e-09, "grad_condition": 21212816.652376812, "lr": 1.570841943568445e-05, "time_sec": 66.69498014450073 }, { "epoch": 139, "train_loss": 2.8905470305633547, "train_acc": 0.2723, "test_loss": 7.805370147705078, "test_acc": 0.0276, "lyapunov": null, "grad_norm": 0.5091697345599102, "grad_max_sv": 0.16748546734452247, "grad_min_sv": 9.554275959278158e-09, "grad_condition": 21817543.256782603, "lr": 1.3210548563419845e-05, "time_sec": 66.69882249832153 }, { "epoch": 140, "train_loss": 2.8900568451690676, "train_acc": 0.2725, "test_loss": 8.150068646240234, "test_acc": 0.0263, "lyapunov": null, "grad_norm": 0.5094580986389692, "grad_max_sv": 0.16614943966269494, "grad_min_sv": 9.441066034510115e-09, "grad_condition": 25708375.318254933, "lr": 1.0926199633097203e-05, "time_sec": 66.72957038879395 }, { "epoch": 141, "train_loss": 2.8928156049346923, "train_acc": 0.27302, "test_loss": 7.946534848022461, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.5089732688724395, "grad_max_sv": 0.1660338044166565, "grad_min_sv": 9.440311787671519e-09, "grad_condition": 79734166.44560626, "lr": 8.856374635655688e-06, "time_sec": 66.7075400352478 }, { "epoch": 142, "train_loss": 2.88548219871521, "train_acc": 0.27172, "test_loss": 8.169772109985352, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.5086553359451463, "grad_max_sv": 0.16840459816157818, "grad_min_sv": 9.377848261826749e-09, "grad_condition": 22023976.535071947, "lr": 7.001981464747503e-06, "time_sec": 66.71758651733398 }, { "epoch": 143, "train_loss": 2.89183920753479, "train_acc": 0.27372, "test_loss": 7.852110308837891, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.5094733139547303, "grad_max_sv": 0.16687579974532127, "grad_min_sv": 9.444928218693693e-09, "grad_condition": 24477411.004352577, "lr": 5.3638335185058295e-06, "time_sec": 66.72722506523132 }, { "epoch": 144, "train_loss": 2.8904072105407717, "train_acc": 0.27378, "test_loss": 8.066141241455078, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.5089427679493953, "grad_max_sv": 0.1690099250525236, "grad_min_sv": 9.382681727398978e-09, "grad_condition": 24070995.123834018, "lr": 3.942649342761114e-06, "time_sec": 66.73601293563843 }, { "epoch": 145, "train_loss": 2.8936181242370607, "train_acc": 0.27214, "test_loss": 8.10545317993164, "test_acc": 0.0258, "lyapunov": null, "grad_norm": 0.507865092838002, "grad_max_sv": 0.1655246399343014, "grad_min_sv": 9.371320355833212e-09, "grad_condition": 20893591.384689607, "lr": 2.7390523158633524e-06, "time_sec": 66.70678782463074 }, { "epoch": 146, "train_loss": 2.894159292755127, "train_acc": 0.27236, "test_loss": 7.739997250366211, "test_acc": 0.0282, "lyapunov": null, "grad_norm": 0.5079666742519956, "grad_max_sv": 0.16401765793561934, "grad_min_sv": 9.365164058139363e-09, "grad_condition": 30379279.137967873, "lr": 1.7535703752478133e-06, "time_sec": 66.73851418495178 }, { "epoch": 147, "train_loss": 2.892810397796631, "train_acc": 0.27236, "test_loss": 8.097870037841798, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.5083955380496783, "grad_max_sv": 0.16239417865872383, "grad_min_sv": 9.437153494773476e-09, "grad_condition": 22581567.79918761, "lr": 9.866357858642196e-07, "time_sec": 66.69952964782715 }, { "epoch": 148, "train_loss": 2.8858398888397216, "train_acc": 0.27292, "test_loss": 7.955520216369629, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.5081646285749641, "grad_max_sv": 0.1665601458400488, "grad_min_sv": 9.4039764724082e-09, "grad_condition": 2788122152.665894, "lr": 4.38584950570808e-07, "time_sec": 66.72941470146179 }, { "epoch": 149, "train_loss": 2.8937516955566407, "train_acc": 0.27344, "test_loss": 8.195967932128907, "test_acc": 0.0259, "lyapunov": null, "grad_norm": 0.5088598826502255, "grad_max_sv": 0.16467942893505097, "grad_min_sv": 9.292379346548252e-09, "grad_condition": 20098211.57433509, "lr": 1.096582625772501e-07, "time_sec": 66.7379686832428 }, { "epoch": 150, "train_loss": 2.8891425512695315, "train_acc": 0.27354, "test_loss": 8.199688424682618, "test_acc": 0.0264, "lyapunov": null, "grad_norm": 0.5085081625178647, "grad_max_sv": 0.17037647701799868, "grad_min_sv": 9.396511368997551e-09, "grad_condition": 30341616.600583784, "lr": 0.0, "time_sec": 66.7265522480011 } ] }, "lyapunov": { "4": [ { "epoch": 1, "train_loss": 4.600389208526611, "train_acc": 0.07146, "test_loss": 4.086850812530518, "test_acc": 0.089, "lyapunov": 2.088574398813955, "grad_norm": 5.951641147060766, "grad_max_sv": 4.604718941450119, "grad_min_sv": 1.0862287848634189e-07, "grad_condition": 102934308.40827194, "lr": 0.0009998903417374227, "time_sec": 41.90148162841797 }, { "epoch": 2, "train_loss": 4.154245112686157, "train_acc": 0.09378, "test_loss": 4.727289266204834, "test_acc": 0.049, "lyapunov": 1.675386021509195, "grad_norm": 3.9336812922654714, "grad_max_sv": 2.925524663925171, "grad_min_sv": 7.262743817529338e-08, "grad_condition": 424809238.9666936, "lr": 0.0009995614150494292, "time_sec": 41.78368663787842 }, { "epoch": 3, "train_loss": 4.027823886566162, "train_acc": 0.1086, "test_loss": 5.036119989776611, "test_acc": 0.0347, "lyapunov": 1.6001547501825006, "grad_norm": 3.0745862198210694, "grad_max_sv": 2.1295204132795336, "grad_min_sv": 5.70765142704488e-08, "grad_condition": 40571486.668118164, "lr": 0.0009990133642141358, "time_sec": 41.703768253326416 }, { "epoch": 4, "train_loss": 3.9490097280883787, "train_acc": 0.1205, "test_loss": 6.33214266204834, "test_acc": 0.0188, "lyapunov": 1.5750604392317555, "grad_norm": 2.373335141934517, "grad_max_sv": 1.5385636299848557, "grad_min_sv": 4.3810931549259635e-08, "grad_condition": 41690835.43861919, "lr": 0.0009982464296247522, "time_sec": 41.732722997665405 }, { "epoch": 5, "train_loss": 3.9766585917663573, "train_acc": 0.11954, "test_loss": 8.71332287902832, "test_acc": 0.0188, "lyapunov": 1.565549552593085, "grad_norm": 2.0246690982621796, "grad_max_sv": 1.2804439306259154, "grad_min_sv": 3.6991484700377165e-08, "grad_condition": 85372782.32745245, "lr": 0.0009972609476841367, "time_sec": 41.76529860496521 }, { "epoch": 6, "train_loss": 4.073858399047851, "train_acc": 0.11056, "test_loss": 9.466819995117188, "test_acc": 0.0223, "lyapunov": 1.5455034062685564, "grad_norm": 1.7934086339665274, "grad_max_sv": 1.104438428580761, "grad_min_sv": 3.247254408700328e-08, "grad_condition": 45291989.58759006, "lr": 0.000996057350657239, "time_sec": 41.74420213699341 }, { "epoch": 7, "train_loss": 4.1445047888183595, "train_acc": 0.10608, "test_loss": 10.480993731689454, "test_acc": 0.0156, "lyapunov": 1.5415380177900309, "grad_norm": 1.5679408505934445, "grad_max_sv": 0.9464981764554977, "grad_min_sv": 2.8262019316493968e-08, "grad_condition": 54295754.70226411, "lr": 0.000994636166481494, "time_sec": 41.73182463645935 }, { "epoch": 8, "train_loss": 4.26063258026123, "train_acc": 0.09112, "test_loss": 7.7578563934326175, "test_acc": 0.0186, "lyapunov": 1.5429353631670824, "grad_norm": 1.3464117763442929, "grad_max_sv": 0.7779564633965492, "grad_min_sv": 2.375586672376251e-08, "grad_condition": 62692972.26952485, "lr": 0.0009929980185352525, "time_sec": 41.739473819732666 }, { "epoch": 9, "train_loss": 4.513377053375244, "train_acc": 0.05922, "test_loss": 7.138281170654297, "test_acc": 0.011, "lyapunov": 1.5319068190996603, "grad_norm": 1.139364674598679, "grad_max_sv": 0.6511225394904614, "grad_min_sv": 1.8816128205534354e-08, "grad_condition": 44484041.03115648, "lr": 0.0009911436253643444, "time_sec": 41.73070311546326 }, { "epoch": 10, "train_loss": 4.696486204833985, "train_acc": 0.03644, "test_loss": 8.94805923461914, "test_acc": 0.01, "lyapunov": 1.4879300298593234, "grad_norm": 0.9658719057515597, "grad_max_sv": 0.6352818965911865, "grad_min_sv": 1.4476460679876436e-08, "grad_condition": 2057995491.241798, "lr": 0.0009890738003669028, "time_sec": 41.76564049720764 }, { "epoch": 11, "train_loss": 4.811119628295899, "train_acc": 0.03002, "test_loss": 8.594207092285156, "test_acc": 0.01, "lyapunov": 1.545145396381388, "grad_norm": 0.9564458204494278, "grad_max_sv": 0.6685591802001, "grad_min_sv": 1.3870340914018398e-08, "grad_condition": 146809154.0196677, "lr": 0.00098678945143658, "time_sec": 41.74543738365173 }, { "epoch": 12, "train_loss": 4.975349290466308, "train_acc": 0.01658, "test_loss": 8.6747091796875, "test_acc": 0.0114, "lyapunov": 1.4708023967645358, "grad_norm": 0.7817948112887597, "grad_max_sv": 0.603185323625803, "grad_min_sv": 9.743947088081129e-09, "grad_condition": 67868723.94202444, "lr": 0.0009842915805643154, "time_sec": 41.7559871673584 }, { "epoch": 13, "train_loss": 5.0296261746215825, "train_acc": 0.01604, "test_loss": 11.79697481994629, "test_acc": 0.01, "lyapunov": 1.5253148819784375, "grad_norm": 0.5736780904158933, "grad_max_sv": 0.42879281714558604, "grad_min_sv": 6.762437510681764e-09, "grad_condition": 1079134295.4881654, "lr": 0.000981581283398829, "time_sec": 41.76394009590149 }, { "epoch": 14, "train_loss": 5.057629988555909, "train_acc": 0.00992, "test_loss": 8.410659944152831, "test_acc": 0.01, "lyapunov": 1.4446861634169088, "grad_norm": 0.39926683732439516, "grad_max_sv": 0.33072102442383766, "grad_min_sv": 4.070671115463664e-09, "grad_condition": 171229170.03266063, "lr": 0.0009786597487660333, "time_sec": 41.78986120223999 }, { "epoch": 15, "train_loss": 5.068990168609619, "train_acc": 0.01004, "test_loss": 8.000550273132324, "test_acc": 0.01, "lyapunov": 1.4198117143357807, "grad_norm": 0.31403539953973636, "grad_max_sv": 0.261398883163929, "grad_min_sv": 2.518455900589597e-09, "grad_condition": 1889483827.2041466, "lr": 0.0009755282581475766, "time_sec": 41.803417682647705 }, { "epoch": 16, "train_loss": 5.098585692901612, "train_acc": 0.00948, "test_loss": 8.965616151428222, "test_acc": 0.01, "lyapunov": 1.4220252604130894, "grad_norm": 0.2674000226215519, "grad_max_sv": 0.2171985387802124, "grad_min_sv": 6.561514876139448e-10, "grad_condition": 51847368847.70773, "lr": 0.0009721881851187403, "time_sec": 41.763081789016724 }, { "epoch": 17, "train_loss": 5.128935182189942, "train_acc": 0.0104, "test_loss": 7.713327481842041, "test_acc": 0.01, "lyapunov": 1.4243087640503789, "grad_norm": 0.2268635753508302, "grad_max_sv": 0.17724891044199467, "grad_min_sv": 1.1410712791450972e-12, "grad_condition": 106447262687.9498, "lr": 0.0009686409947459456, "time_sec": 41.777748823165894 }, { "epoch": 18, "train_loss": 5.169684513702393, "train_acc": 0.00924, "test_loss": 9.309846389770508, "test_acc": 0.01, "lyapunov": 1.4357064035542482, "grad_norm": 0.2142537464973637, "grad_max_sv": 0.1502558846026659, "grad_min_sv": 4.244580750085834e-13, "grad_condition": 128309590371.45757, "lr": 0.0009648882429441254, "time_sec": 41.78967308998108 }, { "epoch": 19, "train_loss": 5.18758517288208, "train_acc": 0.01042, "test_loss": 9.819900524902344, "test_acc": 0.01, "lyapunov": 1.4233030394824875, "grad_norm": 0.1952009554667118, "grad_max_sv": 0.14073190968483687, "grad_min_sv": 2.6230090465217223e-13, "grad_condition": 123371153139.15, "lr": 0.00096093157579425, "time_sec": 41.77319002151489 }, { "epoch": 20, "train_loss": 5.217939367370605, "train_acc": 0.00912, "test_loss": 9.18544906463623, "test_acc": 0.01, "lyapunov": 1.4247246755053624, "grad_norm": 0.15876002882735193, "grad_max_sv": 0.10825764928013086, "grad_min_sv": 3.338896381884262e-15, "grad_condition": 107875834900.70416, "lr": 0.0009567727288213001, "time_sec": 41.805402517318726 }, { "epoch": 21, "train_loss": 5.2237202166748045, "train_acc": 0.00884, "test_loss": 7.853615603637695, "test_acc": 0.01, "lyapunov": 1.4316062283942768, "grad_norm": 0.16150401588518373, "grad_max_sv": 0.09900619480758906, "grad_min_sv": 6.6800742534662695e-15, "grad_condition": 98362933683.42502, "lr": 0.0009524135262330095, "time_sec": 41.81541037559509 }, { "epoch": 22, "train_loss": 5.223462156219482, "train_acc": 0.00896, "test_loss": 7.39350982055664, "test_acc": 0.01, "lyapunov": 1.4326209281106739, "grad_norm": 0.1473213530853359, "grad_max_sv": 0.07929724231362342, "grad_min_sv": 1.359730040562078e-16, "grad_condition": 79286860137.91084, "lr": 0.0009478558801197061, "time_sec": 41.77298974990845 }, { "epoch": 23, "train_loss": 5.2433684585571285, "train_acc": 0.0104, "test_loss": 7.137277140808106, "test_acc": 0.01, "lyapunov": 1.4520324453368516, "grad_norm": 0.1808576226701931, "grad_max_sv": 0.0958871865645051, "grad_min_sv": 8.016626722354409e-12, "grad_condition": 91441708516.60077, "lr": 0.000943101789615607, "time_sec": 41.78183579444885 }, { "epoch": 24, "train_loss": 5.227817250061035, "train_acc": 0.01018, "test_loss": 6.776467510986328, "test_acc": 0.01, "lyapunov": 1.4379125001180508, "grad_norm": 0.12771270098590454, "grad_max_sv": 0.06905819587409497, "grad_min_sv": 2.599435841374051e-17, "grad_condition": 69055853998.34868, "lr": 0.0009381533400219313, "time_sec": 41.771769285202026 }, { "epoch": 25, "train_loss": 5.245168194122314, "train_acc": 0.0099, "test_loss": 6.430454106140137, "test_acc": 0.01, "lyapunov": 1.4564172242913405, "grad_norm": 0.12472749302013317, "grad_max_sv": 0.05845061130821705, "grad_min_sv": 1.194259418817754e-40, "grad_condition": 58450611308.21704, "lr": 0.0009330127018922189, "time_sec": 41.770474433898926 }, { "epoch": 26, "train_loss": 5.246722939758301, "train_acc": 0.00928, "test_loss": 6.331733448791504, "test_acc": 0.01, "lyapunov": 1.4580842101055642, "grad_norm": 0.1662077239803915, "grad_max_sv": 0.06711247004568577, "grad_min_sv": 3.516773949087515e-14, "grad_condition": 65770012096.831566, "lr": 0.000927682130080253, "time_sec": 41.73953866958618 }, { "epoch": 27, "train_loss": 5.241074298706055, "train_acc": 0.00908, "test_loss": 5.877811084747314, "test_acc": 0.01, "lyapunov": 1.4511035900286702, "grad_norm": 0.11653593515355255, "grad_max_sv": 0.057695817202329636, "grad_min_sv": 2.245335846475005e-19, "grad_condition": 57695796508.56338, "lr": 0.0009221639627510072, "time_sec": 41.77058434486389 }, { "epoch": 28, "train_loss": 5.231804114685058, "train_acc": 0.00918, "test_loss": 5.65352537612915, "test_acc": 0.01, "lyapunov": 1.4424795046486818, "grad_norm": 0.11846210716711081, "grad_max_sv": 0.05332653652876616, "grad_min_sv": 1.997381835377637e-16, "grad_condition": 53305647188.1228, "lr": 0.0009164606203550494, "time_sec": 41.764750957489014 }, { "epoch": 29, "train_loss": 5.262847916870117, "train_acc": 0.01024, "test_loss": 6.106614427185058, "test_acc": 0.01, "lyapunov": 1.4771753000786236, "grad_norm": 0.12029871369481651, "grad_max_sv": 0.04656773656606674, "grad_min_sv": 3.853570776893247e-46, "grad_condition": 46567736566.06674, "lr": 0.0009105746045668516, "time_sec": 41.72984552383423 }, { "epoch": 30, "train_loss": 5.23929132598877, "train_acc": 0.00934, "test_loss": 5.9899550048828125, "test_acc": 0.01, "lyapunov": 1.4511136694637405, "grad_norm": 0.11304905556902457, "grad_max_sv": 0.047783416556194426, "grad_min_sv": 9.917357230877788e-21, "grad_condition": 47783415656.63218, "lr": 0.0009045084971874733, "time_sec": 41.7406222820282 }, { "epoch": 31, "train_loss": 5.248380351104736, "train_acc": 0.01028, "test_loss": 5.734669494628906, "test_acc": 0.01, "lyapunov": 1.461517483986857, "grad_norm": 0.10074340116724037, "grad_max_sv": 0.034037844324484465, "grad_min_sv": 0.0, "grad_condition": 34037844324.484474, "lr": 0.0008982649590120977, "time_sec": 41.74093008041382 }, { "epoch": 32, "train_loss": 5.236619085388184, "train_acc": 0.00984, "test_loss": 5.793693973541259, "test_acc": 0.01, "lyapunov": 1.4490889871821684, "grad_norm": 0.10695665831734988, "grad_max_sv": 0.04561040163971484, "grad_min_sv": 0.0, "grad_condition": 45610401639.71483, "lr": 0.0008918467286629196, "time_sec": 41.984901666641235 }, { "epoch": 33, "train_loss": 5.23296120513916, "train_acc": 0.00958, "test_loss": 5.439259308624267, "test_acc": 0.01, "lyapunov": 1.444964089661913, "grad_norm": 0.10554551126822227, "grad_max_sv": 0.042046601651236415, "grad_min_sv": 0.0, "grad_condition": 42046601651.23641, "lr": 0.0008852566213878943, "time_sec": 41.770121335983276 }, { "epoch": 34, "train_loss": 5.236159170837403, "train_acc": 0.00974, "test_loss": 5.683465595245361, "test_acc": 0.01, "lyapunov": 1.44912754269817, "grad_norm": 0.10158597595404413, "grad_max_sv": 0.0364499366376549, "grad_min_sv": 0.0, "grad_condition": 36449936637.6549, "lr": 0.000878497527825878, "time_sec": 41.73541307449341 }, { "epoch": 35, "train_loss": 5.244431438751221, "train_acc": 0.00982, "test_loss": 5.822091407775879, "test_acc": 0.01, "lyapunov": 1.4579007311550247, "grad_norm": 0.10227185751901953, "grad_max_sv": 0.04079357534646988, "grad_min_sv": 0.0, "grad_condition": 40793575346.46987, "lr": 0.000871572412738697, "time_sec": 41.72771143913269 }, { "epoch": 36, "train_loss": 5.242595237579346, "train_acc": 0.00948, "test_loss": 5.712351992797852, "test_acc": 0.01, "lyapunov": 1.4565396217433997, "grad_norm": 0.09594442137602498, "grad_max_sv": 0.023863840941339733, "grad_min_sv": 0.0, "grad_condition": 23863840941.33973, "lr": 0.0008644843137107055, "time_sec": 41.679956674575806 }, { "epoch": 37, "train_loss": 5.25272214477539, "train_acc": 0.00774, "test_loss": 5.519532617950439, "test_acc": 0.01, "lyapunov": 1.4673221968019101, "grad_norm": 0.09989553017175994, "grad_max_sv": 0.01326487297192216, "grad_min_sv": 0.0, "grad_condition": 13264872971.922161, "lr": 0.0008572363398164014, "time_sec": 41.665099143981934 }, { "epoch": 38, "train_loss": 5.239593379211426, "train_acc": 0.00894, "test_loss": 5.685215021514892, "test_acc": 0.01, "lyapunov": 1.4529655787646008, "grad_norm": 0.09888602041808069, "grad_max_sv": 0.03386777136474848, "grad_min_sv": 0.0, "grad_condition": 33867771364.748474, "lr": 0.0008498316702566826, "time_sec": 41.71084642410278 }, { "epoch": 39, "train_loss": 5.24351258758545, "train_acc": 0.00926, "test_loss": 5.718768641662598, "test_acc": 0.01, "lyapunov": 1.4566386227717485, "grad_norm": 0.10344101016289994, "grad_max_sv": 0.04082807558588684, "grad_min_sv": 0.0, "grad_condition": 40828075585.886826, "lr": 0.0008422735529643442, "time_sec": 41.73838138580322 }, { "epoch": 40, "train_loss": 5.241183159027099, "train_acc": 0.00956, "test_loss": 5.497510899353028, "test_acc": 0.01, "lyapunov": 1.4553583491488795, "grad_norm": 0.09390993405990472, "grad_max_sv": 0.015733347134664656, "grad_min_sv": 0.0, "grad_condition": 15733347134.664654, "lr": 0.0008345653031794289, "time_sec": 41.734697580337524 }, { "epoch": 41, "train_loss": 5.242352604675293, "train_acc": 0.00974, "test_loss": 5.167651419830322, "test_acc": 0.01, "lyapunov": 1.454840253076285, "grad_norm": 0.11429776991375327, "grad_max_sv": 0.05544604551978409, "grad_min_sv": 2.0339863136307694e-16, "grad_condition": 55425910698.75984, "lr": 0.0008267103019950526, "time_sec": 41.75088906288147 }, { "epoch": 42, "train_loss": 5.242215647735596, "train_acc": 0.00988, "test_loss": 5.260814582824707, "test_acc": 0.01, "lyapunov": 1.4554345080309816, "grad_norm": 0.10783002802519942, "grad_max_sv": 0.04959035101346672, "grad_min_sv": 4.912822630335892e-20, "grad_condition": 49590347491.3975, "lr": 0.0008187119948743447, "time_sec": 41.73639273643494 }, { "epoch": 43, "train_loss": 5.244567107543945, "train_acc": 0.01008, "test_loss": 4.993986747741699, "test_acc": 0.01, "lyapunov": 1.4585875352020459, "grad_norm": 0.10047934695930735, "grad_max_sv": 0.03824934270232916, "grad_min_sv": 3.853570776893247e-46, "grad_condition": 38249342702.329155, "lr": 0.000810573890139155, "time_sec": 41.74794268608093 }, { "epoch": 44, "train_loss": 5.244575652618408, "train_acc": 0.0093, "test_loss": 4.9594275024414065, "test_acc": 0.01, "lyapunov": 1.4588656959021489, "grad_norm": 0.09576972429911833, "grad_max_sv": 0.031089681945741177, "grad_min_sv": 0.0, "grad_condition": 31089681945.741173, "lr": 0.0008022995574311873, "time_sec": 41.72138214111328 }, { "epoch": 45, "train_loss": 5.2458512478637696, "train_acc": 0.00958, "test_loss": 4.983256524658203, "test_acc": 0.01, "lyapunov": 1.460322377017087, "grad_norm": 0.09632514814173115, "grad_max_sv": 0.02758595086634159, "grad_min_sv": 0.0, "grad_condition": 27585950866.34159, "lr": 0.0007938926261462363, "time_sec": 41.73388934135437 }, { "epoch": 46, "train_loss": 5.245156242980957, "train_acc": 0.00914, "test_loss": 5.5051834045410155, "test_acc": 0.01, "lyapunov": 1.459906402451303, "grad_norm": 0.09376667391500292, "grad_max_sv": 0.017312733735889197, "grad_min_sv": 0.0, "grad_condition": 17312733735.8892, "lr": 0.0007853567838422158, "time_sec": 41.682612657547 }, { "epoch": 47, "train_loss": 5.24946335647583, "train_acc": 0.0092, "test_loss": 5.037567407989502, "test_acc": 0.01, "lyapunov": 1.464009671260024, "grad_norm": 0.09467776161020446, "grad_max_sv": 0.01866090311668813, "grad_min_sv": 0.0, "grad_condition": 18660903116.688133, "lr": 0.0007766957746216719, "time_sec": 41.71859622001648 }, { "epoch": 48, "train_loss": 5.2716734535217284, "train_acc": 0.00954, "test_loss": 4.725313116455078, "test_acc": 0.01, "lyapunov": 1.4846527972794554, "grad_norm": 0.12086822830734321, "grad_max_sv": 0.020449956133961677, "grad_min_sv": 0.0, "grad_condition": 20449956133.961678, "lr": 0.0007679133974894982, "time_sec": 41.662288427352905 }, { "epoch": 49, "train_loss": 5.264281662597656, "train_acc": 0.0094, "test_loss": 4.704328326416015, "test_acc": 0.01, "lyapunov": 1.4808302587255493, "grad_norm": 0.1006442361474557, "grad_max_sv": 0.003648173250257969, "grad_min_sv": 0.0, "grad_condition": 3648173250.257969, "lr": 0.000759013504686565, "time_sec": 41.659945011138916 }, { "epoch": 50, "train_loss": 5.260963584136963, "train_acc": 0.00864, "test_loss": 4.687705662536621, "test_acc": 0.01, "lyapunov": 1.4764524859845485, "grad_norm": 0.08983274926440024, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007499999999999998, "time_sec": 41.73585891723633 }, { "epoch": 51, "train_loss": 5.254029862213135, "train_acc": 0.00892, "test_loss": 4.650592637634277, "test_acc": 0.01, "lyapunov": 1.4702172300699727, "grad_norm": 0.08943196133143812, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508575, "time_sec": 41.63914966583252 }, { "epoch": 52, "train_loss": 5.253371743927002, "train_acc": 0.00914, "test_loss": 4.651584497070313, "test_acc": 0.01, "lyapunov": 1.469337931984221, "grad_norm": 0.09050035162045282, "grad_max_sv": 0.00823306110687554, "grad_min_sv": 0.0, "grad_condition": 8233061106.875539, "lr": 0.0007316480175599307, "time_sec": 41.676894187927246 }, { "epoch": 53, "train_loss": 5.25479355255127, "train_acc": 0.00884, "test_loss": 4.6638921875, "test_acc": 0.01, "lyapunov": 1.4709156809560477, "grad_norm": 0.0923409314747527, "grad_max_sv": 0.01720760380849242, "grad_min_sv": 0.0, "grad_condition": 17207603808.492424, "lr": 0.0007223175895924635, "time_sec": 41.68897199630737 }, { "epoch": 54, "train_loss": 5.255663233642578, "train_acc": 0.0087, "test_loss": 4.690281636047363, "test_acc": 0.01, "lyapunov": 1.4720432532717809, "grad_norm": 0.09116086408440177, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 41.65702509880066 }, { "epoch": 55, "train_loss": 5.255450089111328, "train_acc": 0.0089, "test_loss": 4.664666540527343, "test_acc": 0.01, "lyapunov": 1.4717262035135723, "grad_norm": 0.08960989934748306, "grad_max_sv": 0.0027584049850702284, "grad_min_sv": 0.0, "grad_condition": 2758404985.0702286, "lr": 0.0007033683215378998, "time_sec": 41.68492293357849 }, { "epoch": 56, "train_loss": 5.25642558013916, "train_acc": 0.00918, "test_loss": 4.672654594421386, "test_acc": 0.01, "lyapunov": 1.4729856798411025, "grad_norm": 0.08842004194228453, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 41.66422128677368 }, { "epoch": 57, "train_loss": 5.256343665313721, "train_acc": 0.00928, "test_loss": 4.675612693786621, "test_acc": 0.01, "lyapunov": 1.4728102668776841, "grad_norm": 0.0894492177832343, "grad_max_sv": 0.003824355313554406, "grad_min_sv": 0.0, "grad_condition": 3824355313.554406, "lr": 0.0006840622763423388, "time_sec": 41.66166043281555 }, { "epoch": 58, "train_loss": 5.256470738372803, "train_acc": 0.00846, "test_loss": 4.673555949401855, "test_acc": 0.01, "lyapunov": 1.473022796918669, "grad_norm": 0.09415093095699927, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006742860236609073, "time_sec": 41.72664546966553 }, { "epoch": 59, "train_loss": 5.257105118560791, "train_acc": 0.0089, "test_loss": 4.662265467834473, "test_acc": 0.01, "lyapunov": 1.4737855485638085, "grad_norm": 0.08933320536804817, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006644333233692913, "time_sec": 41.683704137802124 }, { "epoch": 60, "train_loss": 5.2567843800354, "train_acc": 0.00894, "test_loss": 4.67973249130249, "test_acc": 0.01, "lyapunov": 1.4734186650542043, "grad_norm": 0.08845010319296705, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874734, "time_sec": 41.65764546394348 }, { "epoch": 61, "train_loss": 5.2586814794921874, "train_acc": 0.00832, "test_loss": 4.66929153137207, "test_acc": 0.01, "lyapunov": 1.4755458350071822, "grad_norm": 0.08796570828809193, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006445158984722354, "time_sec": 41.66641640663147 }, { "epoch": 62, "train_loss": 5.257138239135743, "train_acc": 0.00822, "test_loss": 4.672049102783203, "test_acc": 0.01, "lyapunov": 1.4738077528946234, "grad_norm": 0.08897000656850247, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 41.66154670715332 }, { "epoch": 63, "train_loss": 5.25840109664917, "train_acc": 0.00872, "test_loss": 4.668118723297119, "test_acc": 0.01, "lyapunov": 1.4752026089012165, "grad_norm": 0.08994871774610383, "grad_max_sv": 0.0018751383759081364, "grad_min_sv": 0.0, "grad_condition": 1875138375.9081364, "lr": 0.0006243449435824269, "time_sec": 41.65010213851929 }, { "epoch": 64, "train_loss": 5.259331801910401, "train_acc": 0.009, "test_loss": 4.6509183990478515, "test_acc": 0.01, "lyapunov": 1.4761373133915465, "grad_norm": 0.09230518416704733, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 41.68602395057678 }, { "epoch": 65, "train_loss": 5.259325382080078, "train_acc": 0.00842, "test_loss": 4.649483604431152, "test_acc": 0.01, "lyapunov": 1.4762441697327986, "grad_norm": 0.09181035955304583, "grad_max_sv": 0.002657032757997513, "grad_min_sv": 0.0, "grad_condition": 2657032757.997513, "lr": 0.0006039558454088793, "time_sec": 41.649319648742676 }, { "epoch": 66, "train_loss": 5.258703485870361, "train_acc": 0.0089, "test_loss": 4.659050286865234, "test_acc": 0.01, "lyapunov": 1.475566557911046, "grad_norm": 0.08911107124283034, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 41.66279911994934 }, { "epoch": 67, "train_loss": 5.258656344146728, "train_acc": 0.00868, "test_loss": 4.652145028686523, "test_acc": 0.01, "lyapunov": 1.4755408843155102, "grad_norm": 0.08984660357930904, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 41.65086126327515 }, { "epoch": 68, "train_loss": 5.259207654724121, "train_acc": 0.00934, "test_loss": 4.644708920288086, "test_acc": 0.01, "lyapunov": 1.476156848470878, "grad_norm": 0.08930414014303266, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005730415142812054, "time_sec": 41.6753249168396 }, { "epoch": 69, "train_loss": 5.259739582061767, "train_acc": 0.00962, "test_loss": 4.635655142974853, "test_acc": 0.01, "lyapunov": 1.4767807136716136, "grad_norm": 0.08868883564267036, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 41.6395525932312 }, { "epoch": 70, "train_loss": 5.258972863311768, "train_acc": 0.0098, "test_loss": 4.630142547607422, "test_acc": 0.01, "lyapunov": 1.4758698986009564, "grad_norm": 0.08847186803439672, "grad_max_sv": 0.0013374987989664077, "grad_min_sv": 0.0, "grad_condition": 1337498798.9664078, "lr": 0.0005522642316338265, "time_sec": 41.64910697937012 }, { "epoch": 71, "train_loss": 5.259250410003662, "train_acc": 0.00816, "test_loss": 4.623734491729737, "test_acc": 0.01, "lyapunov": 1.4762009812133086, "grad_norm": 0.0884158256705388, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005418389216661573, "time_sec": 41.65673208236694 }, { "epoch": 72, "train_loss": 5.260035207519532, "train_acc": 0.00856, "test_loss": 4.622923696899414, "test_acc": 0.01, "lyapunov": 1.4770802146638446, "grad_norm": 0.08974113871672654, "grad_max_sv": 0.00768307838588953, "grad_min_sv": 0.0, "grad_condition": 7683078385.889531, "lr": 0.0005313952597646563, "time_sec": 41.65725779533386 }, { "epoch": 73, "train_loss": 5.258972092895508, "train_acc": 0.0089, "test_loss": 4.627894605255127, "test_acc": 0.01, "lyapunov": 1.4759459010780316, "grad_norm": 0.08863002112233408, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005209378268645994, "time_sec": 41.67947006225586 }, { "epoch": 74, "train_loss": 5.260160232849121, "train_acc": 0.00854, "test_loss": 4.623137206268311, "test_acc": 0.01, "lyapunov": 1.4772573081428741, "grad_norm": 0.09051043005437374, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005104712099416781, "time_sec": 41.64360570907593 }, { "epoch": 75, "train_loss": 5.261452306213379, "train_acc": 0.0086, "test_loss": 4.62108766708374, "test_acc": 0.01, "lyapunov": 1.478764491617832, "grad_norm": 0.08870478754258258, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 41.64626455307007 }, { "epoch": 76, "train_loss": 5.2611726042175295, "train_acc": 0.00886, "test_loss": 4.623955220794678, "test_acc": 0.01, "lyapunov": 1.4784429673953434, "grad_norm": 0.08878094000275963, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 41.656346797943115 }, { "epoch": 77, "train_loss": 5.261820520782471, "train_acc": 0.00874, "test_loss": 4.61466668548584, "test_acc": 0.01, "lyapunov": 1.479163033273214, "grad_norm": 0.088273880644991, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004790621731353997, "time_sec": 41.629544734954834 }, { "epoch": 78, "train_loss": 5.262518656311035, "train_acc": 0.00864, "test_loss": 4.618248620605469, "test_acc": 0.01, "lyapunov": 1.4799401089358513, "grad_norm": 0.08861130102060333, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 41.636940240859985 }, { "epoch": 79, "train_loss": 5.262553581237793, "train_acc": 0.009, "test_loss": 4.612181239318848, "test_acc": 0.01, "lyapunov": 1.4799358280723358, "grad_norm": 0.0903783960157925, "grad_max_sv": 0.01033918051980436, "grad_min_sv": 0.0, "grad_condition": 10339180519.80436, "lr": 0.00045816107833384175, "time_sec": 41.68020677566528 }, { "epoch": 80, "train_loss": 5.261878743896484, "train_acc": 0.00886, "test_loss": 4.612385320281982, "test_acc": 0.01, "lyapunov": 1.4792317411173945, "grad_norm": 0.08815903777083657, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 41.65713667869568 }, { "epoch": 81, "train_loss": 5.270162540740967, "train_acc": 0.00948, "test_loss": 4.61169965209961, "test_acc": 0.01, "lyapunov": 1.4845762399151503, "grad_norm": 0.08933321451984454, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 41.67780160903931 }, { "epoch": 82, "train_loss": 5.261875872955322, "train_acc": 0.00904, "test_loss": 4.612089576721192, "test_acc": 0.01, "lyapunov": 1.47926344438587, "grad_norm": 0.08839554451712253, "grad_max_sv": 0.0006388438399881124, "grad_min_sv": 0.0, "grad_condition": 638843839.9881124, "lr": 0.0004269584857187939, "time_sec": 41.646398305892944 }, { "epoch": 83, "train_loss": 5.260851752319336, "train_acc": 0.00926, "test_loss": 4.605935791778564, "test_acc": 0.01, "lyapunov": 1.4780823766727886, "grad_norm": 0.08881372923156301, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004166156266419484, "time_sec": 41.64280557632446 }, { "epoch": 84, "train_loss": 5.261813834838867, "train_acc": 0.0087, "test_loss": 4.608912050628662, "test_acc": 0.01, "lyapunov": 1.4791915989897746, "grad_norm": 0.08828411260554986, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 41.650211811065674 }, { "epoch": 85, "train_loss": 5.26105229888916, "train_acc": 0.00876, "test_loss": 4.607143463134766, "test_acc": 0.01, "lyapunov": 1.4783552308826495, "grad_norm": 0.08801037770330913, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003960441545911199, "time_sec": 41.64579463005066 }, { "epoch": 86, "train_loss": 5.262948518676758, "train_acc": 0.0089, "test_loss": 4.605761601257324, "test_acc": 0.01, "lyapunov": 1.4804744302769146, "grad_norm": 0.08824824639135734, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 41.694432497024536 }, { "epoch": 87, "train_loss": 5.261626904449463, "train_acc": 0.00888, "test_loss": 4.605769618988037, "test_acc": 0.01, "lyapunov": 1.4789858986349667, "grad_norm": 0.08846494510980996, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 41.681015491485596 }, { "epoch": 88, "train_loss": 5.262741643371582, "train_acc": 0.00854, "test_loss": 4.60517066192627, "test_acc": 0.01, "lyapunov": 1.4802151354377533, "grad_norm": 0.08805740561566744, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 41.71163582801819 }, { "epoch": 89, "train_loss": 5.263213445281982, "train_acc": 0.00854, "test_loss": 4.605359262847901, "test_acc": 0.01, "lyapunov": 1.480777892005413, "grad_norm": 0.08816151399502117, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 41.67105174064636 }, { "epoch": 90, "train_loss": 5.262189238433838, "train_acc": 0.00928, "test_loss": 4.605318756103515, "test_acc": 0.01, "lyapunov": 1.4796337014269036, "grad_norm": 0.08930367772167215, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 41.640591859817505 }, { "epoch": 91, "train_loss": 5.261863013916016, "train_acc": 0.00846, "test_loss": 4.605316780853271, "test_acc": 0.01, "lyapunov": 1.4792772080282421, "grad_norm": 0.08825121039889311, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 41.705339193344116 }, { "epoch": 92, "train_loss": 5.263724805908203, "train_acc": 0.0084, "test_loss": 4.605317385101318, "test_acc": 0.01, "lyapunov": 1.4813950381925345, "grad_norm": 0.0876042035379079, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 41.64047455787659 }, { "epoch": 93, "train_loss": 5.263348481750488, "train_acc": 0.00826, "test_loss": 4.605170777893067, "test_acc": 0.01, "lyapunov": 1.480857576250725, "grad_norm": 0.09205208782948476, "grad_max_sv": 0.007683574734255671, "grad_min_sv": 0.0, "grad_condition": 7683574734.2556715, "lr": 0.00031593772365766094, "time_sec": 41.66976022720337 }, { "epoch": 94, "train_loss": 5.263678814697266, "train_acc": 0.0087, "test_loss": 4.605170695495605, "test_acc": 0.01, "lyapunov": 1.481314537775181, "grad_norm": 0.09018876116473232, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 41.65629434585571 }, { "epoch": 95, "train_loss": 5.262105151977539, "train_acc": 0.00832, "test_loss": 4.605170751190186, "test_acc": 0.01, "lyapunov": 1.479619727110314, "grad_norm": 0.08829391493330081, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 41.637601375579834 }, { "epoch": 96, "train_loss": 5.261454503326416, "train_acc": 0.00892, "test_loss": 4.605170954895019, "test_acc": 0.01, "lyapunov": 1.4788271173491807, "grad_norm": 0.08829025030553274, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 41.64588212966919 }, { "epoch": 97, "train_loss": 5.2617424992370605, "train_acc": 0.00796, "test_loss": 4.605170453643799, "test_acc": 0.01, "lyapunov": 1.4791636610275034, "grad_norm": 0.08832466346515266, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 41.67742967605591 }, { "epoch": 98, "train_loss": 5.263716314086914, "train_acc": 0.00858, "test_loss": 4.605170697784424, "test_acc": 0.01, "lyapunov": 1.4813884213147566, "grad_norm": 0.08840081765609732, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 41.668766260147095 }, { "epoch": 99, "train_loss": 5.263833166656494, "train_acc": 0.0087, "test_loss": 4.605170695495605, "test_acc": 0.01, "lyapunov": 1.4815085251313036, "grad_norm": 0.08792820202741711, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 41.66829442977905 }, { "epoch": 100, "train_loss": 5.262581251525879, "train_acc": 0.00938, "test_loss": 4.605170309448242, "test_acc": 0.01, "lyapunov": 1.480138891188385, "grad_norm": 0.08832421824906611, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 41.68127655982971 }, { "epoch": 101, "train_loss": 5.263155633087158, "train_acc": 0.00926, "test_loss": 4.605170729064941, "test_acc": 0.01, "lyapunov": 1.480774727928669, "grad_norm": 0.08869235909302142, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 41.64776301383972 }, { "epoch": 102, "train_loss": 5.263860197906494, "train_acc": 0.00848, "test_loss": 4.6051703002929685, "test_acc": 0.01, "lyapunov": 1.4815483535342204, "grad_norm": 0.08903961910912474, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 41.674145460128784 }, { "epoch": 103, "train_loss": 5.262970734710693, "train_acc": 0.00884, "test_loss": 4.605170517730713, "test_acc": 0.01, "lyapunov": 1.4805596624798787, "grad_norm": 0.08876501131615566, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 41.65722608566284 }, { "epoch": 104, "train_loss": 5.26228626159668, "train_acc": 0.00864, "test_loss": 4.6051704086303715, "test_acc": 0.01, "lyapunov": 1.4798069201466981, "grad_norm": 0.08768680006785402, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 41.67565131187439 }, { "epoch": 105, "train_loss": 5.262674415435791, "train_acc": 0.00838, "test_loss": 4.6051702949523925, "test_acc": 0.01, "lyapunov": 1.480235590654261, "grad_norm": 0.08782166200414132, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 41.69558024406433 }, { "epoch": 106, "train_loss": 5.261244326171875, "train_acc": 0.00838, "test_loss": 4.605170240020752, "test_acc": 0.01, "lyapunov": 1.4786384803864656, "grad_norm": 0.08788578987148214, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 41.650753021240234 }, { "epoch": 107, "train_loss": 5.261433357849121, "train_acc": 0.00904, "test_loss": 4.605170213317871, "test_acc": 0.01, "lyapunov": 1.47886505273297, "grad_norm": 0.08770929414544659, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 41.68164348602295 }, { "epoch": 108, "train_loss": 5.263026925201416, "train_acc": 0.009, "test_loss": 4.60517043762207, "test_acc": 0.01, "lyapunov": 1.480643398621503, "grad_norm": 0.08785423875011682, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 41.660765647888184 }, { "epoch": 109, "train_loss": 5.263078652801513, "train_acc": 0.00816, "test_loss": 4.605601066589355, "test_acc": 0.01, "lyapunov": 1.4807295979136397, "grad_norm": 0.08803442353918925, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 41.66913390159607 }, { "epoch": 110, "train_loss": 5.263812705535889, "train_acc": 0.00886, "test_loss": 4.605602632141113, "test_acc": 0.01, "lyapunov": 1.4815696554110789, "grad_norm": 0.08891727786082522, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 41.659369230270386 }, { "epoch": 111, "train_loss": 5.262115261535644, "train_acc": 0.0078, "test_loss": 4.605170052337646, "test_acc": 0.01, "lyapunov": 1.479651604771919, "grad_norm": 0.08875181240277763, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 41.70141959190369 }, { "epoch": 112, "train_loss": 5.261109837646484, "train_acc": 0.00874, "test_loss": 4.605170468139648, "test_acc": 0.01, "lyapunov": 1.4785008156086172, "grad_norm": 0.08816074014970703, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 41.72004580497742 }, { "epoch": 113, "train_loss": 5.262560579681397, "train_acc": 0.0086, "test_loss": 4.6051704193115235, "test_acc": 0.01, "lyapunov": 1.4801284751623793, "grad_norm": 0.08840941179148938, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 41.699143409729004 }, { "epoch": 114, "train_loss": 5.263074327697754, "train_acc": 0.00886, "test_loss": 4.605170431518554, "test_acc": 0.01, "lyapunov": 1.4807007001793904, "grad_norm": 0.08821068724217689, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 41.67876648902893 }, { "epoch": 115, "train_loss": 5.262186526947022, "train_acc": 0.0086, "test_loss": 4.60517013092041, "test_acc": 0.01, "lyapunov": 1.4797226050320793, "grad_norm": 0.0883831455880719, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 41.696322202682495 }, { "epoch": 116, "train_loss": 5.263145412445068, "train_acc": 0.00836, "test_loss": 4.605170120239258, "test_acc": 0.01, "lyapunov": 1.480826344026629, "grad_norm": 0.08792566727039719, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 41.70669603347778 }, { "epoch": 117, "train_loss": 5.263297129516602, "train_acc": 0.00834, "test_loss": 4.60517033996582, "test_acc": 0.01, "lyapunov": 1.4809697009718326, "grad_norm": 0.0880297462141732, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 41.66155934333801 }, { "epoch": 118, "train_loss": 5.263041806030273, "train_acc": 0.00838, "test_loss": 4.605170127868653, "test_acc": 0.01, "lyapunov": 1.4806942784267922, "grad_norm": 0.0885706870416634, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 41.6468141078949 }, { "epoch": 119, "train_loss": 5.2626050819396974, "train_acc": 0.00882, "test_loss": 4.6051702911376955, "test_acc": 0.01, "lyapunov": 1.4802038822027728, "grad_norm": 0.08805401420662645, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 41.67359256744385 }, { "epoch": 120, "train_loss": 5.262915015411377, "train_acc": 0.00904, "test_loss": 4.605170024108887, "test_acc": 0.01, "lyapunov": 1.4805879507528241, "grad_norm": 0.08796658508917193, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 41.736050844192505 }, { "epoch": 121, "train_loss": 5.263114930877686, "train_acc": 0.0083, "test_loss": 4.605170388031006, "test_acc": 0.01, "lyapunov": 1.4807836167952593, "grad_norm": 0.08806195734422055, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 41.839574337005615 }, { "epoch": 122, "train_loss": 5.262788164825439, "train_acc": 0.00866, "test_loss": 4.605170208740234, "test_acc": 0.01, "lyapunov": 1.4804405013618567, "grad_norm": 0.08816097534558247, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 41.688995599746704 }, { "epoch": 123, "train_loss": 5.26315210357666, "train_acc": 0.00874, "test_loss": 4.60517013168335, "test_acc": 0.01, "lyapunov": 1.480828346498787, "grad_norm": 0.08865951427268862, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 41.67227745056152 }, { "epoch": 124, "train_loss": 5.261944111022949, "train_acc": 0.00914, "test_loss": 4.605170402526856, "test_acc": 0.01, "lyapunov": 1.4794809848756132, "grad_norm": 0.08788803702349164, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 41.66115140914917 }, { "epoch": 125, "train_loss": 5.262568561401367, "train_acc": 0.0084, "test_loss": 4.60517010345459, "test_acc": 0.01, "lyapunov": 1.4801926018331972, "grad_norm": 0.08788675914126909, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 41.66165113449097 }, { "epoch": 126, "train_loss": 5.262280065460205, "train_acc": 0.00902, "test_loss": 4.605170187377929, "test_acc": 0.01, "lyapunov": 1.479902151295596, "grad_norm": 0.08819775554912056, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 41.69537806510925 }, { "epoch": 127, "train_loss": 5.263674239196777, "train_acc": 0.00884, "test_loss": 4.605170446777343, "test_acc": 0.01, "lyapunov": 1.48142600425369, "grad_norm": 0.08796249954554257, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 41.79696488380432 }, { "epoch": 128, "train_loss": 5.270508392181396, "train_acc": 0.00774, "test_loss": 4.6051702003479, "test_acc": 0.01, "lyapunov": 1.4854568767425653, "grad_norm": 0.0903277044807366, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 41.78498363494873 }, { "epoch": 129, "train_loss": 5.264521000213623, "train_acc": 0.00884, "test_loss": 4.60517049331665, "test_acc": 0.01, "lyapunov": 1.4823556894536518, "grad_norm": 0.08791573530006377, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 41.75825619697571 }, { "epoch": 130, "train_loss": 5.263497207641602, "train_acc": 0.00856, "test_loss": 4.605170115661621, "test_acc": 0.01, "lyapunov": 1.4812386575562264, "grad_norm": 0.08821103937271832, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 41.753769874572754 }, { "epoch": 131, "train_loss": 5.262869830932617, "train_acc": 0.00886, "test_loss": 4.605170347595215, "test_acc": 0.01, "lyapunov": 1.4805735938079523, "grad_norm": 0.08785954608269858, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 41.688891649246216 }, { "epoch": 132, "train_loss": 5.261720856323242, "train_acc": 0.0092, "test_loss": 4.605170230865479, "test_acc": 0.01, "lyapunov": 1.4792467572195145, "grad_norm": 0.087651258765062, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 41.77381873130798 }, { "epoch": 133, "train_loss": 5.262511810150147, "train_acc": 0.0094, "test_loss": 4.605170274353028, "test_acc": 0.01, "lyapunov": 1.480145969354283, "grad_norm": 0.08750516435565067, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 41.82425284385681 }, { "epoch": 134, "train_loss": 5.2628221615600586, "train_acc": 0.009, "test_loss": 4.605170260620117, "test_acc": 0.01, "lyapunov": 1.480488061295141, "grad_norm": 0.08767200957157907, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 41.67008709907532 }, { "epoch": 135, "train_loss": 5.262214541320801, "train_acc": 0.00906, "test_loss": 4.605170357513428, "test_acc": 0.01, "lyapunov": 1.479800993524244, "grad_norm": 0.08833622992837174, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 41.68112754821777 }, { "epoch": 136, "train_loss": 5.261716612854004, "train_acc": 0.00888, "test_loss": 4.605170449829101, "test_acc": 0.01, "lyapunov": 1.4792663523608156, "grad_norm": 0.0879915508382305, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 41.70846509933472 }, { "epoch": 137, "train_loss": 5.2621297309875485, "train_acc": 0.00882, "test_loss": 4.6051704208374025, "test_acc": 0.01, "lyapunov": 1.4797221123410003, "grad_norm": 0.08806309329797692, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 41.68800139427185 }, { "epoch": 138, "train_loss": 5.262034148254394, "train_acc": 0.009, "test_loss": 4.6051704246520995, "test_acc": 0.01, "lyapunov": 1.4796448052691682, "grad_norm": 0.08834842868525353, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 41.69483256340027 }, { "epoch": 139, "train_loss": 5.262303157958985, "train_acc": 0.00964, "test_loss": 4.605170336914062, "test_acc": 0.01, "lyapunov": 1.479908719696962, "grad_norm": 0.08774925576434625, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 41.66975927352905 }, { "epoch": 140, "train_loss": 5.262272278747559, "train_acc": 0.0093, "test_loss": 4.60517025756836, "test_acc": 0.01, "lyapunov": 1.4799000518706145, "grad_norm": 0.08772068441716457, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 41.66502594947815 }, { "epoch": 141, "train_loss": 5.262688246459961, "train_acc": 0.01, "test_loss": 4.605170532226563, "test_acc": 0.01, "lyapunov": 1.4803482586770411, "grad_norm": 0.08814041677323237, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 41.68389272689819 }, { "epoch": 142, "train_loss": 5.2666687211608885, "train_acc": 0.01, "test_loss": 4.605170266723633, "test_acc": 0.01, "lyapunov": 1.4834284483624236, "grad_norm": 0.08808456177000348, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 41.70149374008179 }, { "epoch": 143, "train_loss": 5.2625910409545895, "train_acc": 0.00962, "test_loss": 4.605170193481445, "test_acc": 0.01, "lyapunov": 1.4802313485108982, "grad_norm": 0.08826750361435122, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 41.675010204315186 }, { "epoch": 144, "train_loss": 5.260678899536133, "train_acc": 0.01, "test_loss": 4.60517022857666, "test_acc": 0.01, "lyapunov": 1.4781028556701776, "grad_norm": 0.08826672055694883, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 41.67730474472046 }, { "epoch": 145, "train_loss": 5.262034167785645, "train_acc": 0.01, "test_loss": 4.605170384216309, "test_acc": 0.01, "lyapunov": 1.47965680668726, "grad_norm": 0.08792698291184464, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 41.711742639541626 }, { "epoch": 146, "train_loss": 5.262125458984375, "train_acc": 0.01, "test_loss": 4.605170105743408, "test_acc": 0.01, "lyapunov": 1.4797236641959461, "grad_norm": 0.0878274682773103, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 41.72946882247925 }, { "epoch": 147, "train_loss": 5.263207815246582, "train_acc": 0.01, "test_loss": 4.605170260620117, "test_acc": 0.01, "lyapunov": 1.4809288390152289, "grad_norm": 0.08780070915999844, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 41.724937438964844 }, { "epoch": 148, "train_loss": 5.262101231384277, "train_acc": 0.01, "test_loss": 4.605170335388183, "test_acc": 0.01, "lyapunov": 1.4797268191261974, "grad_norm": 0.08811462011437057, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 41.86608529090881 }, { "epoch": 149, "train_loss": 5.26564047592163, "train_acc": 0.01, "test_loss": 4.605170273590088, "test_acc": 0.01, "lyapunov": 1.4827746887646063, "grad_norm": 0.088563737069616, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 41.668235540390015 }, { "epoch": 150, "train_loss": 5.263033789978027, "train_acc": 0.01, "test_loss": 4.605170249176026, "test_acc": 0.01, "lyapunov": 1.480735678197173, "grad_norm": 0.08808051231477661, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 41.65666699409485 } ], "8": [ { "epoch": 1, "train_loss": 5.146603754577637, "train_acc": 0.02116, "test_loss": 4.799143431091308, "test_acc": 0.0147, "lyapunov": 2.247725067846001, "grad_norm": 5.759558294617595, "grad_max_sv": 4.593458223342895, "grad_min_sv": 9.939812799508729e-08, "grad_condition": 84468621.05560377, "lr": 0.0009998903417374227, "time_sec": 86.99692106246948 }, { "epoch": 2, "train_loss": 4.751044019317627, "train_acc": 0.0261, "test_loss": 4.781899060058594, "test_acc": 0.0112, "lyapunov": 1.7586963832225946, "grad_norm": 3.669503755077576, "grad_max_sv": 2.629068848490715, "grad_min_sv": 6.128463263532779e-08, "grad_condition": 51408050.19515464, "lr": 0.0009995614150494292, "time_sec": 86.99053359031677 }, { "epoch": 3, "train_loss": 4.5855533428955075, "train_acc": 0.0302, "test_loss": 4.783446264648438, "test_acc": 0.0204, "lyapunov": 1.650954161458613, "grad_norm": 1.8760355114337364, "grad_max_sv": 1.30306978225708, "grad_min_sv": 3.0873310079282404e-08, "grad_condition": 74135293.70537718, "lr": 0.0009990133642141358, "time_sec": 87.01290392875671 }, { "epoch": 4, "train_loss": 4.534848844451904, "train_acc": 0.03702, "test_loss": 4.8837289710998535, "test_acc": 0.0149, "lyapunov": 1.5894556011995087, "grad_norm": 1.244556287523884, "grad_max_sv": 0.7792816802859306, "grad_min_sv": 1.8834766013497984e-08, "grad_condition": 45093330.72508425, "lr": 0.0009982464296247522, "time_sec": 87.01876306533813 }, { "epoch": 5, "train_loss": 4.592422800903321, "train_acc": 0.03296, "test_loss": 4.848946441650391, "test_acc": 0.0145, "lyapunov": 1.5674470586849905, "grad_norm": 0.9784603406000693, "grad_max_sv": 0.5906251654028892, "grad_min_sv": 1.3135394039365212e-08, "grad_condition": 2765173736.408195, "lr": 0.0009972609476841367, "time_sec": 87.06145668029785 }, { "epoch": 6, "train_loss": 4.617396930847168, "train_acc": 0.03438, "test_loss": 5.069504800415039, "test_acc": 0.0141, "lyapunov": 1.5743840259054434, "grad_norm": 0.8765996249293907, "grad_max_sv": 0.4905373930931091, "grad_min_sv": 1.1570106956413153e-08, "grad_condition": 490506519.64879054, "lr": 0.000996057350657239, "time_sec": 86.98913550376892 }, { "epoch": 7, "train_loss": 4.673418109436035, "train_acc": 0.03144, "test_loss": 5.083357322692871, "test_acc": 0.01, "lyapunov": 1.5757776337206517, "grad_norm": 0.842980463237632, "grad_max_sv": 0.4635330677032471, "grad_min_sv": 9.801791714218744e-09, "grad_condition": 672093861.9243783, "lr": 0.000994636166481494, "time_sec": 87.02865362167358 }, { "epoch": 8, "train_loss": 4.715173123626709, "train_acc": 0.02866, "test_loss": 6.969320404052734, "test_acc": 0.01, "lyapunov": 1.572990819621269, "grad_norm": 0.7658102895010526, "grad_max_sv": 0.39840318709611894, "grad_min_sv": 7.909037175684143e-09, "grad_condition": 2689350489.23699, "lr": 0.0009929980185352525, "time_sec": 87.05855631828308 }, { "epoch": 9, "train_loss": 4.719650735931396, "train_acc": 0.03378, "test_loss": 6.69895283203125, "test_acc": 0.01, "lyapunov": 1.5739632753459998, "grad_norm": 0.6951362665980956, "grad_max_sv": 0.40656831562519075, "grad_min_sv": 9.631129597315046e-09, "grad_condition": 152979631.4939035, "lr": 0.0009911436253643444, "time_sec": 87.04356169700623 }, { "epoch": 10, "train_loss": 4.785277546691894, "train_acc": 0.03084, "test_loss": 7.56282477722168, "test_acc": 0.01, "lyapunov": 1.5731478392925409, "grad_norm": 0.8027087514422708, "grad_max_sv": 0.4249536793678999, "grad_min_sv": 1.0233699096961427e-08, "grad_condition": 2212458832.3035727, "lr": 0.0009890738003669028, "time_sec": 86.9918863773346 }, { "epoch": 11, "train_loss": 4.85365997543335, "train_acc": 0.02776, "test_loss": 6.083891798400879, "test_acc": 0.01, "lyapunov": 1.594173707315684, "grad_norm": 0.6228665658651402, "grad_max_sv": 0.3807309426367283, "grad_min_sv": 7.858218521034076e-09, "grad_condition": 142247255.9097917, "lr": 0.00098678945143658, "time_sec": 87.02730226516724 }, { "epoch": 12, "train_loss": 4.936503148193359, "train_acc": 0.02734, "test_loss": 4.648137149047852, "test_acc": 0.01, "lyapunov": 1.6324983204112333, "grad_norm": 0.8180108242362618, "grad_max_sv": 0.3168713390827179, "grad_min_sv": 6.217847966746067e-09, "grad_condition": 1904828726.2920518, "lr": 0.0009842915805643154, "time_sec": 86.98762059211731 }, { "epoch": 13, "train_loss": 4.989127286529541, "train_acc": 0.02624, "test_loss": 5.89718906326294, "test_acc": 0.01, "lyapunov": 1.6513543821051908, "grad_norm": 0.8703418944824507, "grad_max_sv": 0.3535689525306225, "grad_min_sv": 6.494354365393917e-09, "grad_condition": 75061975.40179494, "lr": 0.000981581283398829, "time_sec": 86.99741172790527 }, { "epoch": 14, "train_loss": 5.027360094604492, "train_acc": 0.02734, "test_loss": 5.6859222030639645, "test_acc": 0.01, "lyapunov": 1.66906841667107, "grad_norm": 0.8955015428134906, "grad_max_sv": 0.3326103314757347, "grad_min_sv": 5.961173611852833e-09, "grad_condition": 196184685.20064688, "lr": 0.0009786597487660333, "time_sec": 86.990553855896 }, { "epoch": 15, "train_loss": 5.103685426635742, "train_acc": 0.0235, "test_loss": 4.620827954101562, "test_acc": 0.01, "lyapunov": 1.6500021161325753, "grad_norm": 0.7165299396921548, "grad_max_sv": 0.29206431321799753, "grad_min_sv": 3.742070758853766e-09, "grad_condition": 11821452317.947672, "lr": 0.0009755282581475766, "time_sec": 86.99919128417969 }, { "epoch": 16, "train_loss": 5.046826876983642, "train_acc": 0.02808, "test_loss": 4.618471592712402, "test_acc": 0.01, "lyapunov": 1.6286348086183944, "grad_norm": 0.8805208885120411, "grad_max_sv": 0.34881011955440044, "grad_min_sv": 5.4340508724715075e-09, "grad_condition": 607977502.9364278, "lr": 0.0009721881851187403, "time_sec": 87.02350974082947 }, { "epoch": 17, "train_loss": 5.125038688812256, "train_acc": 0.02188, "test_loss": 5.0374674758911135, "test_acc": 0.01, "lyapunov": 1.6156021630977426, "grad_norm": 0.7664664524159326, "grad_max_sv": 0.31916227340698244, "grad_min_sv": 3.2244314654420098e-09, "grad_condition": 12300439770.56846, "lr": 0.0009686409947459456, "time_sec": 87.0214216709137 }, { "epoch": 18, "train_loss": 5.1917090243530275, "train_acc": 0.02074, "test_loss": 6.239829849243164, "test_acc": 0.01, "lyapunov": 1.6075686880999513, "grad_norm": 0.8340839537949596, "grad_max_sv": 0.2987551841884851, "grad_min_sv": 1.3384357527406395e-09, "grad_condition": 53090691786.99108, "lr": 0.0009648882429441254, "time_sec": 87.0026741027832 }, { "epoch": 19, "train_loss": 5.1467557635498045, "train_acc": 0.02224, "test_loss": 4.859098764038086, "test_acc": 0.01, "lyapunov": 1.5547950270840578, "grad_norm": 0.5424186147523934, "grad_max_sv": 0.2584996819496155, "grad_min_sv": 1.7988151973410667e-10, "grad_condition": 42973213975.62498, "lr": 0.00096093157579425, "time_sec": 87.0099880695343 }, { "epoch": 20, "train_loss": 5.253306176147461, "train_acc": 0.01948, "test_loss": 8.813103515625, "test_acc": 0.01, "lyapunov": 1.5798406722905385, "grad_norm": 0.6790335216715864, "grad_max_sv": 0.2796168942004442, "grad_min_sv": 1.3123472687420754e-09, "grad_condition": 55528903276.005905, "lr": 0.0009567727288213001, "time_sec": 87.00798654556274 }, { "epoch": 21, "train_loss": 5.3828185322570805, "train_acc": 0.01028, "test_loss": 8.961210163879395, "test_acc": 0.01, "lyapunov": 1.566893112933849, "grad_norm": 0.9785357311156059, "grad_max_sv": 0.4175733871757984, "grad_min_sv": 5.038056967646815e-09, "grad_condition": 2576596333.756474, "lr": 0.0009524135262330095, "time_sec": 87.24499773979187 }, { "epoch": 22, "train_loss": 5.318783715209961, "train_acc": 0.01022, "test_loss": 9.226270596313476, "test_acc": 0.01, "lyapunov": 1.515167183888233, "grad_norm": 0.5897187117480035, "grad_max_sv": 0.32070303708314896, "grad_min_sv": 3.3304707929004972e-09, "grad_condition": 145373104.26632357, "lr": 0.0009478558801197061, "time_sec": 87.02501797676086 }, { "epoch": 23, "train_loss": 5.311336210021973, "train_acc": 0.00992, "test_loss": 9.553670106506347, "test_acc": 0.01, "lyapunov": 1.5058710337294947, "grad_norm": 0.42067884050272164, "grad_max_sv": 0.3374065548181534, "grad_min_sv": 3.917849118045824e-09, "grad_condition": 148787617.53453642, "lr": 0.000943101789615607, "time_sec": 87.03109979629517 }, { "epoch": 24, "train_loss": 5.310154438018799, "train_acc": 0.01036, "test_loss": 7.603771569824219, "test_acc": 0.01, "lyapunov": 1.509728124379502, "grad_norm": 0.3834815238141383, "grad_max_sv": 0.3096462905406952, "grad_min_sv": 2.737797575240686e-09, "grad_condition": 22145829075.872944, "lr": 0.0009381533400219313, "time_sec": 86.98246717453003 }, { "epoch": 25, "train_loss": 5.301079537353516, "train_acc": 0.00976, "test_loss": 7.519319520568848, "test_acc": 0.01, "lyapunov": 1.5108507871627808, "grad_norm": 0.30755221598797206, "grad_max_sv": 0.2302608024328947, "grad_min_sv": 2.0953720649433853e-11, "grad_condition": 115571274953.14014, "lr": 0.0009330127018922189, "time_sec": 87.00150752067566 }, { "epoch": 26, "train_loss": 5.2993214897155765, "train_acc": 0.00926, "test_loss": 7.535327529907226, "test_acc": 0.01, "lyapunov": 1.5122191076693328, "grad_norm": 0.2686555081361175, "grad_max_sv": 0.1873680654913187, "grad_min_sv": 1.1968037446042912e-12, "grad_condition": 111356408601.78958, "lr": 0.000927682130080253, "time_sec": 87.06040525436401 }, { "epoch": 27, "train_loss": 5.301115319061279, "train_acc": 0.01026, "test_loss": 7.4256896377563475, "test_acc": 0.01, "lyapunov": 1.5147829875921655, "grad_norm": 0.2584031825672629, "grad_max_sv": 0.18733071088790892, "grad_min_sv": 1.5532640335746842e-12, "grad_condition": 105854162513.72067, "lr": 0.0009221639627510072, "time_sec": 87.0212287902832 }, { "epoch": 28, "train_loss": 5.300986379394531, "train_acc": 0.00912, "test_loss": 7.3856002044677735, "test_acc": 0.01, "lyapunov": 1.5147232972752407, "grad_norm": 0.2414535578672304, "grad_max_sv": 0.16182587593793868, "grad_min_sv": 2.716757690251971e-13, "grad_condition": 139096227622.95874, "lr": 0.0009164606203550494, "time_sec": 87.02124691009521 }, { "epoch": 29, "train_loss": 5.311827180175781, "train_acc": 0.00958, "test_loss": 9.537436566162109, "test_acc": 0.01, "lyapunov": 1.5239817428466913, "grad_norm": 0.2934555140553008, "grad_max_sv": 0.17254459988325835, "grad_min_sv": 7.800315873566188e-13, "grad_condition": 118094677554.4253, "lr": 0.0009105746045668516, "time_sec": 87.02146863937378 }, { "epoch": 30, "train_loss": 5.306949669952393, "train_acc": 0.00986, "test_loss": 9.629324139404297, "test_acc": 0.01, "lyapunov": 1.5190055486186387, "grad_norm": 0.2568362833037679, "grad_max_sv": 0.1871931992471218, "grad_min_sv": 8.733775765521943e-13, "grad_condition": 124328292229.6437, "lr": 0.0009045084971874733, "time_sec": 87.0063271522522 }, { "epoch": 31, "train_loss": 5.317695409240723, "train_acc": 0.00946, "test_loss": 9.857299293518066, "test_acc": 0.01, "lyapunov": 1.5297813034423478, "grad_norm": 0.31967679371455754, "grad_max_sv": 0.17166709154844284, "grad_min_sv": 1.3052075569227142e-12, "grad_condition": 105851795247.06416, "lr": 0.0008982649590120977, "time_sec": 87.03139019012451 }, { "epoch": 32, "train_loss": 5.306474250030518, "train_acc": 0.00946, "test_loss": 6.192124473571777, "test_acc": 0.01, "lyapunov": 1.5204204305663438, "grad_norm": 0.22033885472694253, "grad_max_sv": 0.1525889288634062, "grad_min_sv": 4.756078352149119e-13, "grad_condition": 128078379912.95, "lr": 0.0008918467286629196, "time_sec": 86.99606108665466 }, { "epoch": 33, "train_loss": 5.307142764892578, "train_acc": 0.00976, "test_loss": 7.497373861694336, "test_acc": 0.01, "lyapunov": 1.522810420721693, "grad_norm": 0.20782539541327114, "grad_max_sv": 0.13517180345952512, "grad_min_sv": 1.1068227830043178e-13, "grad_condition": 123350210961.5916, "lr": 0.0008852566213878943, "time_sec": 87.02485609054565 }, { "epoch": 34, "train_loss": 5.307786667785645, "train_acc": 0.01036, "test_loss": 6.049268864440918, "test_acc": 0.01, "lyapunov": 1.5257866547235748, "grad_norm": 0.1890978405416262, "grad_max_sv": 0.10800869315862656, "grad_min_sv": 7.129825504179478e-15, "grad_condition": 107252102588.7272, "lr": 0.000878497527825878, "time_sec": 87.10786271095276 }, { "epoch": 35, "train_loss": 5.3119341674804685, "train_acc": 0.009, "test_loss": 4.805781600952148, "test_acc": 0.01, "lyapunov": 1.5290101019622724, "grad_norm": 0.1944266687511967, "grad_max_sv": 0.11351412069052458, "grad_min_sv": 1.0284869415209545e-14, "grad_condition": 112374076474.89091, "lr": 0.000871572412738697, "time_sec": 87.02945756912231 }, { "epoch": 36, "train_loss": 5.30866313369751, "train_acc": 0.01008, "test_loss": 5.370443841552734, "test_acc": 0.01, "lyapunov": 1.5276334587570346, "grad_norm": 0.16190926523802132, "grad_max_sv": 0.09535483401268721, "grad_min_sv": 3.195651304626571e-15, "grad_condition": 94990079164.94656, "lr": 0.0008644843137107055, "time_sec": 86.99824213981628 }, { "epoch": 37, "train_loss": 5.308895555877686, "train_acc": 0.0099, "test_loss": 4.843223188781738, "test_acc": 0.01, "lyapunov": 1.5290613820790635, "grad_norm": 0.15630460219006667, "grad_max_sv": 0.08036092817783355, "grad_min_sv": 1.1315139619811405e-17, "grad_condition": 80360078431.92064, "lr": 0.0008572363398164014, "time_sec": 86.98283195495605 }, { "epoch": 38, "train_loss": 5.31004166229248, "train_acc": 0.00976, "test_loss": 4.780417753601074, "test_acc": 0.01, "lyapunov": 1.5300937909299455, "grad_norm": 0.16356950260232017, "grad_max_sv": 0.08305604849010706, "grad_min_sv": 8.648904023608753e-17, "grad_condition": 83049364241.033, "lr": 0.0008498316702566826, "time_sec": 87.12476921081543 }, { "epoch": 39, "train_loss": 5.308765927276611, "train_acc": 0.00922, "test_loss": 4.650610294342041, "test_acc": 0.01, "lyapunov": 1.529145797195337, "grad_norm": 0.13936121996216216, "grad_max_sv": 0.06846637381240725, "grad_min_sv": 6.938789416330728e-18, "grad_condition": 68465862650.46446, "lr": 0.0008422735529643442, "time_sec": 87.00707483291626 }, { "epoch": 40, "train_loss": 5.312034950561523, "train_acc": 0.00936, "test_loss": 8.73487543487549, "test_acc": 0.01, "lyapunov": 1.532078573465957, "grad_norm": 0.18500833074783374, "grad_max_sv": 0.078881626855582, "grad_min_sv": 1.2209525522074501e-26, "grad_condition": 78881626855.5808, "lr": 0.0008345653031794289, "time_sec": 86.97358655929565 }, { "epoch": 41, "train_loss": 5.3188898524475094, "train_acc": 0.00938, "test_loss": 6.380272773742676, "test_acc": 0.01, "lyapunov": 1.5366824176305396, "grad_norm": 0.16899341003407245, "grad_max_sv": 0.0827794061973691, "grad_min_sv": 1.2491873132717773e-20, "grad_condition": 82779405140.55663, "lr": 0.0008267103019950526, "time_sec": 86.98160243034363 }, { "epoch": 42, "train_loss": 5.311096598052979, "train_acc": 0.00918, "test_loss": 6.181304641723633, "test_acc": 0.01, "lyapunov": 1.53186220738589, "grad_norm": 0.14945919124069362, "grad_max_sv": 0.07147165723145008, "grad_min_sv": 1.6261729001718281e-18, "grad_condition": 71471530485.47403, "lr": 0.0008187119948743447, "time_sec": 86.98783445358276 }, { "epoch": 43, "train_loss": 5.311037984619141, "train_acc": 0.00992, "test_loss": 6.528422421264648, "test_acc": 0.01, "lyapunov": 1.5322752218417195, "grad_norm": 0.13413981069527348, "grad_max_sv": 0.05753951920196414, "grad_min_sv": 5.739214042427294e-41, "grad_condition": 57539519201.964134, "lr": 0.000810573890139155, "time_sec": 87.02233648300171 }, { "epoch": 44, "train_loss": 5.314179193420411, "train_acc": 0.00976, "test_loss": 6.383645655822754, "test_acc": 0.01, "lyapunov": 1.5352078728053882, "grad_norm": 0.15018671176350665, "grad_max_sv": 0.06426793411374092, "grad_min_sv": 1.0144677449199871e-19, "grad_condition": 64267926931.3136, "lr": 0.0008022995574311873, "time_sec": 86.99135541915894 }, { "epoch": 45, "train_loss": 5.3138120045471195, "train_acc": 0.00972, "test_loss": 6.1780305633544925, "test_acc": 0.01, "lyapunov": 1.53417928048107, "grad_norm": 0.1546946181453632, "grad_max_sv": 0.07538183946162462, "grad_min_sv": 2.0235549254645516e-17, "grad_condition": 75380064770.74498, "lr": 0.0007938926261462363, "time_sec": 86.9700219631195 }, { "epoch": 46, "train_loss": 5.31338122253418, "train_acc": 0.01088, "test_loss": 4.875375650024414, "test_acc": 0.01, "lyapunov": 1.5348101799445384, "grad_norm": 0.13799834022044194, "grad_max_sv": 0.05826565367169678, "grad_min_sv": 1.2213807007518915e-19, "grad_condition": 58265644274.60155, "lr": 0.0007853567838422158, "time_sec": 86.9914186000824 }, { "epoch": 47, "train_loss": 5.316119242401123, "train_acc": 0.01028, "test_loss": 7.579864669799805, "test_acc": 0.01, "lyapunov": 1.5372701596725933, "grad_norm": 0.1318310224117309, "grad_max_sv": 0.059043215587735176, "grad_min_sv": 1.0278524235822533e-42, "grad_condition": 59043215587.73517, "lr": 0.0007766957746216719, "time_sec": 86.99268984794617 }, { "epoch": 48, "train_loss": 5.3163630574035645, "train_acc": 0.00918, "test_loss": 8.10872494354248, "test_acc": 0.01, "lyapunov": 1.537570302443736, "grad_norm": 0.14919853802284255, "grad_max_sv": 0.059043734613806007, "grad_min_sv": 1.9169802249728662e-27, "grad_condition": 59043734613.80581, "lr": 0.0007679133974894982, "time_sec": 86.96942186355591 }, { "epoch": 49, "train_loss": 5.315186663513184, "train_acc": 0.00982, "test_loss": 10.137148637390137, "test_acc": 0.01, "lyapunov": 1.5357392169630435, "grad_norm": 0.14339565437399782, "grad_max_sv": 0.07659720163792372, "grad_min_sv": 9.214212859750722e-16, "grad_condition": 76509866898.91414, "lr": 0.000759013504686565, "time_sec": 87.01622128486633 }, { "epoch": 50, "train_loss": 5.314455534973145, "train_acc": 0.0102, "test_loss": 8.247185594177246, "test_acc": 0.01, "lyapunov": 1.5355263009400624, "grad_norm": 0.13354715221640268, "grad_max_sv": 0.06603035274893046, "grad_min_sv": 4.3361800326764774e-19, "grad_condition": 66030309212.30867, "lr": 0.0007499999999999998, "time_sec": 86.99394655227661 }, { "epoch": 51, "train_loss": 5.32153740737915, "train_acc": 0.01, "test_loss": 8.37662465057373, "test_acc": 0.01, "lyapunov": 1.5409153455968403, "grad_norm": 0.14502327588857133, "grad_max_sv": 0.06259518237784505, "grad_min_sv": 4.890059136866219e-20, "grad_condition": 62595178420.28666, "lr": 0.0007408768370508575, "time_sec": 86.97510194778442 }, { "epoch": 52, "train_loss": 5.316599715270996, "train_acc": 0.00936, "test_loss": 8.278748655700683, "test_acc": 0.01, "lyapunov": 1.5381617646692964, "grad_norm": 0.1359300928840212, "grad_max_sv": 0.05868045939132571, "grad_min_sv": 2.1909536115890692e-21, "grad_condition": 58680459216.2619, "lr": 0.0007316480175599307, "time_sec": 86.98001670837402 }, { "epoch": 53, "train_loss": 5.316536732788086, "train_acc": 0.01016, "test_loss": 5.486338158416748, "test_acc": 0.01, "lyapunov": 1.5382660676146407, "grad_norm": 0.1271741910618785, "grad_max_sv": 0.05760562280192971, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 57605622801.92971, "lr": 0.0007223175895924635, "time_sec": 86.99369311332703 }, { "epoch": 54, "train_loss": 5.316702398681641, "train_acc": 0.0102, "test_loss": 5.302798899841308, "test_acc": 0.01, "lyapunov": 1.5386110059440594, "grad_norm": 0.15368852800875965, "grad_max_sv": 0.0578720694873482, "grad_min_sv": 1.7830822309301135e-42, "grad_condition": 57872069487.348206, "lr": 0.0007128896457825361, "time_sec": 86.96624207496643 }, { "epoch": 55, "train_loss": 5.316231355743408, "train_acc": 0.00948, "test_loss": 8.74564740600586, "test_acc": 0.01, "lyapunov": 1.5383109363448588, "grad_norm": 0.13190622008458677, "grad_max_sv": 0.04535484011285007, "grad_min_sv": 0.0, "grad_condition": 45354840112.850075, "lr": 0.0007033683215378998, "time_sec": 86.97799372673035 }, { "epoch": 56, "train_loss": 5.317534141235352, "train_acc": 0.00946, "test_loss": 8.70028028869629, "test_acc": 0.01, "lyapunov": 1.5393455677934924, "grad_norm": 0.13462977039802712, "grad_max_sv": 0.06513494476675988, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 65134944766.75987, "lr": 0.0006937577932260512, "time_sec": 86.98487591743469 }, { "epoch": 57, "train_loss": 5.318079041290283, "train_acc": 0.0097, "test_loss": 9.145556756591796, "test_acc": 0.01, "lyapunov": 1.5401513216745517, "grad_norm": 0.13118847481535986, "grad_max_sv": 0.05173748955130577, "grad_min_sv": 0.0, "grad_condition": 51737489551.30577, "lr": 0.0006840622763423388, "time_sec": 87.00480890274048 }, { "epoch": 58, "train_loss": 5.316858307800293, "train_acc": 0.00892, "test_loss": 8.666381803894042, "test_acc": 0.01, "lyapunov": 1.5383905370522033, "grad_norm": 0.12912610896619198, "grad_max_sv": 0.06017917674034834, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 60179176740.34834, "lr": 0.0006742860236609073, "time_sec": 87.00866675376892 }, { "epoch": 59, "train_loss": 5.325099550476074, "train_acc": 0.00954, "test_loss": 8.285526527404786, "test_acc": 0.01, "lyapunov": 1.544173507739211, "grad_norm": 0.15876381906710343, "grad_max_sv": 0.06922355592250824, "grad_min_sv": 2.3088949294307303e-16, "grad_condition": 69207800483.04135, "lr": 0.0006644333233692913, "time_sec": 86.97984671592712 }, { "epoch": 60, "train_loss": 5.3204884049987795, "train_acc": 0.0094, "test_loss": 8.168935748291016, "test_acc": 0.01, "lyapunov": 1.5423277512840603, "grad_norm": 0.12428279151580043, "grad_max_sv": 0.05191116128116846, "grad_min_sv": 0.0, "grad_condition": 51911161281.168465, "lr": 0.0006545084971874734, "time_sec": 86.99251651763916 }, { "epoch": 61, "train_loss": 5.318557815551758, "train_acc": 0.00974, "test_loss": 11.625576313781739, "test_acc": 0.01, "lyapunov": 1.5408994303944776, "grad_norm": 0.11981934242025526, "grad_max_sv": 0.04157847780734301, "grad_min_sv": 0.0, "grad_condition": 41578477807.343, "lr": 0.0006445158984722354, "time_sec": 86.97000765800476 }, { "epoch": 62, "train_loss": 5.320785666503906, "train_acc": 0.00938, "test_loss": 12.541597724914551, "test_acc": 0.01, "lyapunov": 1.5433500727729115, "grad_norm": 0.11919617488574552, "grad_max_sv": 0.04310994283296168, "grad_min_sv": 0.0, "grad_condition": 43109942832.96168, "lr": 0.0006344599103076324, "time_sec": 86.96448731422424 }, { "epoch": 63, "train_loss": 5.32412813293457, "train_acc": 0.0091, "test_loss": 11.793109805297851, "test_acc": 0.01, "lyapunov": 1.5443742366702966, "grad_norm": 0.118004366839836, "grad_max_sv": 0.0428059502504766, "grad_min_sv": 0.0, "grad_condition": 42805950250.4766, "lr": 0.0006243449435824269, "time_sec": 86.93323230743408 }, { "epoch": 64, "train_loss": 5.318806624603272, "train_acc": 0.00956, "test_loss": 12.444959045410156, "test_acc": 0.01, "lyapunov": 1.5414444375830842, "grad_norm": 0.11645932110555444, "grad_max_sv": 0.030990714300423862, "grad_min_sv": 0.0, "grad_condition": 30990714300.42386, "lr": 0.0006141754350553275, "time_sec": 86.89740920066833 }, { "epoch": 65, "train_loss": 5.317045929870606, "train_acc": 0.01018, "test_loss": 10.023806936645508, "test_acc": 0.01, "lyapunov": 1.5395582572883353, "grad_norm": 0.11276313707472024, "grad_max_sv": 0.03361189742572605, "grad_min_sv": 0.0, "grad_condition": 33611897425.726055, "lr": 0.0006039558454088793, "time_sec": 86.97432947158813 }, { "epoch": 66, "train_loss": 5.32016941192627, "train_acc": 0.00944, "test_loss": 10.012617837524415, "test_acc": 0.01, "lyapunov": 1.5425440329115103, "grad_norm": 0.10590387961842582, "grad_max_sv": 0.02548480206169188, "grad_min_sv": 0.0, "grad_condition": 25484802061.691883, "lr": 0.000593690657292862, "time_sec": 86.97213578224182 }, { "epoch": 67, "train_loss": 5.320958078460693, "train_acc": 0.00912, "test_loss": 8.012544973754883, "test_acc": 0.01, "lyapunov": 1.5432329269321374, "grad_norm": 0.11098177802612447, "grad_max_sv": 0.028018432063981892, "grad_min_sv": 0.0, "grad_condition": 28018432063.98189, "lr": 0.0005833843733580507, "time_sec": 86.92108106613159 }, { "epoch": 68, "train_loss": 5.319859785614014, "train_acc": 0.0098, "test_loss": 9.247186422729492, "test_acc": 0.01, "lyapunov": 1.542363587852634, "grad_norm": 0.1248664197770911, "grad_max_sv": 0.04367699818685651, "grad_min_sv": 0.0, "grad_condition": 43676998186.85651, "lr": 0.0005730415142812054, "time_sec": 86.95592594146729 }, { "epoch": 69, "train_loss": 5.318826563873291, "train_acc": 0.01016, "test_loss": 10.35489285736084, "test_acc": 0.01, "lyapunov": 1.5414060040203201, "grad_norm": 0.10987589074835707, "grad_max_sv": 0.03276977320201695, "grad_min_sv": 0.0, "grad_condition": 32769773202.01695, "lr": 0.0005626666167821517, "time_sec": 86.91380739212036 }, { "epoch": 70, "train_loss": 5.317324656524658, "train_acc": 0.01038, "test_loss": 9.99694027709961, "test_acc": 0.01, "lyapunov": 1.5401056565896933, "grad_norm": 0.10923451968148526, "grad_max_sv": 0.026721618324518203, "grad_min_sv": 0.0, "grad_condition": 26721618324.518204, "lr": 0.0005522642316338265, "time_sec": 86.8878607749939 }, { "epoch": 71, "train_loss": 5.317690666198731, "train_acc": 0.00962, "test_loss": 8.448246655273438, "test_acc": 0.01, "lyapunov": 1.5407067177545688, "grad_norm": 0.10993057282913465, "grad_max_sv": 0.021391112776473164, "grad_min_sv": 0.0, "grad_condition": 21391112776.473164, "lr": 0.0005418389216661573, "time_sec": 86.89513158798218 }, { "epoch": 72, "train_loss": 5.317815923156738, "train_acc": 0.01004, "test_loss": 12.15319383392334, "test_acc": 0.01, "lyapunov": 1.5406005382537842, "grad_norm": 0.11546754813601234, "grad_max_sv": 0.04164923094213009, "grad_min_sv": 0.0, "grad_condition": 41649230942.13009, "lr": 0.0005313952597646563, "time_sec": 86.93751883506775 }, { "epoch": 73, "train_loss": 5.318552890930175, "train_acc": 0.009, "test_loss": 7.365837602996826, "test_acc": 0.01, "lyapunov": 1.5411235444685991, "grad_norm": 0.11378399985617368, "grad_max_sv": 0.03538390537723899, "grad_min_sv": 0.0, "grad_condition": 35383905377.23899, "lr": 0.0005209378268645994, "time_sec": 86.92508888244629 }, { "epoch": 74, "train_loss": 5.3266375039672855, "train_acc": 0.00916, "test_loss": 5.939176264190674, "test_acc": 0.01, "lyapunov": 1.5473728344568511, "grad_norm": 0.112949937059148, "grad_max_sv": 0.01943044299259782, "grad_min_sv": 0.0, "grad_condition": 19430442992.597816, "lr": 0.0005104712099416781, "time_sec": 86.87594652175903 }, { "epoch": 75, "train_loss": 5.3182286242675785, "train_acc": 0.00916, "test_loss": 7.4682364219665525, "test_acc": 0.01, "lyapunov": 1.5411189620757042, "grad_norm": 0.11641453125231847, "grad_max_sv": 0.01762835620902479, "grad_min_sv": 0.0, "grad_condition": 17628356209.024788, "lr": 0.0004999999999999996, "time_sec": 86.89264059066772 }, { "epoch": 76, "train_loss": 5.318416892242432, "train_acc": 0.00958, "test_loss": 6.8439142288208, "test_acc": 0.01, "lyapunov": 1.5413539412686281, "grad_norm": 0.10777855944530633, "grad_max_sv": 0.015298370318487287, "grad_min_sv": 0.0, "grad_condition": 15298370318.487286, "lr": 0.0004895287900583212, "time_sec": 86.88371872901917 }, { "epoch": 77, "train_loss": 5.3228406227111815, "train_acc": 0.00964, "test_loss": 10.02866414489746, "test_acc": 0.01, "lyapunov": 1.544968852606576, "grad_norm": 0.1305888852844692, "grad_max_sv": 0.01963789644651115, "grad_min_sv": 0.0, "grad_condition": 19637896446.51115, "lr": 0.0004790621731353997, "time_sec": 86.87340235710144 }, { "epoch": 78, "train_loss": 5.319401046447754, "train_acc": 0.00956, "test_loss": 8.256184762573243, "test_acc": 0.01, "lyapunov": 1.54242708158615, "grad_norm": 0.11168685518140656, "grad_max_sv": 0.02321814843453467, "grad_min_sv": 0.0, "grad_condition": 23218148434.534668, "lr": 0.000468604740235343, "time_sec": 86.87403607368469 }, { "epoch": 79, "train_loss": 5.319539002532959, "train_acc": 0.00924, "test_loss": 6.6485612655639645, "test_acc": 0.01, "lyapunov": 1.5427932879504036, "grad_norm": 0.1281479832918265, "grad_max_sv": 0.014649314666166901, "grad_min_sv": 0.0, "grad_condition": 14649314666.1669, "lr": 0.00045816107833384175, "time_sec": 86.86377239227295 }, { "epoch": 80, "train_loss": 5.321709277648925, "train_acc": 0.00858, "test_loss": 7.656314584350586, "test_acc": 0.01, "lyapunov": 1.5438944933664462, "grad_norm": 0.1379118039308171, "grad_max_sv": 0.006280570011585951, "grad_min_sv": 0.0, "grad_condition": 6280570011.585951, "lr": 0.0004477357683661729, "time_sec": 86.91206550598145 }, { "epoch": 81, "train_loss": 5.319362686614991, "train_acc": 0.00904, "test_loss": 7.019269757080078, "test_acc": 0.01, "lyapunov": 1.542548160723713, "grad_norm": 0.12802539188386938, "grad_max_sv": 0.019554349593818188, "grad_min_sv": 0.0, "grad_condition": 19554349593.818188, "lr": 0.00043733338321784746, "time_sec": 86.88340616226196 }, { "epoch": 82, "train_loss": 5.319549789886475, "train_acc": 0.00932, "test_loss": 7.563053443908691, "test_acc": 0.01, "lyapunov": 1.5428213295729265, "grad_norm": 0.12962728912126797, "grad_max_sv": 0.011001831339672207, "grad_min_sv": 0.0, "grad_condition": 11001831339.672207, "lr": 0.0004269584857187939, "time_sec": 87.12197208404541 }, { "epoch": 83, "train_loss": 5.3209361798095705, "train_acc": 0.01004, "test_loss": 8.245951638793946, "test_acc": 0.01, "lyapunov": 1.543517429810351, "grad_norm": 0.12992986434807738, "grad_max_sv": 0.011371771851554514, "grad_min_sv": 0.0, "grad_condition": 11371771851.554514, "lr": 0.0004166156266419484, "time_sec": 86.8549747467041 }, { "epoch": 84, "train_loss": 5.319158186340332, "train_acc": 0.00988, "test_loss": 11.181426934814453, "test_acc": 0.01, "lyapunov": 1.5418739129820138, "grad_norm": 0.14570895237027714, "grad_max_sv": 0.03400726960971952, "grad_min_sv": 0.0, "grad_condition": 34007269609.719513, "lr": 0.0004063093427071373, "time_sec": 86.95320224761963 }, { "epoch": 85, "train_loss": 5.319012271881103, "train_acc": 0.0104, "test_loss": 8.699293096923828, "test_acc": 0.01, "lyapunov": 1.5420828835128824, "grad_norm": 0.15422110126668967, "grad_max_sv": 0.0475749587174505, "grad_min_sv": 0.0, "grad_condition": 47574958717.4505, "lr": 0.0003960441545911199, "time_sec": 86.97516655921936 }, { "epoch": 86, "train_loss": 5.319778329925537, "train_acc": 0.0099, "test_loss": 8.610072163391113, "test_acc": 0.01, "lyapunov": 1.5427404270147729, "grad_norm": 0.16350408468824804, "grad_max_sv": 0.0467130537610501, "grad_min_sv": 0.0, "grad_condition": 46713053761.0501, "lr": 0.0003858245649446718, "time_sec": 86.97473764419556 }, { "epoch": 87, "train_loss": 5.320261403961181, "train_acc": 0.01, "test_loss": 9.01234596862793, "test_acc": 0.01, "lyapunov": 1.5430970234639199, "grad_norm": 0.1987413764171708, "grad_max_sv": 0.042272613104432824, "grad_min_sv": 0.0, "grad_condition": 42272613104.432816, "lr": 0.00037565505641757235, "time_sec": 86.94777846336365 }, { "epoch": 88, "train_loss": 5.328781169433594, "train_acc": 0.00958, "test_loss": 7.222933032226562, "test_acc": 0.01, "lyapunov": 1.5479203133326966, "grad_norm": 0.20200984386229512, "grad_max_sv": 0.037374650174751875, "grad_min_sv": 2.888694869312344e-20, "grad_condition": 37374645422.50441, "lr": 0.00036554008969236695, "time_sec": 86.9300582408905 }, { "epoch": 89, "train_loss": 5.3212895065307615, "train_acc": 0.00972, "test_loss": 7.341721871948242, "test_acc": 0.01, "lyapunov": 1.5442103443243314, "grad_norm": 0.21135067798139123, "grad_max_sv": 0.03894036049023271, "grad_min_sv": 0.0, "grad_condition": 38940360490.232704, "lr": 0.0003554841015277638, "time_sec": 87.02612471580505 }, { "epoch": 90, "train_loss": 5.319550964050293, "train_acc": 0.0093, "test_loss": 7.149930093383789, "test_acc": 0.01, "lyapunov": 1.5423216917325773, "grad_norm": 0.17437221481494697, "grad_max_sv": 0.04075719062238932, "grad_min_sv": 0.0, "grad_condition": 40757190622.38932, "lr": 0.000345491502812526, "time_sec": 86.95247411727905 }, { "epoch": 91, "train_loss": 5.319614014892578, "train_acc": 0.00888, "test_loss": 7.18144443359375, "test_acc": 0.01, "lyapunov": 1.5426533264882119, "grad_norm": 0.17520092959369415, "grad_max_sv": 0.022456927318125965, "grad_min_sv": 0.0, "grad_condition": 22456927318.125965, "lr": 0.0003355666766307081, "time_sec": 86.8960337638855 }, { "epoch": 92, "train_loss": 5.3187762687683104, "train_acc": 0.00888, "test_loss": 7.264889540863037, "test_acc": 0.01, "lyapunov": 1.5419618226683047, "grad_norm": 0.1656377365844615, "grad_max_sv": 0.015189866488799452, "grad_min_sv": 0.0, "grad_condition": 15189866488.799454, "lr": 0.00032571397633909225, "time_sec": 86.88141465187073 }, { "epoch": 93, "train_loss": 5.321614575958252, "train_acc": 0.00952, "test_loss": 7.152406310272217, "test_acc": 0.01, "lyapunov": 1.5444753560263786, "grad_norm": 0.1783525963324978, "grad_max_sv": 0.024426844296976925, "grad_min_sv": 0.0, "grad_condition": 24426844296.97692, "lr": 0.00031593772365766094, "time_sec": 86.87559199333191 }, { "epoch": 94, "train_loss": 5.319984560089111, "train_acc": 0.0098, "test_loss": 7.227280062866211, "test_acc": 0.01, "lyapunov": 1.543088520884209, "grad_norm": 0.16043633002422977, "grad_max_sv": 0.0368963482324034, "grad_min_sv": 0.0, "grad_condition": 36896348232.4034, "lr": 0.0003062422067739483, "time_sec": 86.98869109153748 }, { "epoch": 95, "train_loss": 5.318843619537353, "train_acc": 0.00988, "test_loss": 7.253403067016602, "test_acc": 0.01, "lyapunov": 1.5419552667671457, "grad_norm": 0.15988427664274688, "grad_max_sv": 0.03179542766883969, "grad_min_sv": 0.0, "grad_condition": 31795427668.83969, "lr": 0.00029663167846209965, "time_sec": 86.96610736846924 }, { "epoch": 96, "train_loss": 5.321573169403076, "train_acc": 0.00976, "test_loss": 6.988779404449463, "test_acc": 0.01, "lyapunov": 1.5446298613267786, "grad_norm": 0.14208572570705744, "grad_max_sv": 0.03598490892909467, "grad_min_sv": 0.0, "grad_condition": 35984908929.09467, "lr": 0.00028711035421746345, "time_sec": 86.90040850639343 }, { "epoch": 97, "train_loss": 5.325382752685547, "train_acc": 0.00972, "test_loss": 6.935153257751465, "test_acc": 0.01, "lyapunov": 1.5469825359256677, "grad_norm": 0.18543936556050314, "grad_max_sv": 0.024622759968042373, "grad_min_sv": 0.0, "grad_condition": 24622759968.042374, "lr": 0.00027768241040753615, "time_sec": 86.86737728118896 }, { "epoch": 98, "train_loss": 5.319345963439941, "train_acc": 0.0094, "test_loss": 6.679858758544922, "test_acc": 0.01, "lyapunov": 1.5427014974072157, "grad_norm": 0.1365697052360637, "grad_max_sv": 0.0006230609491467476, "grad_min_sv": 0.0, "grad_condition": 623060949.1467476, "lr": 0.00026835198244006903, "time_sec": 86.8515510559082 }, { "epoch": 99, "train_loss": 5.31858975479126, "train_acc": 0.00966, "test_loss": 6.5813590454101565, "test_acc": 0.01, "lyapunov": 1.5418859296442602, "grad_norm": 0.13741337242075724, "grad_max_sv": 0.0017974570393562317, "grad_min_sv": 0.0, "grad_condition": 1797457039.3562317, "lr": 0.0002591231629491421, "time_sec": 86.8734724521637 }, { "epoch": 100, "train_loss": 5.319550311279297, "train_acc": 0.0096, "test_loss": 6.593423309326172, "test_acc": 0.01, "lyapunov": 1.5429147582529756, "grad_norm": 0.1428860474069435, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 86.91073799133301 }, { "epoch": 101, "train_loss": 5.319647026672364, "train_acc": 0.00946, "test_loss": 6.644115385437011, "test_acc": 0.01, "lyapunov": 1.5430320498278685, "grad_norm": 0.14070137371271418, "grad_max_sv": 0.0011870765592902899, "grad_min_sv": 0.0, "grad_condition": 1187076559.2902899, "lr": 0.00024098649531343477, "time_sec": 86.85703229904175 }, { "epoch": 102, "train_loss": 5.320731920471191, "train_acc": 0.01, "test_loss": 6.511743521118164, "test_acc": 0.01, "lyapunov": 1.544078452202975, "grad_norm": 0.16647090297400036, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 86.84212875366211 }, { "epoch": 103, "train_loss": 5.320380414123536, "train_acc": 0.0087, "test_loss": 6.558885827636718, "test_acc": 0.01, "lyapunov": 1.5436865057786713, "grad_norm": 0.16211214182978093, "grad_max_sv": 0.0006886070128530264, "grad_min_sv": 0.0, "grad_condition": 688607012.8530264, "lr": 0.0002233042253783278, "time_sec": 86.84861445426941 }, { "epoch": 104, "train_loss": 5.320676337890625, "train_acc": 0.0096, "test_loss": 6.2893127243041995, "test_acc": 0.01, "lyapunov": 1.5437259469800593, "grad_norm": 0.15756640000371477, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 86.85342407226562 }, { "epoch": 105, "train_loss": 5.318497552947998, "train_acc": 0.00968, "test_loss": 6.463031019592285, "test_acc": 0.01, "lyapunov": 1.5418586124239675, "grad_norm": 0.16471254677440242, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 86.83621501922607 }, { "epoch": 106, "train_loss": 5.319013707885742, "train_acc": 0.00958, "test_loss": 8.393161967468261, "test_acc": 0.01, "lyapunov": 1.5424105264341739, "grad_norm": 0.1697085900956353, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 86.87845063209534 }, { "epoch": 107, "train_loss": 5.319404435882569, "train_acc": 0.01006, "test_loss": 6.168719081115722, "test_acc": 0.01, "lyapunov": 1.5427791502164758, "grad_norm": 0.16661392944132697, "grad_max_sv": 0.008691688347607852, "grad_min_sv": 0.0, "grad_condition": 8691688347.607851, "lr": 0.0001894261098608447, "time_sec": 86.86028218269348 }, { "epoch": 108, "train_loss": 5.320062127532959, "train_acc": 0.00946, "test_loss": 6.123481111145019, "test_acc": 0.01, "lyapunov": 1.543502251510425, "grad_norm": 0.1553396268788007, "grad_max_sv": 0.0017994886264204979, "grad_min_sv": 0.0, "grad_condition": 1799488626.420498, "lr": 0.000181288005125655, "time_sec": 86.88756346702576 }, { "epoch": 109, "train_loss": 5.32126156539917, "train_acc": 0.0097, "test_loss": 6.113170930480957, "test_acc": 0.01, "lyapunov": 1.5443304225306986, "grad_norm": 0.16827005574777967, "grad_max_sv": 0.008998295897617936, "grad_min_sv": 0.0, "grad_condition": 8998295897.617935, "lr": 0.0001732896980049473, "time_sec": 86.87347865104675 }, { "epoch": 110, "train_loss": 5.319310050964355, "train_acc": 0.00904, "test_loss": 6.0610163803100585, "test_acc": 0.01, "lyapunov": 1.5427448618442505, "grad_norm": 0.14666590598052404, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 86.86950135231018 }, { "epoch": 111, "train_loss": 5.319597338256836, "train_acc": 0.00972, "test_loss": 6.453852326202393, "test_acc": 0.01, "lyapunov": 1.5429801303712303, "grad_norm": 0.15909427151540545, "grad_max_sv": 0.008126799669116735, "grad_min_sv": 0.0, "grad_condition": 8126799669.116735, "lr": 0.00015772644703565552, "time_sec": 86.88328433036804 }, { "epoch": 112, "train_loss": 5.3212175, "train_acc": 0.00984, "test_loss": 6.988222769927979, "test_acc": 0.01, "lyapunov": 1.5440433973546528, "grad_norm": 0.15582154742531334, "grad_max_sv": 0.023284211242571472, "grad_min_sv": 0.0, "grad_condition": 23284211242.571472, "lr": 0.00015016832974331713, "time_sec": 86.88312244415283 }, { "epoch": 113, "train_loss": 5.320971462249756, "train_acc": 0.0098, "test_loss": 6.753297560882569, "test_acc": 0.01, "lyapunov": 1.5437339016848513, "grad_norm": 0.15454565641823212, "grad_max_sv": 0.0231532484292984, "grad_min_sv": 0.0, "grad_condition": 23153248429.2984, "lr": 0.00014276366018359834, "time_sec": 86.87558174133301 }, { "epoch": 114, "train_loss": 5.318772131958008, "train_acc": 0.00984, "test_loss": 6.465322698974609, "test_acc": 0.01, "lyapunov": 1.5421108507439303, "grad_norm": 0.15163809922079102, "grad_max_sv": 0.017600245866924526, "grad_min_sv": 0.0, "grad_condition": 17600245866.924522, "lr": 0.00013551568628929425, "time_sec": 86.85901880264282 }, { "epoch": 115, "train_loss": 5.323592142486572, "train_acc": 0.00918, "test_loss": 5.990406560516357, "test_acc": 0.01, "lyapunov": 1.5453894397486811, "grad_norm": 0.15673824664274916, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 86.8471782207489 }, { "epoch": 116, "train_loss": 5.321912714385986, "train_acc": 0.00934, "test_loss": 5.642854423522949, "test_acc": 0.01, "lyapunov": 1.5451806213544763, "grad_norm": 0.14873545301539315, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 86.82159352302551 }, { "epoch": 117, "train_loss": 5.319042910766601, "train_acc": 0.00916, "test_loss": 5.394878324890136, "test_acc": 0.01, "lyapunov": 1.5425118525009935, "grad_norm": 0.15364989808867727, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 86.8501136302948 }, { "epoch": 118, "train_loss": 5.3216519416809085, "train_acc": 0.0099, "test_loss": 5.54234706954956, "test_acc": 0.01, "lyapunov": 1.544617168738714, "grad_norm": 0.16204040482857374, "grad_max_sv": 0.014768891455605625, "grad_min_sv": 0.0, "grad_condition": 14768891455.605625, "lr": 0.00010815327133708009, "time_sec": 86.8445405960083 }, { "epoch": 119, "train_loss": 5.318838922729492, "train_acc": 0.00982, "test_loss": 5.401806521606446, "test_acc": 0.01, "lyapunov": 1.5422493301694045, "grad_norm": 0.16127338804024163, "grad_max_sv": 0.00781935746781528, "grad_min_sv": 0.0, "grad_condition": 7819357467.81528, "lr": 0.00010173504098790182, "time_sec": 86.82885694503784 }, { "epoch": 120, "train_loss": 5.319433266448975, "train_acc": 0.00962, "test_loss": 5.87718871307373, "test_acc": 0.01, "lyapunov": 1.5428460543722753, "grad_norm": 0.16811186230922795, "grad_max_sv": 0.003142098290845752, "grad_min_sv": 0.0, "grad_condition": 3142098290.845752, "lr": 9.549150281252629e-05, "time_sec": 86.83435249328613 }, { "epoch": 121, "train_loss": 5.318956566009521, "train_acc": 0.00864, "test_loss": 5.642109811401367, "test_acc": 0.01, "lyapunov": 1.5424094806851634, "grad_norm": 0.16401865280170627, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 86.84270787239075 }, { "epoch": 122, "train_loss": 5.320396621246338, "train_acc": 0.00946, "test_loss": 5.506566726684571, "test_acc": 0.01, "lyapunov": 1.543682734984571, "grad_norm": 0.16574195620383422, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 86.84029245376587 }, { "epoch": 123, "train_loss": 5.3207761328125, "train_acc": 0.0098, "test_loss": 5.753901168823242, "test_acc": 0.01, "lyapunov": 1.5442172185234402, "grad_norm": 0.17475767067470402, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 86.83801436424255 }, { "epoch": 124, "train_loss": 5.318808111877441, "train_acc": 0.00922, "test_loss": 5.811789031982422, "test_acc": 0.01, "lyapunov": 1.5422291850190029, "grad_norm": 0.16090202757718183, "grad_max_sv": 0.003358612256124616, "grad_min_sv": 0.0, "grad_condition": 3358612256.1246157, "lr": 7.231786991974666e-05, "time_sec": 86.8513069152832 }, { "epoch": 125, "train_loss": 5.319976197967529, "train_acc": 0.00978, "test_loss": 5.7769184440612795, "test_acc": 0.01, "lyapunov": 1.543531141622597, "grad_norm": 0.15700147429987782, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 86.86197853088379 }, { "epoch": 126, "train_loss": 5.318454194946289, "train_acc": 0.00986, "test_loss": 6.11075336303711, "test_acc": 0.01, "lyapunov": 1.5418975673368216, "grad_norm": 0.15336017967137117, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 86.86198329925537 }, { "epoch": 127, "train_loss": 5.3203326902771, "train_acc": 0.00934, "test_loss": 6.080118833160401, "test_acc": 0.01, "lyapunov": 1.5438893414519328, "grad_norm": 0.15768179334274351, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 86.84648036956787 }, { "epoch": 128, "train_loss": 5.318091445770263, "train_acc": 0.0093, "test_loss": 6.249022463989258, "test_acc": 0.01, "lyapunov": 1.5415176842218774, "grad_norm": 0.15317629834457977, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 86.83089065551758 }, { "epoch": 129, "train_loss": 5.319208795776367, "train_acc": 0.00944, "test_loss": 6.242862550354004, "test_acc": 0.01, "lyapunov": 1.5426923082307782, "grad_norm": 0.1586342865712123, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 86.8825249671936 }, { "epoch": 130, "train_loss": 5.319570325469971, "train_acc": 0.00932, "test_loss": 6.273485357666016, "test_acc": 0.01, "lyapunov": 1.5430697696593108, "grad_norm": 0.16288378510968, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 86.85678577423096 }, { "epoch": 131, "train_loss": 5.31834419998169, "train_acc": 0.00966, "test_loss": 6.162585590362549, "test_acc": 0.01, "lyapunov": 1.5417695389989088, "grad_norm": 0.15701283230384563, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 86.83028483390808 }, { "epoch": 132, "train_loss": 5.319475943603516, "train_acc": 0.0094, "test_loss": 6.003315113067627, "test_acc": 0.01, "lyapunov": 1.5429863951090352, "grad_norm": 0.1615796670941878, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 86.82017540931702 }, { "epoch": 133, "train_loss": 5.32576198135376, "train_acc": 0.00958, "test_loss": 5.846498718261719, "test_acc": 0.01, "lyapunov": 1.5467814566839078, "grad_norm": 0.1814711768537964, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 86.84380340576172 }, { "epoch": 134, "train_loss": 5.321647165985107, "train_acc": 0.00952, "test_loss": 5.876250485229492, "test_acc": 0.01, "lyapunov": 1.544941949722407, "grad_norm": 0.18078759337952854, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 86.84492230415344 }, { "epoch": 135, "train_loss": 5.31924706817627, "train_acc": 0.0096, "test_loss": 5.819815138244629, "test_acc": 0.01, "lyapunov": 1.5427488103851943, "grad_norm": 0.16329066142016732, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 86.83999133110046 }, { "epoch": 136, "train_loss": 5.319398911132812, "train_acc": 0.00982, "test_loss": 6.490616073608399, "test_acc": 0.01, "lyapunov": 1.5429087801052785, "grad_norm": 0.15926311416791136, "grad_max_sv": 0.0018711634445935487, "grad_min_sv": 0.0, "grad_condition": 1871163444.5935485, "lr": 2.1340251233966362e-05, "time_sec": 86.86916947364807 }, { "epoch": 137, "train_loss": 5.318829065551758, "train_acc": 0.00978, "test_loss": 5.920670237731934, "test_acc": 0.01, "lyapunov": 1.5422979410347122, "grad_norm": 0.16006466704199326, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 86.87598538398743 }, { "epoch": 138, "train_loss": 5.3190561383056645, "train_acc": 0.00948, "test_loss": 6.480327618408203, "test_acc": 0.01, "lyapunov": 1.5425209660664239, "grad_norm": 0.16458438595098937, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 86.83726739883423 }, { "epoch": 139, "train_loss": 5.318953646392822, "train_acc": 0.00984, "test_loss": 5.952891006469726, "test_acc": 0.01, "lyapunov": 1.5424313371443688, "grad_norm": 0.16278457254190812, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 86.83793210983276 }, { "epoch": 140, "train_loss": 5.3213463069152835, "train_acc": 0.00976, "test_loss": 6.456882773590088, "test_acc": 0.01, "lyapunov": 1.5445466053760266, "grad_norm": 0.16371751816212385, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 86.85442423820496 }, { "epoch": 141, "train_loss": 5.318112189025879, "train_acc": 0.00942, "test_loss": 6.3592885223388675, "test_acc": 0.01, "lyapunov": 1.5415452919957582, "grad_norm": 0.16093776786582448, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 86.8611011505127 }, { "epoch": 142, "train_loss": 5.319325820617676, "train_acc": 0.00982, "test_loss": 6.396855745697022, "test_acc": 0.01, "lyapunov": 1.5428402808011341, "grad_norm": 0.16262217434072207, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 86.8790693283081 }, { "epoch": 143, "train_loss": 5.319489360198975, "train_acc": 0.0098, "test_loss": 6.390167568206787, "test_acc": 0.01, "lyapunov": 1.5430222728368266, "grad_norm": 0.1599024522956201, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 86.8610942363739 }, { "epoch": 144, "train_loss": 5.3194953466796875, "train_acc": 0.00936, "test_loss": 6.3929207939147945, "test_acc": 0.01, "lyapunov": 1.5430299802814298, "grad_norm": 0.15787151048989498, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 86.83452033996582 }, { "epoch": 145, "train_loss": 5.319091488189697, "train_acc": 0.0099, "test_loss": 6.387041884613037, "test_acc": 0.01, "lyapunov": 1.5425858250664324, "grad_norm": 0.15981682340967285, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 86.84639286994934 }, { "epoch": 146, "train_loss": 5.319918049621582, "train_acc": 0.01, "test_loss": 6.390152045440674, "test_acc": 0.01, "lyapunov": 1.5434830600343397, "grad_norm": 0.1664732055156118, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 86.84289050102234 }, { "epoch": 147, "train_loss": 5.319467689819336, "train_acc": 0.01, "test_loss": 6.383955514526368, "test_acc": 0.01, "lyapunov": 1.5429968952827746, "grad_norm": 0.16425908204350428, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 86.85825252532959 }, { "epoch": 148, "train_loss": 5.319666849975586, "train_acc": 0.01, "test_loss": 6.379462463378906, "test_acc": 0.01, "lyapunov": 1.5432310299495298, "grad_norm": 0.1579801299018272, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 86.90520691871643 }, { "epoch": 149, "train_loss": 5.318641065368652, "train_acc": 0.01, "test_loss": 6.385379031372071, "test_acc": 0.01, "lyapunov": 1.542139550609052, "grad_norm": 0.1606682447514192, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 86.85262036323547 }, { "epoch": 150, "train_loss": 5.31824127532959, "train_acc": 0.01, "test_loss": 6.3839585464477535, "test_acc": 0.01, "lyapunov": 1.5416794817161072, "grad_norm": 0.158152508901321, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 86.85510659217834 } ], "12": [ { "epoch": 1, "train_loss": 5.138188102111816, "train_acc": 0.01868, "test_loss": 4.947204817199707, "test_acc": 0.0102, "lyapunov": 2.4137888052274503, "grad_norm": 5.2278560060516135, "grad_max_sv": 4.450121748447418, "grad_min_sv": 8.815894619873532e-08, "grad_condition": 73462066.87031136, "lr": 0.0009998903417374227, "time_sec": 132.20039796829224 }, { "epoch": 2, "train_loss": 4.910357958526611, "train_acc": 0.01772, "test_loss": 4.974901505279541, "test_acc": 0.0098, "lyapunov": 1.8470725811960753, "grad_norm": 5.334406474785501, "grad_max_sv": 2.416768090268306, "grad_min_sv": 4.845974281257734e-08, "grad_condition": 156669965.4219852, "lr": 0.0009995614150494292, "time_sec": 132.20067143440247 }, { "epoch": 3, "train_loss": 4.789790082702637, "train_acc": 0.01798, "test_loss": 5.241659837341309, "test_acc": 0.0152, "lyapunov": 1.7693803560398425, "grad_norm": 2.284868849655408, "grad_max_sv": 1.6544225737452507, "grad_min_sv": 3.7601093222372486e-08, "grad_condition": 74204967.95678225, "lr": 0.0009990133642141358, "time_sec": 132.1939766407013 }, { "epoch": 4, "train_loss": 4.734155084381103, "train_acc": 0.02012, "test_loss": 4.736255917358398, "test_acc": 0.01, "lyapunov": 1.7185492494222148, "grad_norm": 1.2969402037730182, "grad_max_sv": 0.8527256481349468, "grad_min_sv": 1.8718222001719557e-08, "grad_condition": 3595934101.1830444, "lr": 0.0009982464296247522, "time_sec": 132.19083857536316 }, { "epoch": 5, "train_loss": 4.7501870367431644, "train_acc": 0.01884, "test_loss": 4.7008225593566895, "test_acc": 0.01, "lyapunov": 1.6784742927307363, "grad_norm": 0.7283552366408743, "grad_max_sv": 0.540743650496006, "grad_min_sv": 6.143185659736945e-09, "grad_condition": 20744559298.222054, "lr": 0.0009972609476841367, "time_sec": 132.19878315925598 }, { "epoch": 6, "train_loss": 4.777885425109863, "train_acc": 0.01988, "test_loss": 4.847038110351562, "test_acc": 0.0163, "lyapunov": 1.6714926692835814, "grad_norm": 0.6978205109559127, "grad_max_sv": 0.4112665578722954, "grad_min_sv": 2.577558256003571e-09, "grad_condition": 19293368058.44477, "lr": 0.000996057350657239, "time_sec": 132.22198057174683 }, { "epoch": 7, "train_loss": 4.817885786285401, "train_acc": 0.01714, "test_loss": 4.907033979797363, "test_acc": 0.01, "lyapunov": 1.6430019908548925, "grad_norm": 0.538957530048536, "grad_max_sv": 0.3900473590940237, "grad_min_sv": 8.011143267797137e-10, "grad_condition": 53520886424.44034, "lr": 0.000994636166481494, "time_sec": 132.18847823143005 }, { "epoch": 8, "train_loss": 4.866279851989746, "train_acc": 0.01534, "test_loss": 4.982185540008545, "test_acc": 0.01, "lyapunov": 1.622301935234948, "grad_norm": 0.44743905036756576, "grad_max_sv": 0.2975618153810501, "grad_min_sv": 4.042702856767639e-12, "grad_condition": 98919396245.19788, "lr": 0.0009929980185352525, "time_sec": 132.2019805908203 }, { "epoch": 9, "train_loss": 4.93485692489624, "train_acc": 0.01296, "test_loss": 5.24868205871582, "test_acc": 0.01, "lyapunov": 1.6329893876829416, "grad_norm": 1.2710312604148948, "grad_max_sv": 0.23227821737527848, "grad_min_sv": 1.210631234207371e-10, "grad_condition": 132050856729.70003, "lr": 0.0009911436253643444, "time_sec": 132.25901436805725 }, { "epoch": 10, "train_loss": 4.94441338470459, "train_acc": 0.01662, "test_loss": 4.9677005256652835, "test_acc": 0.01, "lyapunov": 1.6191197569717837, "grad_norm": 0.5849346197331, "grad_max_sv": 0.3103320188820362, "grad_min_sv": 2.4441770461207573e-12, "grad_condition": 142331552698.27188, "lr": 0.0009890738003669028, "time_sec": 132.24092388153076 }, { "epoch": 11, "train_loss": 4.978343018798828, "train_acc": 0.01596, "test_loss": 4.759020803070069, "test_acc": 0.01, "lyapunov": 1.607335550096029, "grad_norm": 0.4668173173890936, "grad_max_sv": 0.3271574813872576, "grad_min_sv": 1.5228846413101469e-12, "grad_condition": 163401069045.22977, "lr": 0.00098678945143658, "time_sec": 132.22342109680176 }, { "epoch": 12, "train_loss": 5.019883101348877, "train_acc": 0.0154, "test_loss": 4.942817668151855, "test_acc": 0.01, "lyapunov": 1.6049258376631286, "grad_norm": 0.5264008543358515, "grad_max_sv": 0.28871628642082214, "grad_min_sv": 1.5745550588117867e-12, "grad_condition": 141150096351.00974, "lr": 0.0009842915805643154, "time_sec": 132.17593479156494 }, { "epoch": 13, "train_loss": 5.055773426361084, "train_acc": 0.01454, "test_loss": 5.201871238708496, "test_acc": 0.01, "lyapunov": 1.5926724358287918, "grad_norm": 0.5496018971790103, "grad_max_sv": 0.3235856369137764, "grad_min_sv": 1.5836317227272346e-12, "grad_condition": 172440841867.61472, "lr": 0.000981581283398829, "time_sec": 132.19917631149292 }, { "epoch": 14, "train_loss": 5.1001338768005375, "train_acc": 0.01374, "test_loss": 6.031500621795654, "test_acc": 0.01, "lyapunov": 1.5873235156164145, "grad_norm": 0.5347429702370289, "grad_max_sv": 0.31967496164143083, "grad_min_sv": 8.416411018220654e-13, "grad_condition": 202636437942.46396, "lr": 0.0009786597487660333, "time_sec": 132.17077159881592 }, { "epoch": 15, "train_loss": 5.135957703857422, "train_acc": 0.0124, "test_loss": 5.739520129394531, "test_acc": 0.01, "lyapunov": 1.574544443803675, "grad_norm": 0.6201173127889323, "grad_max_sv": 0.32148296795785425, "grad_min_sv": 1.8768859669293263e-11, "grad_condition": 245017227140.7776, "lr": 0.0009755282581475766, "time_sec": 132.19619607925415 }, { "epoch": 16, "train_loss": 5.19933319366455, "train_acc": 0.01332, "test_loss": 6.819124224090576, "test_acc": 0.01, "lyapunov": 1.588761254649638, "grad_norm": 0.7105947575125269, "grad_max_sv": 0.3380855549126863, "grad_min_sv": 1.0418656496584723e-09, "grad_condition": 212026412736.4578, "lr": 0.0009721881851187403, "time_sec": 132.16591668128967 }, { "epoch": 17, "train_loss": 5.203327436523438, "train_acc": 0.0158, "test_loss": 7.679113117980957, "test_acc": 0.01, "lyapunov": 1.5917936892765563, "grad_norm": 0.5687429696625533, "grad_max_sv": 0.3429654061794281, "grad_min_sv": 1.0535516342595844e-12, "grad_condition": 208532854744.75134, "lr": 0.0009686409947459456, "time_sec": 132.23086404800415 }, { "epoch": 18, "train_loss": 5.227132577209472, "train_acc": 0.01704, "test_loss": 5.224352997589111, "test_acc": 0.01, "lyapunov": 1.590573813604272, "grad_norm": 0.6501892893379347, "grad_max_sv": 0.3389496423304081, "grad_min_sv": 1.4743293232017855e-12, "grad_condition": 179354691955.7947, "lr": 0.0009648882429441254, "time_sec": 132.17126607894897 }, { "epoch": 19, "train_loss": 5.268917711486816, "train_acc": 0.01574, "test_loss": 5.769149468994141, "test_acc": 0.01, "lyapunov": 1.5737659489102376, "grad_norm": 0.7756970175394374, "grad_max_sv": 0.33219469264149665, "grad_min_sv": 1.3963206987681851e-12, "grad_condition": 166340823567.4583, "lr": 0.00096093157579425, "time_sec": 132.3532431125641 }, { "epoch": 20, "train_loss": 5.388035034332275, "train_acc": 0.01436, "test_loss": 4.855289517211914, "test_acc": 0.01, "lyapunov": 1.6196008579200492, "grad_norm": 3.273774802278225, "grad_max_sv": 0.3476741284544914, "grad_min_sv": 1.7954016832837687e-12, "grad_condition": 163400108512.08075, "lr": 0.0009567727288213001, "time_sec": 132.18322706222534 }, { "epoch": 21, "train_loss": 5.477730575561523, "train_acc": 0.0119, "test_loss": 5.734935963439941, "test_acc": 0.01, "lyapunov": 1.6737558759386888, "grad_norm": 0.7316822390940195, "grad_max_sv": 0.41190238408744334, "grad_min_sv": 1.4433235299420839e-09, "grad_condition": 115946317202.22786, "lr": 0.0009524135262330095, "time_sec": 132.2254023551941 }, { "epoch": 22, "train_loss": 5.39889496673584, "train_acc": 0.01078, "test_loss": 4.648544214630127, "test_acc": 0.01, "lyapunov": 1.5598208084130836, "grad_norm": 0.9136530334274789, "grad_max_sv": 0.5729864671826362, "grad_min_sv": 6.476590619830438e-09, "grad_condition": 6966838482.173167, "lr": 0.0009478558801197061, "time_sec": 132.19873070716858 }, { "epoch": 23, "train_loss": 5.343370434570312, "train_acc": 0.00934, "test_loss": 4.6330633590698245, "test_acc": 0.01, "lyapunov": 1.544742999174406, "grad_norm": 0.5447776712180945, "grad_max_sv": 0.3971055932343006, "grad_min_sv": 3.0723113141940555e-09, "grad_condition": 10360739417.615135, "lr": 0.000943101789615607, "time_sec": 132.19472217559814 }, { "epoch": 24, "train_loss": 5.354044710998535, "train_acc": 0.0106, "test_loss": 4.758938900756836, "test_acc": 0.01, "lyapunov": 1.5540964880867687, "grad_norm": 0.49799279906750776, "grad_max_sv": 0.32289256788790227, "grad_min_sv": 1.215183540768495e-09, "grad_condition": 84138259698.76875, "lr": 0.0009381533400219313, "time_sec": 132.18565702438354 }, { "epoch": 25, "train_loss": 5.34166207687378, "train_acc": 0.00954, "test_loss": 4.616498927307129, "test_acc": 0.01, "lyapunov": 1.5548294105798082, "grad_norm": 0.35224887377867997, "grad_max_sv": 0.2050650805234909, "grad_min_sv": 4.310481015545377e-10, "grad_condition": 137027644012.72295, "lr": 0.0009330127018922189, "time_sec": 132.1707353591919 }, { "epoch": 26, "train_loss": 5.329114703826904, "train_acc": 0.00962, "test_loss": 4.608516737365723, "test_acc": 0.01, "lyapunov": 1.5478018071035595, "grad_norm": 0.41152400199519606, "grad_max_sv": 0.14391734022647143, "grad_min_sv": 6.406558234285353e-11, "grad_condition": 129739564652.99875, "lr": 0.000927682130080253, "time_sec": 132.1968698501587 }, { "epoch": 27, "train_loss": 5.333489670410156, "train_acc": 0.0092, "test_loss": 4.6180027542114255, "test_acc": 0.01, "lyapunov": 1.553746031068475, "grad_norm": 0.395956424199356, "grad_max_sv": 0.077771030459553, "grad_min_sv": 3.8469886311157825e-16, "grad_condition": 77730702472.31937, "lr": 0.0009221639627510072, "time_sec": 132.21505451202393 }, { "epoch": 28, "train_loss": 5.351277679595947, "train_acc": 0.00942, "test_loss": 4.7706145118713374, "test_acc": 0.01, "lyapunov": 1.564519799273947, "grad_norm": 0.8070388432556335, "grad_max_sv": 0.08204491948708892, "grad_min_sv": 1.474816693019578e-15, "grad_condition": 81835653341.89993, "lr": 0.0009164606203550494, "time_sec": 132.19659543037415 }, { "epoch": 29, "train_loss": 5.322618664703369, "train_acc": 0.00872, "test_loss": 5.576576512145996, "test_acc": 0.01, "lyapunov": 1.5448476557841386, "grad_norm": 1.8211987840238726, "grad_max_sv": 0.006918648211285472, "grad_min_sv": 3.854375422071664e-17, "grad_condition": 6914688932.083499, "lr": 0.0009105746045668516, "time_sec": 132.10211896896362 }, { "epoch": 30, "train_loss": 5.332048937377929, "train_acc": 0.00954, "test_loss": 5.513208132934571, "test_acc": 0.01, "lyapunov": 1.550695708035813, "grad_norm": 1.1118821287367113, "grad_max_sv": 0.019531637569889425, "grad_min_sv": 1.0689040165877983e-16, "grad_condition": 19522880900.554432, "lr": 0.0009045084971874733, "time_sec": 132.11267638206482 }, { "epoch": 31, "train_loss": 5.326176876373291, "train_acc": 0.00918, "test_loss": 5.386148994445801, "test_acc": 0.01, "lyapunov": 1.5464019519288827, "grad_norm": 0.5069935542454341, "grad_max_sv": 0.054698918107897045, "grad_min_sv": 3.7386723818325515e-15, "grad_condition": 54294495664.74051, "lr": 0.0008982649590120977, "time_sec": 132.1673936843872 }, { "epoch": 32, "train_loss": 5.322083574829102, "train_acc": 0.01, "test_loss": 4.707043412780762, "test_acc": 0.01, "lyapunov": 1.544298157667565, "grad_norm": 0.42554937796746406, "grad_max_sv": 0.04392390437424183, "grad_min_sv": 2.3012806918730416e-16, "grad_condition": 43903285638.58012, "lr": 0.0008918467286629196, "time_sec": 132.18636798858643 }, { "epoch": 33, "train_loss": 5.328476766967773, "train_acc": 0.00958, "test_loss": 5.157709109497071, "test_acc": 0.01, "lyapunov": 1.5494323496318534, "grad_norm": 0.3948590073220422, "grad_max_sv": 0.046419868059456346, "grad_min_sv": 3.920453121241332e-16, "grad_condition": 46387197576.51258, "lr": 0.0008852566213878943, "time_sec": 132.14906311035156 }, { "epoch": 34, "train_loss": 5.335322699432373, "train_acc": 0.00912, "test_loss": 4.63318578491211, "test_acc": 0.01, "lyapunov": 1.5560249096292365, "grad_norm": 0.3431205276749687, "grad_max_sv": 0.006924860086292029, "grad_min_sv": 0.0, "grad_condition": 6924860086.292028, "lr": 0.000878497527825878, "time_sec": 132.08630466461182 }, { "epoch": 35, "train_loss": 5.323294322357178, "train_acc": 0.00884, "test_loss": 4.605205520629883, "test_acc": 0.01, "lyapunov": 1.5453313735439955, "grad_norm": 0.3024735245825119, "grad_max_sv": 0.028930858056992293, "grad_min_sv": 0.0, "grad_condition": 28930858056.9923, "lr": 0.000871572412738697, "time_sec": 132.11405229568481 }, { "epoch": 36, "train_loss": 5.324136592712402, "train_acc": 0.00868, "test_loss": 4.605186470031739, "test_acc": 0.01, "lyapunov": 1.5469522064604113, "grad_norm": 0.361219602695028, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107055, "time_sec": 132.07118153572083 }, { "epoch": 37, "train_loss": 5.3209700448608395, "train_acc": 0.00892, "test_loss": 4.665984559631347, "test_acc": 0.01, "lyapunov": 1.5437110970392252, "grad_norm": 0.3116729659195542, "grad_max_sv": 0.020941149955615402, "grad_min_sv": 0.0, "grad_condition": 20941149955.6154, "lr": 0.0008572363398164014, "time_sec": 132.09318017959595 }, { "epoch": 38, "train_loss": 5.325020372467041, "train_acc": 0.00874, "test_loss": 4.663543145751953, "test_acc": 0.01, "lyapunov": 1.5469195239074396, "grad_norm": 0.305903104498294, "grad_max_sv": 0.024645538488402962, "grad_min_sv": 0.0, "grad_condition": 24645538488.40296, "lr": 0.0008498316702566826, "time_sec": 132.18630456924438 }, { "epoch": 39, "train_loss": 5.326424997558593, "train_acc": 0.00926, "test_loss": 4.710470159912109, "test_acc": 0.01, "lyapunov": 1.5472500924868962, "grad_norm": 0.3315518442712431, "grad_max_sv": 0.03559725326485932, "grad_min_sv": 4.71556170988084e-33, "grad_condition": 35597253264.859314, "lr": 0.0008422735529643442, "time_sec": 132.1392993927002 }, { "epoch": 40, "train_loss": 5.33426462966919, "train_acc": 0.0096, "test_loss": 4.689337516784668, "test_acc": 0.01, "lyapunov": 1.555562095568918, "grad_norm": 0.3795118996689083, "grad_max_sv": 0.028565633855760098, "grad_min_sv": 0.0, "grad_condition": 28565633855.760094, "lr": 0.0008345653031794289, "time_sec": 132.12650513648987 }, { "epoch": 41, "train_loss": 5.329594454193115, "train_acc": 0.00962, "test_loss": 4.677967825317383, "test_acc": 0.01, "lyapunov": 1.5518201217626977, "grad_norm": 0.35226874238427724, "grad_max_sv": 0.031289939628914, "grad_min_sv": 0.0, "grad_condition": 31289939628.913994, "lr": 0.0008267103019950526, "time_sec": 132.1842393875122 }, { "epoch": 42, "train_loss": 5.334290416412354, "train_acc": 0.00948, "test_loss": 4.7127025581359865, "test_acc": 0.01, "lyapunov": 1.55599294903943, "grad_norm": 0.3150010140468872, "grad_max_sv": 0.008952232170850038, "grad_min_sv": 0.0, "grad_condition": 8952232170.850039, "lr": 0.0008187119948743447, "time_sec": 132.16592741012573 }, { "epoch": 43, "train_loss": 5.330992495574951, "train_acc": 0.00988, "test_loss": 4.715853765869141, "test_acc": 0.01, "lyapunov": 1.5526615817223668, "grad_norm": 0.32555598147833537, "grad_max_sv": 0.025627513602375983, "grad_min_sv": 0.0, "grad_condition": 25627513602.375984, "lr": 0.000810573890139155, "time_sec": 132.1376314163208 }, { "epoch": 44, "train_loss": 5.342441840667725, "train_acc": 0.009, "test_loss": 4.814597158813476, "test_acc": 0.01, "lyapunov": 1.5608167011109764, "grad_norm": 0.3705555621106487, "grad_max_sv": 0.012277775909751654, "grad_min_sv": 0.0, "grad_condition": 12277775909.751654, "lr": 0.0008022995574311873, "time_sec": 132.10150909423828 }, { "epoch": 45, "train_loss": 5.330550760803223, "train_acc": 0.00922, "test_loss": 4.82506159362793, "test_acc": 0.01, "lyapunov": 1.552602043846989, "grad_norm": 0.41377353743023604, "grad_max_sv": 0.012684891000390053, "grad_min_sv": 0.0, "grad_condition": 12684891000.390053, "lr": 0.0007938926261462363, "time_sec": 132.13983154296875 }, { "epoch": 46, "train_loss": 5.346614602661133, "train_acc": 0.00908, "test_loss": 4.75941802444458, "test_acc": 0.01, "lyapunov": 1.565407470059212, "grad_norm": 0.6666703677397586, "grad_max_sv": 0.0006472387816756964, "grad_min_sv": 0.0, "grad_condition": 647238781.6756964, "lr": 0.0007853567838422158, "time_sec": 132.07343816757202 }, { "epoch": 47, "train_loss": 5.32947943145752, "train_acc": 0.00898, "test_loss": 4.822898616027832, "test_acc": 0.01, "lyapunov": 1.5532338082637933, "grad_norm": 1.2230171967365666, "grad_max_sv": 0.011994929099455477, "grad_min_sv": 0.0, "grad_condition": 11994929099.455475, "lr": 0.0007766957746216719, "time_sec": 132.13085794448853 }, { "epoch": 48, "train_loss": 5.3338893869018555, "train_acc": 0.0092, "test_loss": 4.843168624877929, "test_acc": 0.01, "lyapunov": 1.5537122622170412, "grad_norm": 0.9355731457390791, "grad_max_sv": 0.06068415185436606, "grad_min_sv": 1.5809611954265782e-13, "grad_condition": 46398377146.35246, "lr": 0.0007679133974894982, "time_sec": 132.11377477645874 }, { "epoch": 49, "train_loss": 5.340212641296387, "train_acc": 0.00966, "test_loss": 4.808492147827148, "test_acc": 0.01, "lyapunov": 1.556026118490702, "grad_norm": 0.3770156243368251, "grad_max_sv": 0.1463914191350341, "grad_min_sv": 3.152568142733814e-13, "grad_condition": 121760995460.97897, "lr": 0.000759013504686565, "time_sec": 132.2147512435913 }, { "epoch": 50, "train_loss": 5.332282363586426, "train_acc": 0.0096, "test_loss": 4.743034214782715, "test_acc": 0.01, "lyapunov": 1.5524532118111924, "grad_norm": 0.3116530039130024, "grad_max_sv": 0.10226385369896888, "grad_min_sv": 3.0737180401130916e-15, "grad_condition": 101953179254.12184, "lr": 0.0007499999999999998, "time_sec": 132.22958421707153 }, { "epoch": 51, "train_loss": 5.3305883631896975, "train_acc": 0.00952, "test_loss": 4.724603568267822, "test_acc": 0.01, "lyapunov": 1.5518521100968656, "grad_norm": 0.3241210515609679, "grad_max_sv": 0.08684249427169562, "grad_min_sv": 6.328097683852358e-16, "grad_condition": 86783867952.95651, "lr": 0.0007408768370508575, "time_sec": 132.19532179832458 }, { "epoch": 52, "train_loss": 5.332131455078125, "train_acc": 0.00964, "test_loss": 4.782391441345215, "test_acc": 0.01, "lyapunov": 1.5542255048556706, "grad_norm": 0.32295260623787486, "grad_max_sv": 0.077319351490587, "grad_min_sv": 1.8882153881334225e-23, "grad_condition": 77319351489.28442, "lr": 0.0007316480175599307, "time_sec": 132.21878457069397 }, { "epoch": 53, "train_loss": 5.333503689270019, "train_acc": 0.00936, "test_loss": 4.801981381225586, "test_acc": 0.01, "lyapunov": 1.5553877649404813, "grad_norm": 0.31562374196715365, "grad_max_sv": 0.06292690904811024, "grad_min_sv": 1.0573404187094843e-32, "grad_condition": 62926909048.110245, "lr": 0.0007223175895924635, "time_sec": 132.18660378456116 }, { "epoch": 54, "train_loss": 5.333852608795166, "train_acc": 0.00896, "test_loss": 4.810883659362793, "test_acc": 0.01, "lyapunov": 1.5559345386217318, "grad_norm": 0.2781133113627033, "grad_max_sv": 0.06129774982109666, "grad_min_sv": 2.855284741973353e-38, "grad_condition": 61297749821.09666, "lr": 0.0007128896457825361, "time_sec": 132.2198555469513 }, { "epoch": 55, "train_loss": 5.3339955087280275, "train_acc": 0.00996, "test_loss": 4.7569840606689455, "test_acc": 0.01, "lyapunov": 1.5569808833739336, "grad_norm": 0.2566538491911281, "grad_max_sv": 0.05556260636076331, "grad_min_sv": 0.0, "grad_condition": 55562606360.763306, "lr": 0.0007033683215378998, "time_sec": 132.21158051490784 }, { "epoch": 56, "train_loss": 5.3385576313781735, "train_acc": 0.00902, "test_loss": 4.754797148895264, "test_acc": 0.01, "lyapunov": 1.5597065461566075, "grad_norm": 0.27047724542782614, "grad_max_sv": 0.0640806739218533, "grad_min_sv": 1.2193818893472967e-19, "grad_condition": 64080664167.18032, "lr": 0.0006937577932260512, "time_sec": 132.19129037857056 }, { "epoch": 57, "train_loss": 5.334184418182373, "train_acc": 0.0103, "test_loss": 4.782689431762695, "test_acc": 0.01, "lyapunov": 1.556523521842859, "grad_norm": 0.29259577039987816, "grad_max_sv": 0.07542139226570725, "grad_min_sv": 8.844145625485828e-17, "grad_condition": 75415188010.71097, "lr": 0.0006840622763423388, "time_sec": 132.19539308547974 }, { "epoch": 58, "train_loss": 5.3342736126708985, "train_acc": 0.00902, "test_loss": 4.792922207641602, "test_acc": 0.01, "lyapunov": 1.556638328925423, "grad_norm": 0.27651642414760924, "grad_max_sv": 0.07381959799677133, "grad_min_sv": 5.679191077750394e-25, "grad_condition": 73819597996.72554, "lr": 0.0006742860236609073, "time_sec": 132.1646604537964 }, { "epoch": 59, "train_loss": 5.3365766784667965, "train_acc": 0.00976, "test_loss": 4.764654750061035, "test_acc": 0.01, "lyapunov": 1.559028771527283, "grad_norm": 0.32368701389084115, "grad_max_sv": 0.06830886630341411, "grad_min_sv": 3.373213421233685e-18, "grad_condition": 68308625699.52162, "lr": 0.0006644333233692913, "time_sec": 132.20315170288086 }, { "epoch": 60, "train_loss": 5.3372549061584476, "train_acc": 0.00876, "test_loss": 4.821174919128418, "test_acc": 0.01, "lyapunov": 1.5602548335824171, "grad_norm": 0.3407373955115073, "grad_max_sv": 0.05221205474808812, "grad_min_sv": 0.0, "grad_condition": 52212054748.08812, "lr": 0.0006545084971874734, "time_sec": 132.21871399879456 }, { "epoch": 61, "train_loss": 5.340573087158203, "train_acc": 0.01004, "test_loss": 4.814465225219727, "test_acc": 0.01, "lyapunov": 1.5639353786283137, "grad_norm": 0.33445562902063697, "grad_max_sv": 0.04306556633673608, "grad_min_sv": 0.0, "grad_condition": 43065566336.736084, "lr": 0.0006445158984722354, "time_sec": 132.16924214363098 }, { "epoch": 62, "train_loss": 5.343714674987793, "train_acc": 0.0095, "test_loss": 4.770381900024414, "test_acc": 0.01, "lyapunov": 1.566701197258347, "grad_norm": 0.41600975854497274, "grad_max_sv": 0.0407159102614969, "grad_min_sv": 0.0, "grad_condition": 40715910261.4969, "lr": 0.0006344599103076324, "time_sec": 132.14849257469177 }, { "epoch": 63, "train_loss": 5.340150414581299, "train_acc": 0.00942, "test_loss": 4.809834826660156, "test_acc": 0.01, "lyapunov": 1.5634946268232888, "grad_norm": 0.4244404576721166, "grad_max_sv": 0.046563083119690415, "grad_min_sv": 0.0, "grad_condition": 46563083119.690414, "lr": 0.0006243449435824269, "time_sec": 132.2440116405487 }, { "epoch": 64, "train_loss": 5.352264609527588, "train_acc": 0.00968, "test_loss": 4.719538593292237, "test_acc": 0.01, "lyapunov": 1.5730204283428924, "grad_norm": 0.6484058447373605, "grad_max_sv": 0.06881329002790153, "grad_min_sv": 4.045636130762067e-11, "grad_condition": 57057261120.16382, "lr": 0.0006141754350553275, "time_sec": 132.1377170085907 }, { "epoch": 65, "train_loss": 5.345465493011474, "train_acc": 0.0095, "test_loss": 4.807828170013428, "test_acc": 0.01, "lyapunov": 1.5668580141823616, "grad_norm": 0.26811037405238153, "grad_max_sv": 0.0895066935569048, "grad_min_sv": 8.923440580685122e-16, "grad_condition": 89405744261.32881, "lr": 0.0006039558454088793, "time_sec": 132.18963503837585 }, { "epoch": 66, "train_loss": 5.339095722351074, "train_acc": 0.00992, "test_loss": 4.79014116973877, "test_acc": 0.01, "lyapunov": 1.562422338044247, "grad_norm": 0.2418134006072333, "grad_max_sv": 0.04957848088815808, "grad_min_sv": 0.0, "grad_condition": 49578480888.15808, "lr": 0.000593690657292862, "time_sec": 132.18193554878235 }, { "epoch": 67, "train_loss": 5.339143208312988, "train_acc": 0.00878, "test_loss": 4.846720378875732, "test_acc": 0.01, "lyapunov": 1.5629626052153995, "grad_norm": 0.23211875934280046, "grad_max_sv": 0.04276521084830165, "grad_min_sv": 0.0, "grad_condition": 42765210848.30165, "lr": 0.0005833843733580507, "time_sec": 132.21098923683167 }, { "epoch": 68, "train_loss": 5.341660294799805, "train_acc": 0.00926, "test_loss": 4.93624571685791, "test_acc": 0.01, "lyapunov": 1.5647895671522525, "grad_norm": 0.25226724531209027, "grad_max_sv": 0.04243421019054949, "grad_min_sv": 0.0, "grad_condition": 42434210190.54949, "lr": 0.0005730415142812054, "time_sec": 132.18032026290894 }, { "epoch": 69, "train_loss": 5.3429354066467285, "train_acc": 0.00964, "test_loss": 4.963717977905273, "test_acc": 0.01, "lyapunov": 1.5658744921159866, "grad_norm": 0.26387680813745, "grad_max_sv": 0.044778031017631295, "grad_min_sv": 0.0, "grad_condition": 44778031017.63129, "lr": 0.0005626666167821517, "time_sec": 132.16022729873657 }, { "epoch": 70, "train_loss": 5.344523805389405, "train_acc": 0.0091, "test_loss": 4.810392481231689, "test_acc": 0.01, "lyapunov": 1.5665253672148565, "grad_norm": 0.31439106456207916, "grad_max_sv": 0.03966532703489065, "grad_min_sv": 0.0, "grad_condition": 39665327034.890656, "lr": 0.0005522642316338265, "time_sec": 132.1867744922638 }, { "epoch": 71, "train_loss": 5.346882275238037, "train_acc": 0.00912, "test_loss": 4.778971862792969, "test_acc": 0.01, "lyapunov": 1.568563460998828, "grad_norm": 0.20952619953519083, "grad_max_sv": 0.03776215887628496, "grad_min_sv": 0.0, "grad_condition": 37762158876.28496, "lr": 0.0005418389216661573, "time_sec": 132.18875670433044 }, { "epoch": 72, "train_loss": 5.353162684936524, "train_acc": 0.00818, "test_loss": 4.764224601745606, "test_acc": 0.01, "lyapunov": 1.5738632352760686, "grad_norm": 0.21224191589739633, "grad_max_sv": 0.02936461050994694, "grad_min_sv": 0.0, "grad_condition": 29364610509.94694, "lr": 0.0005313952597646563, "time_sec": 132.16054940223694 }, { "epoch": 73, "train_loss": 5.341572857055664, "train_acc": 0.00934, "test_loss": 4.764213945770264, "test_acc": 0.01, "lyapunov": 1.5656722372450183, "grad_norm": 0.17131578138452824, "grad_max_sv": 0.026255082851275802, "grad_min_sv": 0.0, "grad_condition": 26255082851.275803, "lr": 0.0005209378268645994, "time_sec": 132.11386466026306 }, { "epoch": 74, "train_loss": 5.34148181564331, "train_acc": 0.00884, "test_loss": 4.787430990600586, "test_acc": 0.01, "lyapunov": 1.5657289049509542, "grad_norm": 0.20416273686306285, "grad_max_sv": 0.03651727414689958, "grad_min_sv": 0.0, "grad_condition": 36517274146.89958, "lr": 0.0005104712099416781, "time_sec": 132.2018940448761 }, { "epoch": 75, "train_loss": 5.341119176330566, "train_acc": 0.00948, "test_loss": 4.769783227539063, "test_acc": 0.01, "lyapunov": 1.5654692183370176, "grad_norm": 0.17080101166392242, "grad_max_sv": 0.030799029115587472, "grad_min_sv": 0.0, "grad_condition": 30799029115.587475, "lr": 0.0004999999999999996, "time_sec": 132.12539839744568 }, { "epoch": 76, "train_loss": 5.345115729370117, "train_acc": 0.00946, "test_loss": 4.734894322967529, "test_acc": 0.01, "lyapunov": 1.5686149972174175, "grad_norm": 0.18659944764551223, "grad_max_sv": 0.012125130696222185, "grad_min_sv": 0.0, "grad_condition": 12125130696.222187, "lr": 0.0004895287900583212, "time_sec": 132.09123158454895 }, { "epoch": 77, "train_loss": 5.338459321289062, "train_acc": 0.0094, "test_loss": 4.7248460479736325, "test_acc": 0.01, "lyapunov": 1.5630621724116527, "grad_norm": 0.176032379936258, "grad_max_sv": 0.013429323118180037, "grad_min_sv": 0.0, "grad_condition": 13429323118.180037, "lr": 0.0004790621731353997, "time_sec": 132.07102465629578 }, { "epoch": 78, "train_loss": 5.345072369537354, "train_acc": 0.00896, "test_loss": 4.745542971801758, "test_acc": 0.01, "lyapunov": 1.5687669668051287, "grad_norm": 0.2223520771526132, "grad_max_sv": 0.00913866781629622, "grad_min_sv": 0.0, "grad_condition": 9138667816.29622, "lr": 0.000468604740235343, "time_sec": 132.31091713905334 }, { "epoch": 79, "train_loss": 5.338468246459961, "train_acc": 0.00906, "test_loss": 4.776708003234863, "test_acc": 0.01, "lyapunov": 1.5631554016981588, "grad_norm": 0.18439021291098787, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 132.1099407672882 }, { "epoch": 80, "train_loss": 5.3392803921508785, "train_acc": 0.0085, "test_loss": 4.756961068725586, "test_acc": 0.01, "lyapunov": 1.5640239118005308, "grad_norm": 0.1670344381602521, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 132.07850074768066 }, { "epoch": 81, "train_loss": 5.338647942352295, "train_acc": 0.00896, "test_loss": 4.738301519775391, "test_acc": 0.01, "lyapunov": 1.563378708441849, "grad_norm": 0.15920625845312916, "grad_max_sv": 0.012282294360920787, "grad_min_sv": 0.0, "grad_condition": 12282294360.920788, "lr": 0.00043733338321784746, "time_sec": 132.09186792373657 }, { "epoch": 82, "train_loss": 5.339479166107178, "train_acc": 0.0092, "test_loss": 4.714014392089844, "test_acc": 0.01, "lyapunov": 1.5639294709086113, "grad_norm": 0.1731138874132484, "grad_max_sv": 0.03721864921972155, "grad_min_sv": 0.0, "grad_condition": 37218649219.72156, "lr": 0.0004269584857187939, "time_sec": 132.1542615890503 }, { "epoch": 83, "train_loss": 5.345089318237305, "train_acc": 0.00928, "test_loss": 4.7151237457275395, "test_acc": 0.01, "lyapunov": 1.5680857643751842, "grad_norm": 0.1866415261285155, "grad_max_sv": 0.03729230999015272, "grad_min_sv": 0.0, "grad_condition": 37292309990.152725, "lr": 0.0004166156266419484, "time_sec": 132.18493914604187 }, { "epoch": 84, "train_loss": 5.345381183319092, "train_acc": 0.00918, "test_loss": 4.68825431060791, "test_acc": 0.01, "lyapunov": 1.568592563309633, "grad_norm": 0.1882901347639973, "grad_max_sv": 0.021022121235728265, "grad_min_sv": 0.0, "grad_condition": 21022121235.728264, "lr": 0.0004063093427071373, "time_sec": 132.12367796897888 }, { "epoch": 85, "train_loss": 5.340999842681884, "train_acc": 0.00992, "test_loss": 4.716685279846192, "test_acc": 0.01, "lyapunov": 1.5657545608632706, "grad_norm": 0.20177951961733773, "grad_max_sv": 0.01230331021361053, "grad_min_sv": 0.0, "grad_condition": 12303310213.610529, "lr": 0.0003960441545911199, "time_sec": 132.0947766304016 }, { "epoch": 86, "train_loss": 5.344697039794922, "train_acc": 0.00906, "test_loss": 4.770621002197266, "test_acc": 0.01, "lyapunov": 1.5692900818632083, "grad_norm": 0.20891700571465235, "grad_max_sv": 0.013876684103161096, "grad_min_sv": 0.0, "grad_condition": 13876684103.161098, "lr": 0.0003858245649446718, "time_sec": 132.09650421142578 }, { "epoch": 87, "train_loss": 5.346022133178711, "train_acc": 0.00958, "test_loss": 4.825743739318848, "test_acc": 0.01, "lyapunov": 1.5695690389179513, "grad_norm": 0.23167422762918993, "grad_max_sv": 0.0037465339992195368, "grad_min_sv": 0.0, "grad_condition": 3746533999.219537, "lr": 0.00037565505641757235, "time_sec": 132.0917444229126 }, { "epoch": 88, "train_loss": 5.346828841705323, "train_acc": 0.00876, "test_loss": 4.960531255340576, "test_acc": 0.01, "lyapunov": 1.5696865573258656, "grad_norm": 0.1785675731490032, "grad_max_sv": 0.005577366659417748, "grad_min_sv": 0.0, "grad_condition": 5577366659.417749, "lr": 0.00036554008969236695, "time_sec": 132.0870282649994 }, { "epoch": 89, "train_loss": 5.342154947357177, "train_acc": 0.00878, "test_loss": 4.975327129364014, "test_acc": 0.01, "lyapunov": 1.5665336716205567, "grad_norm": 0.16793525655934358, "grad_max_sv": 0.00797480964101851, "grad_min_sv": 0.0, "grad_condition": 7974809641.018509, "lr": 0.0003554841015277638, "time_sec": 132.12742161750793 }, { "epoch": 90, "train_loss": 5.346710361175537, "train_acc": 0.00918, "test_loss": 4.953879835510254, "test_acc": 0.01, "lyapunov": 1.5700483614831324, "grad_norm": 0.18433712454121046, "grad_max_sv": 0.012014600727707148, "grad_min_sv": 0.0, "grad_condition": 12014600727.707148, "lr": 0.000345491502812526, "time_sec": 132.0858714580536 }, { "epoch": 91, "train_loss": 5.341808082733154, "train_acc": 0.00856, "test_loss": 5.010934870910645, "test_acc": 0.01, "lyapunov": 1.566529265754973, "grad_norm": 0.1758408454253638, "grad_max_sv": 0.003343093441799283, "grad_min_sv": 0.0, "grad_condition": 3343093441.799283, "lr": 0.0003355666766307081, "time_sec": 132.0660150051117 }, { "epoch": 92, "train_loss": 5.351253204956055, "train_acc": 0.00918, "test_loss": 5.023424221801758, "test_acc": 0.01, "lyapunov": 1.5723978284069948, "grad_norm": 0.17788255301821657, "grad_max_sv": 0.014162034029141068, "grad_min_sv": 0.0, "grad_condition": 14162034029.141071, "lr": 0.00032571397633909225, "time_sec": 132.10221076011658 }, { "epoch": 93, "train_loss": 5.347586841278076, "train_acc": 0.00884, "test_loss": 4.963154336547851, "test_acc": 0.01, "lyapunov": 1.5719817017045472, "grad_norm": 0.2369860248003482, "grad_max_sv": 0.004905311437323689, "grad_min_sv": 0.0, "grad_condition": 4905311437.323689, "lr": 0.00031593772365766094, "time_sec": 132.1323049068451 }, { "epoch": 94, "train_loss": 5.343141855926514, "train_acc": 0.00848, "test_loss": 4.921149578094482, "test_acc": 0.01, "lyapunov": 1.5679576765850682, "grad_norm": 0.1602509536119079, "grad_max_sv": 0.019888732209801675, "grad_min_sv": 0.0, "grad_condition": 19888732209.801674, "lr": 0.0003062422067739483, "time_sec": 132.1422688961029 }, { "epoch": 95, "train_loss": 5.343594031066894, "train_acc": 0.00906, "test_loss": 4.905448650360108, "test_acc": 0.01, "lyapunov": 1.5682554074260584, "grad_norm": 0.17541418565565223, "grad_max_sv": 0.009854677692055702, "grad_min_sv": 0.0, "grad_condition": 9854677692.055702, "lr": 0.00029663167846209965, "time_sec": 132.11462831497192 }, { "epoch": 96, "train_loss": 5.341661099700928, "train_acc": 0.00938, "test_loss": 4.896561671447754, "test_acc": 0.01, "lyapunov": 1.566467627539964, "grad_norm": 0.18126299601196125, "grad_max_sv": 0.013893446559086442, "grad_min_sv": 0.0, "grad_condition": 13893446559.086445, "lr": 0.00028711035421746345, "time_sec": 132.183189868927 }, { "epoch": 97, "train_loss": 5.341162901000977, "train_acc": 0.00872, "test_loss": 4.906980642700195, "test_acc": 0.01, "lyapunov": 1.5660171655132948, "grad_norm": 0.18389173404235654, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 132.1316442489624 }, { "epoch": 98, "train_loss": 5.340904234008789, "train_acc": 0.0087, "test_loss": 4.880604965209961, "test_acc": 0.01, "lyapunov": 1.5657722669489242, "grad_norm": 0.16941469287847527, "grad_max_sv": 0.0025681605096906424, "grad_min_sv": 0.0, "grad_condition": 2568160509.6906424, "lr": 0.00026835198244006903, "time_sec": 132.0789442062378 }, { "epoch": 99, "train_loss": 5.342495626068115, "train_acc": 0.00838, "test_loss": 4.8667546737670895, "test_acc": 0.01, "lyapunov": 1.56737110986734, "grad_norm": 0.2098824320936581, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 132.06338381767273 }, { "epoch": 100, "train_loss": 5.341140549468994, "train_acc": 0.00882, "test_loss": 4.923036535644531, "test_acc": 0.01, "lyapunov": 1.5660716353170097, "grad_norm": 0.16309007942968, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 132.0798683166504 }, { "epoch": 101, "train_loss": 5.367573778076172, "train_acc": 0.00942, "test_loss": 4.8419834274291995, "test_acc": 0.01, "lyapunov": 1.5839073743356769, "grad_norm": 0.17849770970668777, "grad_max_sv": 0.006972884247079492, "grad_min_sv": 0.0, "grad_condition": 6972884247.079493, "lr": 0.00024098649531343477, "time_sec": 132.07039666175842 }, { "epoch": 102, "train_loss": 5.3430040219116215, "train_acc": 0.00878, "test_loss": 4.867986113739014, "test_acc": 0.01, "lyapunov": 1.5680094472587567, "grad_norm": 0.17231990573343864, "grad_max_sv": 0.002580128749832511, "grad_min_sv": 0.0, "grad_condition": 2580128749.832511, "lr": 0.0002320866025105016, "time_sec": 132.0873384475708 }, { "epoch": 103, "train_loss": 5.342889985504151, "train_acc": 0.00874, "test_loss": 4.840346334075928, "test_acc": 0.01, "lyapunov": 1.5678095716954497, "grad_norm": 0.18603931144131847, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 132.0669243335724 }, { "epoch": 104, "train_loss": 5.345595389709473, "train_acc": 0.00906, "test_loss": 4.82763256072998, "test_acc": 0.01, "lyapunov": 1.5700134941379127, "grad_norm": 0.17962506167998699, "grad_max_sv": 0.0006658073514699935, "grad_min_sv": 0.0, "grad_condition": 665807351.4699936, "lr": 0.000214643216157784, "time_sec": 132.0985701084137 }, { "epoch": 105, "train_loss": 5.354534033508301, "train_acc": 0.00898, "test_loss": 4.813229525756836, "test_acc": 0.01, "lyapunov": 1.5754887292452175, "grad_norm": 0.2002013331480914, "grad_max_sv": 0.004350297572091222, "grad_min_sv": 0.0, "grad_condition": 4350297572.091222, "lr": 0.00020610737385376332, "time_sec": 132.09686851501465 }, { "epoch": 106, "train_loss": 5.3426032342529295, "train_acc": 0.00804, "test_loss": 4.823688924407959, "test_acc": 0.01, "lyapunov": 1.567502071485495, "grad_norm": 0.177797147662824, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 132.1264684200287 }, { "epoch": 107, "train_loss": 5.349622652893067, "train_acc": 0.00884, "test_loss": 4.844220027923584, "test_acc": 0.01, "lyapunov": 1.571947547176, "grad_norm": 0.16292252305474791, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 132.10880613327026 }, { "epoch": 108, "train_loss": 5.345900168304444, "train_acc": 0.00918, "test_loss": 4.840348344421387, "test_acc": 0.01, "lyapunov": 1.5703127265281385, "grad_norm": 0.17468920430563006, "grad_max_sv": 0.0029470635578036307, "grad_min_sv": 0.0, "grad_condition": 2947063557.803631, "lr": 0.000181288005125655, "time_sec": 132.11736822128296 }, { "epoch": 109, "train_loss": 5.345384422454834, "train_acc": 0.00874, "test_loss": 4.8622421981811526, "test_acc": 0.01, "lyapunov": 1.5698327935870042, "grad_norm": 0.21177276682423293, "grad_max_sv": 0.0007724121678620577, "grad_min_sv": 0.0, "grad_condition": 772412167.8620577, "lr": 0.0001732896980049473, "time_sec": 132.07746076583862 }, { "epoch": 110, "train_loss": 5.342875657653809, "train_acc": 0.00912, "test_loss": 4.856573393249512, "test_acc": 0.01, "lyapunov": 1.5677888875117387, "grad_norm": 0.16084383685322373, "grad_max_sv": 0.013493797415867448, "grad_min_sv": 0.0, "grad_condition": 13493797415.867447, "lr": 0.00016543469682057076, "time_sec": 132.08074021339417 }, { "epoch": 111, "train_loss": 5.355080330505371, "train_acc": 0.00822, "test_loss": 4.830239296722412, "test_acc": 0.01, "lyapunov": 1.5756983775312028, "grad_norm": 0.1959747570871713, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 132.07752227783203 }, { "epoch": 112, "train_loss": 5.342228624572754, "train_acc": 0.00892, "test_loss": 4.84301993560791, "test_acc": 0.01, "lyapunov": 1.5673401697212472, "grad_norm": 0.14204259013530204, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 132.06180357933044 }, { "epoch": 113, "train_loss": 5.3422714726257325, "train_acc": 0.00928, "test_loss": 4.821010319519043, "test_acc": 0.01, "lyapunov": 1.5673690311744084, "grad_norm": 0.1572610072392831, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 132.09343099594116 }, { "epoch": 114, "train_loss": 5.3444528672790526, "train_acc": 0.0086, "test_loss": 4.83043311843872, "test_acc": 0.01, "lyapunov": 1.5691952199277366, "grad_norm": 0.15397404749427382, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 132.07117557525635 }, { "epoch": 115, "train_loss": 5.342576068572998, "train_acc": 0.00892, "test_loss": 4.83036664352417, "test_acc": 0.01, "lyapunov": 1.5677011345353578, "grad_norm": 0.13531666387620547, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 132.1246190071106 }, { "epoch": 116, "train_loss": 5.342390079040527, "train_acc": 0.009, "test_loss": 4.818707986450195, "test_acc": 0.01, "lyapunov": 1.5674945427023845, "grad_norm": 0.11755267765049923, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 132.10427331924438 }, { "epoch": 117, "train_loss": 5.346578267517089, "train_acc": 0.00914, "test_loss": 4.808753877258301, "test_acc": 0.01, "lyapunov": 1.571015379617891, "grad_norm": 0.14739866079910954, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 132.09667372703552 }, { "epoch": 118, "train_loss": 5.341421314849853, "train_acc": 0.00888, "test_loss": 4.8178321044921875, "test_acc": 0.01, "lyapunov": 1.5664617289667544, "grad_norm": 0.15196598686273202, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 132.09818243980408 }, { "epoch": 119, "train_loss": 5.342278069915771, "train_acc": 0.00846, "test_loss": 4.809390866088867, "test_acc": 0.01, "lyapunov": 1.5673773797881572, "grad_norm": 0.17015255493793316, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 132.13357877731323 }, { "epoch": 120, "train_loss": 5.341155296783447, "train_acc": 0.00878, "test_loss": 4.819783433532715, "test_acc": 0.01, "lyapunov": 1.56620217955021, "grad_norm": 0.13456226708171515, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 132.0805094242096 }, { "epoch": 121, "train_loss": 5.344341220397949, "train_acc": 0.00942, "test_loss": 4.812504239654541, "test_acc": 0.01, "lyapunov": 1.5690714410503808, "grad_norm": 0.15635175889858405, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 132.10770106315613 }, { "epoch": 122, "train_loss": 5.341316756591797, "train_acc": 0.00872, "test_loss": 4.791230865478516, "test_acc": 0.01, "lyapunov": 1.5663795004720273, "grad_norm": 0.13120586242402146, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 132.12851881980896 }, { "epoch": 123, "train_loss": 5.343846289520264, "train_acc": 0.00826, "test_loss": 4.791252892303467, "test_acc": 0.01, "lyapunov": 1.5686628943514032, "grad_norm": 0.12574649548787997, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 132.11882972717285 }, { "epoch": 124, "train_loss": 5.341886834716797, "train_acc": 0.00924, "test_loss": 4.7894229957580565, "test_acc": 0.01, "lyapunov": 1.566991005712153, "grad_norm": 0.12125233233583547, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 132.1242277622223 }, { "epoch": 125, "train_loss": 5.341545905151367, "train_acc": 0.00844, "test_loss": 4.781455255126953, "test_acc": 0.01, "lyapunov": 1.566652334559604, "grad_norm": 0.11877593044343822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 132.1204969882965 }, { "epoch": 126, "train_loss": 5.343738833465576, "train_acc": 0.0089, "test_loss": 4.782108512115479, "test_acc": 0.01, "lyapunov": 1.5686877148840435, "grad_norm": 0.14685494918897216, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 132.1582751274109 }, { "epoch": 127, "train_loss": 5.340985955505371, "train_acc": 0.0095, "test_loss": 4.780940398406982, "test_acc": 0.01, "lyapunov": 1.5660363987583639, "grad_norm": 0.11589911056077733, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 132.11265683174133 }, { "epoch": 128, "train_loss": 5.343754200744629, "train_acc": 0.00968, "test_loss": 4.7895281066894535, "test_acc": 0.01, "lyapunov": 1.5686014985184535, "grad_norm": 0.14358686229070586, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 132.08578968048096 }, { "epoch": 129, "train_loss": 5.345564033660889, "train_acc": 0.00894, "test_loss": 4.789863642883301, "test_acc": 0.01, "lyapunov": 1.5702618372714734, "grad_norm": 0.15311883643219684, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 132.07862830162048 }, { "epoch": 130, "train_loss": 5.342584033355713, "train_acc": 0.00908, "test_loss": 4.779020539093017, "test_acc": 0.01, "lyapunov": 1.5677639367940175, "grad_norm": 0.15329364714098923, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 132.16318249702454 }, { "epoch": 131, "train_loss": 5.341682634429931, "train_acc": 0.00944, "test_loss": 4.782007501220703, "test_acc": 0.01, "lyapunov": 1.5667803564949718, "grad_norm": 0.13761474702045567, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 132.10979580879211 }, { "epoch": 132, "train_loss": 5.342693343200684, "train_acc": 0.00874, "test_loss": 4.785680311584473, "test_acc": 0.01, "lyapunov": 1.5677480008596045, "grad_norm": 0.14227357176692468, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 132.14933609962463 }, { "epoch": 133, "train_loss": 5.339641748504639, "train_acc": 0.00948, "test_loss": 4.7827409004211425, "test_acc": 0.01, "lyapunov": 1.5646268839726363, "grad_norm": 0.11276908599413558, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 132.07238721847534 }, { "epoch": 134, "train_loss": 5.341200107269287, "train_acc": 0.00926, "test_loss": 4.787122599792481, "test_acc": 0.01, "lyapunov": 1.566309593217757, "grad_norm": 0.11577298218878175, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 132.08721160888672 }, { "epoch": 135, "train_loss": 5.341790512847901, "train_acc": 0.0089, "test_loss": 4.78599192199707, "test_acc": 0.01, "lyapunov": 1.5669051058152144, "grad_norm": 0.11406538673568321, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 132.13204169273376 }, { "epoch": 136, "train_loss": 5.342709656066894, "train_acc": 0.0095, "test_loss": 4.784429030609131, "test_acc": 0.01, "lyapunov": 1.5678098799322573, "grad_norm": 0.1301621255904577, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 132.10533571243286 }, { "epoch": 137, "train_loss": 5.341824940795899, "train_acc": 0.00922, "test_loss": 4.7872933067321775, "test_acc": 0.01, "lyapunov": 1.5669465708305768, "grad_norm": 0.11590542924579983, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 132.09704732894897 }, { "epoch": 138, "train_loss": 5.341511313171386, "train_acc": 0.00974, "test_loss": 4.7792837577819824, "test_acc": 0.01, "lyapunov": 1.5666430996507026, "grad_norm": 0.11256165029712978, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 132.12034392356873 }, { "epoch": 139, "train_loss": 5.341457148132324, "train_acc": 0.00972, "test_loss": 4.780789426422119, "test_acc": 0.01, "lyapunov": 1.5665654376949496, "grad_norm": 0.10204898242159913, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 132.14241123199463 }, { "epoch": 140, "train_loss": 5.3405984710693355, "train_acc": 0.00948, "test_loss": 4.778655993652344, "test_acc": 0.01, "lyapunov": 1.5656854539271206, "grad_norm": 0.12809073544865285, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 132.08009314537048 }, { "epoch": 141, "train_loss": 5.340534744262695, "train_acc": 0.0091, "test_loss": 4.780472738647461, "test_acc": 0.01, "lyapunov": 1.5655692928587384, "grad_norm": 0.10313184635997721, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 132.0838325023651 }, { "epoch": 142, "train_loss": 5.340677046051026, "train_acc": 0.00992, "test_loss": 4.781814497375488, "test_acc": 0.01, "lyapunov": 1.5657385788915101, "grad_norm": 0.10334450883525552, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 132.11706686019897 }, { "epoch": 143, "train_loss": 5.341100224914551, "train_acc": 0.01, "test_loss": 4.7812304672241215, "test_acc": 0.01, "lyapunov": 1.5661775379839455, "grad_norm": 0.1264085338408933, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 132.12464785575867 }, { "epoch": 144, "train_loss": 5.341793058776855, "train_acc": 0.01, "test_loss": 4.78042247467041, "test_acc": 0.01, "lyapunov": 1.5669281586356785, "grad_norm": 0.09436149541511535, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 132.1470422744751 }, { "epoch": 145, "train_loss": 5.349506974182129, "train_acc": 0.01, "test_loss": 4.78042266998291, "test_acc": 0.01, "lyapunov": 1.5731076300906404, "grad_norm": 0.1178995174742038, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 132.09918355941772 }, { "epoch": 146, "train_loss": 5.342189108886719, "train_acc": 0.01, "test_loss": 4.781454308319092, "test_acc": 0.01, "lyapunov": 1.5673414352909683, "grad_norm": 0.09081347881139741, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 132.10713911056519 }, { "epoch": 147, "train_loss": 5.341546408996582, "train_acc": 0.01, "test_loss": 4.781454162597656, "test_acc": 0.01, "lyapunov": 1.5666629228445574, "grad_norm": 0.09019678612458548, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 132.1311194896698 }, { "epoch": 148, "train_loss": 5.341715382995606, "train_acc": 0.01, "test_loss": 4.782687770843506, "test_acc": 0.01, "lyapunov": 1.5668335332894874, "grad_norm": 0.09070167126439822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 132.13174676895142 }, { "epoch": 149, "train_loss": 5.342021694946289, "train_acc": 0.01, "test_loss": 4.782687942504883, "test_acc": 0.01, "lyapunov": 1.5671642540056077, "grad_norm": 0.09082797851606526, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 132.09515190124512 }, { "epoch": 150, "train_loss": 5.339607263183594, "train_acc": 0.01, "test_loss": 4.782687832641601, "test_acc": 0.01, "lyapunov": 1.5645978752609409, "grad_norm": 0.090368422289998, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 132.06873154640198 } ], "16": [ { "epoch": 1, "train_loss": 5.170418347930908, "train_acc": 0.01482, "test_loss": 4.874806223297119, "test_acc": 0.0107, "lyapunov": 2.4393880626429683, "grad_norm": 5.345734057581178, "grad_max_sv": 4.483905690908432, "grad_min_sv": 8.954973220731688e-08, "grad_condition": 129025189.7290709, "lr": 0.0009998903417374227, "time_sec": 177.46578431129456 }, { "epoch": 2, "train_loss": 4.886182316741944, "train_acc": 0.01718, "test_loss": 4.80269637298584, "test_acc": 0.0102, "lyapunov": 1.9971744041613606, "grad_norm": 3.4433992950689616, "grad_max_sv": 2.739058768749237, "grad_min_sv": 5.745658385736263e-08, "grad_condition": 84538548.49489692, "lr": 0.0009995614150494292, "time_sec": 177.3906273841858 }, { "epoch": 3, "train_loss": 4.783107050323486, "train_acc": 0.01528, "test_loss": 4.738721482086182, "test_acc": 0.01, "lyapunov": 1.8048184826550886, "grad_norm": 2.047885898328211, "grad_max_sv": 1.4787879481911659, "grad_min_sv": 3.2768289852033726e-08, "grad_condition": 566050825.5696664, "lr": 0.0009990133642141358, "time_sec": 177.4175295829773 }, { "epoch": 4, "train_loss": 4.751416029052734, "train_acc": 0.01606, "test_loss": 4.630446166992187, "test_acc": 0.01, "lyapunov": 1.707960840991086, "grad_norm": 1.4476075782979456, "grad_max_sv": 0.836699303984642, "grad_min_sv": 1.4332362594222718e-08, "grad_condition": 24679971260.08811, "lr": 0.0009982464296247522, "time_sec": 177.5156271457672 }, { "epoch": 5, "train_loss": 4.7807122309875485, "train_acc": 0.01428, "test_loss": 4.622669477844238, "test_acc": 0.01, "lyapunov": 1.7041781695602496, "grad_norm": 1.050316146928851, "grad_max_sv": 0.498383151658345, "grad_min_sv": 3.796087105340611e-11, "grad_condition": 139863529616.57062, "lr": 0.0009972609476841367, "time_sec": 177.43440508842468 }, { "epoch": 6, "train_loss": 4.8388256774902345, "train_acc": 0.01308, "test_loss": 4.649810864257812, "test_acc": 0.01, "lyapunov": 1.6965309613196136, "grad_norm": 0.6788898927695144, "grad_max_sv": 0.42595611810684203, "grad_min_sv": 1.5628448124239113e-12, "grad_condition": 206494283007.18826, "lr": 0.000996057350657239, "time_sec": 177.44785737991333 }, { "epoch": 7, "train_loss": 4.8986459965515134, "train_acc": 0.01186, "test_loss": 4.708990380859375, "test_acc": 0.01, "lyapunov": 1.7017012535763518, "grad_norm": 0.48731250728585107, "grad_max_sv": 0.33343438915908336, "grad_min_sv": 5.53908882765212e-13, "grad_condition": 254093723126.4781, "lr": 0.000994636166481494, "time_sec": 177.37777757644653 }, { "epoch": 8, "train_loss": 4.943858919830323, "train_acc": 0.01104, "test_loss": 5.26636118927002, "test_acc": 0.01, "lyapunov": 1.7182561540237777, "grad_norm": 0.48999999014626605, "grad_max_sv": 0.25608402006328107, "grad_min_sv": 9.286946471073546e-14, "grad_condition": 242351728116.98883, "lr": 0.0009929980185352525, "time_sec": 177.387188911438 }, { "epoch": 9, "train_loss": 4.979513124542236, "train_acc": 0.01144, "test_loss": 5.497952555084228, "test_acc": 0.01, "lyapunov": 1.7062027213518576, "grad_norm": 0.42079758157884545, "grad_max_sv": 0.2485219370573759, "grad_min_sv": 1.885935727798404e-14, "grad_condition": 245798317000.96808, "lr": 0.0009911436253643444, "time_sec": 177.38124251365662 }, { "epoch": 10, "train_loss": 5.0166656953430175, "train_acc": 0.01076, "test_loss": 4.605617906188965, "test_acc": 0.01, "lyapunov": 1.6932507491172732, "grad_norm": 0.420321050632811, "grad_max_sv": 0.2404270452912897, "grad_min_sv": 9.577507932467198e-25, "grad_condition": 240427045291.03647, "lr": 0.0009890738003669028, "time_sec": 177.3316354751587 }, { "epoch": 11, "train_loss": 5.0578450691223145, "train_acc": 0.0114, "test_loss": 4.605764473724365, "test_acc": 0.01, "lyapunov": 1.6895873580137482, "grad_norm": 0.49178900029145406, "grad_max_sv": 0.26607779785990715, "grad_min_sv": 5.082064100170326e-21, "grad_condition": 266077796409.95917, "lr": 0.00098678945143658, "time_sec": 177.35666227340698 }, { "epoch": 12, "train_loss": 5.092576569976806, "train_acc": 0.01182, "test_loss": 4.60662777633667, "test_acc": 0.01, "lyapunov": 1.6848897119922102, "grad_norm": 0.6934058402651867, "grad_max_sv": 0.34772998839616776, "grad_min_sv": 1.6804705504564466e-13, "grad_condition": 311062929805.2175, "lr": 0.0009842915805643154, "time_sec": 177.45647644996643 }, { "epoch": 13, "train_loss": 5.15109172531128, "train_acc": 0.01186, "test_loss": 4.608129429626465, "test_acc": 0.01, "lyapunov": 1.7015191944663788, "grad_norm": 0.6846074227630976, "grad_max_sv": 0.32766890451312064, "grad_min_sv": 2.4578391875654614e-18, "grad_condition": 327668018219.02893, "lr": 0.000981581283398829, "time_sec": 177.36489033699036 }, { "epoch": 14, "train_loss": 5.2939554736328125, "train_acc": 0.0105, "test_loss": 5.4404556137084965, "test_acc": 0.01, "lyapunov": 1.733636704247321, "grad_norm": 2.0585577176009484, "grad_max_sv": 0.5351610340178012, "grad_min_sv": 6.043698563311623e-09, "grad_condition": 125123088585.82278, "lr": 0.0009786597487660333, "time_sec": 177.41271114349365 }, { "epoch": 15, "train_loss": 5.339356228485108, "train_acc": 0.01, "test_loss": 5.634622732543946, "test_acc": 0.01, "lyapunov": 1.7321220276605747, "grad_norm": 1.2474576611019448, "grad_max_sv": 0.5749046392738819, "grad_min_sv": 7.0887550281236514e-09, "grad_condition": 17881232094.586456, "lr": 0.0009755282581475766, "time_sec": 177.42803382873535 }, { "epoch": 16, "train_loss": 5.213154935302734, "train_acc": 0.00934, "test_loss": 5.393290295410156, "test_acc": 0.01, "lyapunov": 1.5737932243615465, "grad_norm": 0.46647750812487915, "grad_max_sv": 0.27153575848788025, "grad_min_sv": 1.5242528473500716e-09, "grad_condition": 77568831402.5238, "lr": 0.0009721881851187403, "time_sec": 177.44743824005127 }, { "epoch": 17, "train_loss": 5.262427766418457, "train_acc": 0.01022, "test_loss": 4.925324077606201, "test_acc": 0.01, "lyapunov": 1.5760375502164408, "grad_norm": 0.6268713729269668, "grad_max_sv": 0.37553633116185664, "grad_min_sv": 3.283041272093994e-09, "grad_condition": 31488669291.59237, "lr": 0.0009686409947459456, "time_sec": 177.47271943092346 }, { "epoch": 18, "train_loss": 5.289855928497315, "train_acc": 0.009, "test_loss": 5.166483688354492, "test_acc": 0.01, "lyapunov": 1.5759224303238226, "grad_norm": 0.4193761222715419, "grad_max_sv": 0.26443815175443885, "grad_min_sv": 1.8233460938992724e-09, "grad_condition": 83574980362.08054, "lr": 0.0009648882429441254, "time_sec": 177.47960138320923 }, { "epoch": 19, "train_loss": 5.3201322650146485, "train_acc": 0.0104, "test_loss": 5.085500339508057, "test_acc": 0.01, "lyapunov": 1.5752660103161316, "grad_norm": 0.35145865174653673, "grad_max_sv": 0.1685528600588441, "grad_min_sv": 5.831233779827688e-12, "grad_condition": 106917248964.36707, "lr": 0.00096093157579425, "time_sec": 177.47897052764893 }, { "epoch": 20, "train_loss": 5.3543471484375, "train_acc": 0.00944, "test_loss": 5.246659634399414, "test_acc": 0.01, "lyapunov": 1.575355000812989, "grad_norm": 0.5222583225299012, "grad_max_sv": 0.10507027432322502, "grad_min_sv": 7.849948703277934e-12, "grad_condition": 72947428086.86752, "lr": 0.0009567727288213001, "time_sec": 177.43105292320251 }, { "epoch": 21, "train_loss": 5.354224435882569, "train_acc": 0.00964, "test_loss": 5.22655355682373, "test_acc": 0.01, "lyapunov": 1.577795330520786, "grad_norm": 1.7696193327514464, "grad_max_sv": 0.04788816105574369, "grad_min_sv": 3.098440861051027e-15, "grad_condition": 47515160306.08334, "lr": 0.0009524135262330095, "time_sec": 177.38868117332458 }, { "epoch": 22, "train_loss": 5.359287767486572, "train_acc": 0.00866, "test_loss": 5.144994302368164, "test_acc": 0.01, "lyapunov": 1.5772388463130083, "grad_norm": 0.521407113480236, "grad_max_sv": 0.16268486455082892, "grad_min_sv": 1.0480323490539272e-12, "grad_condition": 114294670712.50664, "lr": 0.0009478558801197061, "time_sec": 177.4581241607666 }, { "epoch": 23, "train_loss": 5.359366517028809, "train_acc": 0.00984, "test_loss": 5.14449934387207, "test_acc": 0.01, "lyapunov": 1.5788166193705995, "grad_norm": 0.47520625785430726, "grad_max_sv": 0.14188788905739785, "grad_min_sv": 7.763794243203392e-13, "grad_condition": 90263258979.91963, "lr": 0.000943101789615607, "time_sec": 177.4587037563324 }, { "epoch": 24, "train_loss": 5.363788315887451, "train_acc": 0.00998, "test_loss": 5.219554689025879, "test_acc": 0.01, "lyapunov": 1.5823031307181434, "grad_norm": 0.45933897983850147, "grad_max_sv": 0.1220944058150053, "grad_min_sv": 8.70957522797587e-13, "grad_condition": 79316477379.01375, "lr": 0.0009381533400219313, "time_sec": 177.45913338661194 }, { "epoch": 25, "train_loss": 5.365634008026123, "train_acc": 0.0094, "test_loss": 5.931232183074951, "test_acc": 0.01, "lyapunov": 1.5886532437161107, "grad_norm": 0.43344753842757794, "grad_max_sv": 0.017200349643826485, "grad_min_sv": 1.0856606585118899e-15, "grad_condition": 17078915149.903616, "lr": 0.0009330127018922189, "time_sec": 177.41433334350586 }, { "epoch": 26, "train_loss": 5.356309142761231, "train_acc": 0.00862, "test_loss": 5.939939945220948, "test_acc": 0.01, "lyapunov": 1.5817654276138071, "grad_norm": 0.3773119512884375, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000927682130080253, "time_sec": 177.42445373535156 }, { "epoch": 27, "train_loss": 5.356818426208496, "train_acc": 0.00902, "test_loss": 6.903866325378418, "test_acc": 0.01, "lyapunov": 1.5823859988576006, "grad_norm": 0.4182139130247132, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009221639627510072, "time_sec": 177.31799745559692 }, { "epoch": 28, "train_loss": 5.391271570739746, "train_acc": 0.00976, "test_loss": 5.460548217773438, "test_acc": 0.01, "lyapunov": 1.5841533107220973, "grad_norm": 0.523477636772141, "grad_max_sv": 0.3192333810031414, "grad_min_sv": 2.9275436547182563e-09, "grad_condition": 203519819.7178569, "lr": 0.0009164606203550494, "time_sec": 177.46226978302002 }, { "epoch": 29, "train_loss": 5.375988426361084, "train_acc": 0.00942, "test_loss": 5.342045057678223, "test_acc": 0.01, "lyapunov": 1.584143414521766, "grad_norm": 0.4275297259535999, "grad_max_sv": 0.29515107311308386, "grad_min_sv": 1.5519966579252698e-09, "grad_condition": 5083754884.994722, "lr": 0.0009105746045668516, "time_sec": 177.49048447608948 }, { "epoch": 30, "train_loss": 5.3762526119995115, "train_acc": 0.00992, "test_loss": 5.335840890502929, "test_acc": 0.01, "lyapunov": 1.5899017634599104, "grad_norm": 0.46512305667247905, "grad_max_sv": 0.24659424126148224, "grad_min_sv": 2.2743761505509726e-12, "grad_condition": 128688559196.96506, "lr": 0.0009045084971874733, "time_sec": 177.4821593761444 }, { "epoch": 31, "train_loss": 5.376188383178711, "train_acc": 0.00954, "test_loss": 5.376922852325439, "test_acc": 0.01, "lyapunov": 1.5906847974528437, "grad_norm": 0.40698064884293045, "grad_max_sv": 0.2344340980052948, "grad_min_sv": 1.6077615594515009e-12, "grad_condition": 119697955045.46411, "lr": 0.0008982649590120977, "time_sec": 177.51625323295593 }, { "epoch": 32, "train_loss": 5.373684441070557, "train_acc": 0.00944, "test_loss": 5.2473334838867185, "test_acc": 0.01, "lyapunov": 1.5879211066019199, "grad_norm": 0.3720940356738668, "grad_max_sv": 0.20825780294835566, "grad_min_sv": 3.7871002154344376e-10, "grad_condition": 69233328517.31859, "lr": 0.0008918467286629196, "time_sec": 177.5158429145813 }, { "epoch": 33, "train_loss": 5.369580058288574, "train_acc": 0.00906, "test_loss": 5.292366073608399, "test_acc": 0.01, "lyapunov": 1.5872128549439217, "grad_norm": 0.36741579981339867, "grad_max_sv": 0.16275404021143913, "grad_min_sv": 3.5290433862002075e-13, "grad_condition": 135525270524.32925, "lr": 0.0008852566213878943, "time_sec": 177.54218769073486 }, { "epoch": 34, "train_loss": 5.364965376129151, "train_acc": 0.00946, "test_loss": 5.301969288635254, "test_acc": 0.01, "lyapunov": 1.5879910906867298, "grad_norm": 0.40385833520326136, "grad_max_sv": 0.09459194829687476, "grad_min_sv": 2.8168103316895143e-14, "grad_condition": 90889833007.94754, "lr": 0.000878497527825878, "time_sec": 177.56994581222534 }, { "epoch": 35, "train_loss": 5.367663076019287, "train_acc": 0.01036, "test_loss": 5.347993537902832, "test_acc": 0.01, "lyapunov": 1.5875165621033105, "grad_norm": 0.3132720633072883, "grad_max_sv": 0.1425728589296341, "grad_min_sv": 2.007235616198558e-14, "grad_condition": 139708753283.34723, "lr": 0.000871572412738697, "time_sec": 177.49852347373962 }, { "epoch": 36, "train_loss": 5.370810558624267, "train_acc": 0.01022, "test_loss": 5.382797595214844, "test_acc": 0.01, "lyapunov": 1.5899634550294608, "grad_norm": 0.30370352801828593, "grad_max_sv": 0.16092172265052795, "grad_min_sv": 4.485897177730539e-14, "grad_condition": 154470905347.59918, "lr": 0.0008644843137107055, "time_sec": 177.4556074142456 }, { "epoch": 37, "train_loss": 5.384568545379639, "train_acc": 0.01018, "test_loss": 5.296823876953125, "test_acc": 0.01, "lyapunov": 1.5977905272217967, "grad_norm": 0.266373358722962, "grad_max_sv": 0.14979717023670674, "grad_min_sv": 7.171554109546675e-14, "grad_condition": 140879720678.9068, "lr": 0.0008572363398164014, "time_sec": 177.47119235992432 }, { "epoch": 38, "train_loss": 5.370039872131348, "train_acc": 0.01028, "test_loss": 5.444481262207031, "test_acc": 0.01, "lyapunov": 1.5899496447399755, "grad_norm": 0.3096876275058644, "grad_max_sv": 0.15369951017200947, "grad_min_sv": 9.48148632228887e-14, "grad_condition": 141735332362.74988, "lr": 0.0008498316702566826, "time_sec": 177.47467923164368 }, { "epoch": 39, "train_loss": 5.369657610778809, "train_acc": 0.01024, "test_loss": 5.390600685119629, "test_acc": 0.01, "lyapunov": 1.5896801790008155, "grad_norm": 0.3108555116352423, "grad_max_sv": 0.1614890903234482, "grad_min_sv": 9.349701492890973e-14, "grad_condition": 149566173130.64127, "lr": 0.0008422735529643442, "time_sec": 177.4328293800354 }, { "epoch": 40, "train_loss": 5.3822917242431645, "train_acc": 0.0093, "test_loss": 5.184299499511718, "test_acc": 0.01, "lyapunov": 1.6002484066102205, "grad_norm": 0.24882538015615607, "grad_max_sv": 0.04936090065166354, "grad_min_sv": 6.934642584876431e-15, "grad_condition": 48367763332.42686, "lr": 0.0008345653031794289, "time_sec": 177.37197065353394 }, { "epoch": 41, "train_loss": 5.373546744842529, "train_acc": 0.00964, "test_loss": 5.196872940063477, "test_acc": 0.01, "lyapunov": 1.5940455433047946, "grad_norm": 0.2191391775580976, "grad_max_sv": 0.09365939311683177, "grad_min_sv": 1.5882716898553207e-15, "grad_condition": 93493384840.27858, "lr": 0.0008267103019950526, "time_sec": 177.47450184822083 }, { "epoch": 42, "train_loss": 5.368149404144287, "train_acc": 0.00874, "test_loss": 5.14538009185791, "test_acc": 0.01, "lyapunov": 1.590694589383157, "grad_norm": 0.22212098932442453, "grad_max_sv": 0.10206865929067135, "grad_min_sv": 2.3133067448522557e-15, "grad_condition": 101840784421.61417, "lr": 0.0008187119948743447, "time_sec": 177.46074080467224 }, { "epoch": 43, "train_loss": 5.367429432983398, "train_acc": 0.00892, "test_loss": 5.233426832580567, "test_acc": 0.01, "lyapunov": 1.591343494327477, "grad_norm": 0.23543493742380756, "grad_max_sv": 0.08834987077862025, "grad_min_sv": 5.952270134521069e-16, "grad_condition": 88299394994.77124, "lr": 0.000810573890139155, "time_sec": 177.47843408584595 }, { "epoch": 44, "train_loss": 5.3674171057128905, "train_acc": 0.00878, "test_loss": 5.2093109710693355, "test_acc": 0.01, "lyapunov": 1.5915821013243303, "grad_norm": 0.1990598758819041, "grad_max_sv": 0.07391932224854827, "grad_min_sv": 4.4595190727564784e-24, "grad_condition": 73919322248.21725, "lr": 0.0008022995574311873, "time_sec": 177.49818992614746 }, { "epoch": 45, "train_loss": 5.367794494018555, "train_acc": 0.00928, "test_loss": 5.287538707733154, "test_acc": 0.01, "lyapunov": 1.5911102807125472, "grad_norm": 0.23659112992785783, "grad_max_sv": 0.0903646806254983, "grad_min_sv": 2.044203469301876e-16, "grad_condition": 90346621799.15851, "lr": 0.0007938926261462363, "time_sec": 177.41696000099182 }, { "epoch": 46, "train_loss": 5.376998851623535, "train_acc": 0.00968, "test_loss": 5.387116500854492, "test_acc": 0.01, "lyapunov": 1.5990899456736376, "grad_norm": 0.2197692685737557, "grad_max_sv": 0.09713525734841824, "grad_min_sv": 1.4019481757585365e-15, "grad_condition": 96996163686.28548, "lr": 0.0007853567838422158, "time_sec": 177.49049758911133 }, { "epoch": 47, "train_loss": 5.367403378448486, "train_acc": 0.00904, "test_loss": 5.152558483886719, "test_acc": 0.01, "lyapunov": 1.5909755915936912, "grad_norm": 0.20354351323110018, "grad_max_sv": 0.09671832993626595, "grad_min_sv": 1.7095434307863795e-15, "grad_condition": 96550067706.91704, "lr": 0.0007766957746216719, "time_sec": 177.440682888031 }, { "epoch": 48, "train_loss": 5.3691537622070316, "train_acc": 0.009, "test_loss": 5.103178468322754, "test_acc": 0.01, "lyapunov": 1.5926780014696633, "grad_norm": 0.20080565969562386, "grad_max_sv": 0.09486224502325058, "grad_min_sv": 1.5909231309062707e-15, "grad_condition": 94698098961.85327, "lr": 0.0007679133974894982, "time_sec": 177.45987153053284 }, { "epoch": 49, "train_loss": 5.367714106140137, "train_acc": 0.0093, "test_loss": 5.090968506622314, "test_acc": 0.01, "lyapunov": 1.5918231150683235, "grad_norm": 0.21785142639292177, "grad_max_sv": 0.08113837614655495, "grad_min_sv": 1.754494669434441e-20, "grad_condition": 81138374637.8342, "lr": 0.000759013504686565, "time_sec": 177.4056305885315 }, { "epoch": 50, "train_loss": 5.370782024841309, "train_acc": 0.00932, "test_loss": 5.1753190261840825, "test_acc": 0.01, "lyapunov": 1.5940865891059037, "grad_norm": 0.20444563688390227, "grad_max_sv": 0.07656172616407275, "grad_min_sv": 2.696277782642207e-17, "grad_condition": 76559876296.83813, "lr": 0.0007499999999999998, "time_sec": 177.39811301231384 }, { "epoch": 51, "train_loss": 5.368595368652343, "train_acc": 0.0093, "test_loss": 5.130212609863281, "test_acc": 0.01, "lyapunov": 1.5924014548206573, "grad_norm": 0.2110899983642968, "grad_max_sv": 0.09537852350622415, "grad_min_sv": 2.1267942984928308e-15, "grad_condition": 95172191574.00798, "lr": 0.0007408768370508575, "time_sec": 177.437908411026 }, { "epoch": 52, "train_loss": 5.368308511657715, "train_acc": 0.0095, "test_loss": 5.122430040740967, "test_acc": 0.01, "lyapunov": 1.5921837594503028, "grad_norm": 0.22274269152603762, "grad_max_sv": 0.09443439822643995, "grad_min_sv": 1.7298829634439422e-15, "grad_condition": 94273467470.68217, "lr": 0.0007316480175599307, "time_sec": 177.40578150749207 }, { "epoch": 53, "train_loss": 5.369929014434814, "train_acc": 0.01008, "test_loss": 5.085774603271484, "test_acc": 0.01, "lyapunov": 1.5937723787239446, "grad_norm": 0.20295993227713832, "grad_max_sv": 0.09454309139400721, "grad_min_sv": 6.450947046344728e-16, "grad_condition": 94479862712.68396, "lr": 0.0007223175895924635, "time_sec": 177.40152430534363 }, { "epoch": 54, "train_loss": 5.373923838806152, "train_acc": 0.00952, "test_loss": 5.077367216491699, "test_acc": 0.01, "lyapunov": 1.5964158435002007, "grad_norm": 0.2154712788436217, "grad_max_sv": 0.09458265658468008, "grad_min_sv": 2.433638441241118e-15, "grad_condition": 94352900611.06958, "lr": 0.0007128896457825361, "time_sec": 177.4158182144165 }, { "epoch": 55, "train_loss": 5.367228227386475, "train_acc": 0.01046, "test_loss": 5.130655932617188, "test_acc": 0.01, "lyapunov": 1.5918423345936534, "grad_norm": 0.21491158085488357, "grad_max_sv": 0.07526904288679362, "grad_min_sv": 2.528540900743907e-16, "grad_condition": 75246607455.27087, "lr": 0.0007033683215378998, "time_sec": 177.39575290679932 }, { "epoch": 56, "train_loss": 5.367513545684814, "train_acc": 0.00982, "test_loss": 5.064245509338379, "test_acc": 0.01, "lyapunov": 1.5908652431214862, "grad_norm": 0.20945675875630285, "grad_max_sv": 0.07764090299606323, "grad_min_sv": 1.3979459340183045e-15, "grad_condition": 77513163313.73227, "lr": 0.0006937577932260512, "time_sec": 177.41370344161987 }, { "epoch": 57, "train_loss": 5.378045714263916, "train_acc": 0.0097, "test_loss": 5.010745031738281, "test_acc": 0.01, "lyapunov": 1.5985675842865654, "grad_norm": 0.21081504402843954, "grad_max_sv": 0.08188115861266851, "grad_min_sv": 5.212303423583328e-17, "grad_condition": 81876236542.23714, "lr": 0.0006840622763423388, "time_sec": 177.4101119041443 }, { "epoch": 58, "train_loss": 5.369592454376221, "train_acc": 0.00954, "test_loss": 5.001489561462402, "test_acc": 0.01, "lyapunov": 1.594169369743913, "grad_norm": 0.22207129747707732, "grad_max_sv": 0.06061144880950451, "grad_min_sv": 8.52425895192004e-34, "grad_condition": 60611448809.5045, "lr": 0.0006742860236609073, "time_sec": 177.40956783294678 }, { "epoch": 59, "train_loss": 5.369317971343994, "train_acc": 0.00942, "test_loss": 5.000968522644043, "test_acc": 0.01, "lyapunov": 1.593946976429971, "grad_norm": 0.21723304995593648, "grad_max_sv": 0.06631144480779767, "grad_min_sv": 5.644079889684282e-43, "grad_condition": 66311444807.79767, "lr": 0.0006644333233692913, "time_sec": 177.41563248634338 }, { "epoch": 60, "train_loss": 5.367086203613281, "train_acc": 0.00986, "test_loss": 4.980809173583984, "test_acc": 0.01, "lyapunov": 1.5923281987304883, "grad_norm": 0.22232157475356287, "grad_max_sv": 0.05571612091735005, "grad_min_sv": 0.0, "grad_condition": 55716120917.35005, "lr": 0.0006545084971874734, "time_sec": 177.36889171600342 }, { "epoch": 61, "train_loss": 5.372129827270508, "train_acc": 0.00924, "test_loss": 5.0162686882019045, "test_acc": 0.01, "lyapunov": 1.5957943103502474, "grad_norm": 0.2315139450623546, "grad_max_sv": 0.05857418505474925, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 58574185054.74925, "lr": 0.0006445158984722354, "time_sec": 177.3955101966858 }, { "epoch": 62, "train_loss": 5.376675976257324, "train_acc": 0.01028, "test_loss": 4.951765003204346, "test_acc": 0.01, "lyapunov": 1.5998592873668427, "grad_norm": 0.23053009469996935, "grad_max_sv": 0.049639166425913574, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 49639166425.913574, "lr": 0.0006344599103076324, "time_sec": 177.38628578186035 }, { "epoch": 63, "train_loss": 5.3675309051513675, "train_acc": 0.00898, "test_loss": 4.976654839324951, "test_acc": 0.01, "lyapunov": 1.59307188481626, "grad_norm": 0.247010688591046, "grad_max_sv": 0.04920805087313056, "grad_min_sv": 0.0, "grad_condition": 49208050873.13057, "lr": 0.0006243449435824269, "time_sec": 177.40613865852356 }, { "epoch": 64, "train_loss": 5.367255066528321, "train_acc": 0.0097, "test_loss": 5.067697259521484, "test_acc": 0.01, "lyapunov": 1.5924071750372573, "grad_norm": 0.2341571351131304, "grad_max_sv": 0.05343637596815824, "grad_min_sv": 0.0, "grad_condition": 53436375968.15825, "lr": 0.0006141754350553275, "time_sec": 177.3703956604004 }, { "epoch": 65, "train_loss": 5.367540504302979, "train_acc": 0.00908, "test_loss": 4.9729307174682615, "test_acc": 0.01, "lyapunov": 1.5929816647258865, "grad_norm": 0.23218078781210785, "grad_max_sv": 0.05375193590298295, "grad_min_sv": 0.0, "grad_condition": 53751935902.98295, "lr": 0.0006039558454088793, "time_sec": 177.38945150375366 }, { "epoch": 66, "train_loss": 5.366137564239502, "train_acc": 0.00936, "test_loss": 4.934913189697266, "test_acc": 0.01, "lyapunov": 1.5917930770713045, "grad_norm": 0.21702876886168843, "grad_max_sv": 0.04379821689799428, "grad_min_sv": 0.0, "grad_condition": 43798216897.99428, "lr": 0.000593690657292862, "time_sec": 177.4724154472351 }, { "epoch": 67, "train_loss": 5.370335599822998, "train_acc": 0.00978, "test_loss": 4.938832836914062, "test_acc": 0.01, "lyapunov": 1.5958915979356108, "grad_norm": 0.26747204938928953, "grad_max_sv": 0.038104135124012825, "grad_min_sv": 0.0, "grad_condition": 38104135124.01283, "lr": 0.0005833843733580507, "time_sec": 177.42428302764893 }, { "epoch": 68, "train_loss": 5.367096372375488, "train_acc": 0.00948, "test_loss": 4.961852867126465, "test_acc": 0.01, "lyapunov": 1.5927841407258798, "grad_norm": 0.24628304430345999, "grad_max_sv": 0.037431048322469, "grad_min_sv": 0.0, "grad_condition": 37431048322.468994, "lr": 0.0005730415142812054, "time_sec": 177.35656356811523 }, { "epoch": 69, "train_loss": 5.367298457641602, "train_acc": 0.00942, "test_loss": 4.985350135040283, "test_acc": 0.01, "lyapunov": 1.5926642820353398, "grad_norm": 0.26713274620852084, "grad_max_sv": 0.0558107316493988, "grad_min_sv": 0.0, "grad_condition": 55810731649.3988, "lr": 0.0005626666167821517, "time_sec": 177.404226064682 }, { "epoch": 70, "train_loss": 5.370034771118164, "train_acc": 0.01, "test_loss": 4.9722988952636715, "test_acc": 0.01, "lyapunov": 1.5953361000246404, "grad_norm": 0.2772668383220675, "grad_max_sv": 0.059619830828160046, "grad_min_sv": 0.0, "grad_condition": 59619830828.16006, "lr": 0.0005522642316338265, "time_sec": 177.41033554077148 }, { "epoch": 71, "train_loss": 5.3663228466796875, "train_acc": 0.0097, "test_loss": 4.996751819610596, "test_acc": 0.01, "lyapunov": 1.592004930881588, "grad_norm": 0.27122147817442865, "grad_max_sv": 0.051365063060075045, "grad_min_sv": 0.0, "grad_condition": 51365063060.07505, "lr": 0.0005418389216661573, "time_sec": 177.41588258743286 }, { "epoch": 72, "train_loss": 5.3688113453674315, "train_acc": 0.00906, "test_loss": 4.95511130065918, "test_acc": 0.01, "lyapunov": 1.5943079513052236, "grad_norm": 0.2940023518744728, "grad_max_sv": 0.043863069359213115, "grad_min_sv": 0.0, "grad_condition": 43863069359.21311, "lr": 0.0005313952597646563, "time_sec": 177.4312937259674 }, { "epoch": 73, "train_loss": 5.369862328338623, "train_acc": 0.00916, "test_loss": 4.928821298217773, "test_acc": 0.01, "lyapunov": 1.5948649678388824, "grad_norm": 0.337053679491892, "grad_max_sv": 0.03650999316014349, "grad_min_sv": 0.0, "grad_condition": 36509993160.14349, "lr": 0.0005209378268645994, "time_sec": 177.47835731506348 }, { "epoch": 74, "train_loss": 5.366141536560058, "train_acc": 0.00956, "test_loss": 4.951869967651367, "test_acc": 0.01, "lyapunov": 1.591574984133396, "grad_norm": 0.34688609459259695, "grad_max_sv": 0.0532405337318778, "grad_min_sv": 0.0, "grad_condition": 53240533731.87779, "lr": 0.0005104712099416781, "time_sec": 177.39541888237 }, { "epoch": 75, "train_loss": 5.3659246875, "train_acc": 0.00862, "test_loss": 4.96804543762207, "test_acc": 0.01, "lyapunov": 1.5917583252767773, "grad_norm": 0.49942333201069317, "grad_max_sv": 0.04099391270428896, "grad_min_sv": 0.0, "grad_condition": 40993912704.288956, "lr": 0.0004999999999999996, "time_sec": 177.3808958530426 }, { "epoch": 76, "train_loss": 5.3697430253601075, "train_acc": 0.00932, "test_loss": 4.843025128173828, "test_acc": 0.01, "lyapunov": 1.5954608170272748, "grad_norm": 0.5592194591464297, "grad_max_sv": 0.03530313139781356, "grad_min_sv": 0.0, "grad_condition": 35303131397.81356, "lr": 0.0004895287900583212, "time_sec": 177.36198616027832 }, { "epoch": 77, "train_loss": 5.369125059814453, "train_acc": 0.00908, "test_loss": 4.996518075561523, "test_acc": 0.01, "lyapunov": 1.5947885577331113, "grad_norm": 0.5290088024656862, "grad_max_sv": 0.017188509553670885, "grad_min_sv": 0.0, "grad_condition": 17188509553.670883, "lr": 0.0004790621731353997, "time_sec": 177.27709126472473 }, { "epoch": 78, "train_loss": 5.368183317260742, "train_acc": 0.01024, "test_loss": 4.973466501617431, "test_acc": 0.01, "lyapunov": 1.5941324002297639, "grad_norm": 0.6809743973398079, "grad_max_sv": 0.029488482885062693, "grad_min_sv": 0.0, "grad_condition": 29488482885.062695, "lr": 0.000468604740235343, "time_sec": 177.3189423084259 }, { "epoch": 79, "train_loss": 5.367250970458985, "train_acc": 0.00956, "test_loss": 4.950716239929199, "test_acc": 0.01, "lyapunov": 1.5930783117518705, "grad_norm": 1.411636125689672, "grad_max_sv": 0.031192977959290148, "grad_min_sv": 0.0, "grad_condition": 31192977959.29015, "lr": 0.00045816107833384175, "time_sec": 177.3485884666443 }, { "epoch": 80, "train_loss": 5.366609226837158, "train_acc": 0.01002, "test_loss": 4.952863761901855, "test_acc": 0.01, "lyapunov": 1.5922869257914745, "grad_norm": 1.0613102889069541, "grad_max_sv": 0.042383548151701686, "grad_min_sv": 0.0, "grad_condition": 42383548151.70168, "lr": 0.0004477357683661729, "time_sec": 177.41135001182556 }, { "epoch": 81, "train_loss": 5.367390147705078, "train_acc": 0.00896, "test_loss": 4.965977513885498, "test_acc": 0.01, "lyapunov": 1.5931403121679946, "grad_norm": 1.113579115473781, "grad_max_sv": 0.039911494683474304, "grad_min_sv": 0.0, "grad_condition": 39911494683.474304, "lr": 0.00043733338321784746, "time_sec": 177.3696448802948 }, { "epoch": 82, "train_loss": 5.374857454833984, "train_acc": 0.0098, "test_loss": 4.912637939453125, "test_acc": 0.01, "lyapunov": 1.5992167480766315, "grad_norm": 1.3681227141701577, "grad_max_sv": 0.032051424495875835, "grad_min_sv": 0.0, "grad_condition": 32051424495.875835, "lr": 0.0004269584857187939, "time_sec": 177.33939170837402 }, { "epoch": 83, "train_loss": 5.365830071716308, "train_acc": 0.01, "test_loss": 4.93360542678833, "test_acc": 0.01, "lyapunov": 1.5919503589420367, "grad_norm": 1.2908239754732598, "grad_max_sv": 0.018338044127449393, "grad_min_sv": 0.0, "grad_condition": 18338044127.449394, "lr": 0.0004166156266419484, "time_sec": 177.30572271347046 }, { "epoch": 84, "train_loss": 5.369314513549805, "train_acc": 0.01032, "test_loss": 4.962402893066407, "test_acc": 0.01, "lyapunov": 1.5951606830977418, "grad_norm": 1.2430323961128404, "grad_max_sv": 0.014490698464214802, "grad_min_sv": 0.0, "grad_condition": 14490698464.214802, "lr": 0.0004063093427071373, "time_sec": 177.2841637134552 }, { "epoch": 85, "train_loss": 5.377282650604248, "train_acc": 0.00908, "test_loss": 4.969677833557129, "test_acc": 0.01, "lyapunov": 1.5993056263765106, "grad_norm": 1.0935450948855057, "grad_max_sv": 0.03076445385813713, "grad_min_sv": 0.0, "grad_condition": 30764453858.137135, "lr": 0.0003960441545911199, "time_sec": 177.35037755966187 }, { "epoch": 86, "train_loss": 5.365991982879638, "train_acc": 0.00934, "test_loss": 4.960339687347412, "test_acc": 0.01, "lyapunov": 1.591959211527539, "grad_norm": 1.0249256686134756, "grad_max_sv": 0.03798610083758831, "grad_min_sv": 0.0, "grad_condition": 37986100837.5883, "lr": 0.0003858245649446718, "time_sec": 177.35586881637573 }, { "epoch": 87, "train_loss": 5.36631558807373, "train_acc": 0.00936, "test_loss": 4.948922778320313, "test_acc": 0.01, "lyapunov": 1.5924714169538845, "grad_norm": 0.8096413328413968, "grad_max_sv": 0.033394893538206814, "grad_min_sv": 0.0, "grad_condition": 33394893538.206818, "lr": 0.00037565505641757235, "time_sec": 177.3941514492035 }, { "epoch": 88, "train_loss": 5.372631300354004, "train_acc": 0.01006, "test_loss": 4.890858795166015, "test_acc": 0.01, "lyapunov": 1.5971073076853057, "grad_norm": 0.3735195103580093, "grad_max_sv": 0.02607831247150898, "grad_min_sv": 0.0, "grad_condition": 26078312471.50898, "lr": 0.00036554008969236695, "time_sec": 177.28741931915283 }, { "epoch": 89, "train_loss": 5.367757025299072, "train_acc": 0.0093, "test_loss": 4.9563854202270505, "test_acc": 0.01, "lyapunov": 1.593846448242207, "grad_norm": 0.4162028440796633, "grad_max_sv": 0.030028719501569868, "grad_min_sv": 0.0, "grad_condition": 30028719501.569862, "lr": 0.0003554841015277638, "time_sec": 177.30004262924194 }, { "epoch": 90, "train_loss": 5.369390062561036, "train_acc": 0.01028, "test_loss": 4.903431629943848, "test_acc": 0.01, "lyapunov": 1.5944386360895297, "grad_norm": 0.45537462137938906, "grad_max_sv": 0.03309078188613057, "grad_min_sv": 0.0, "grad_condition": 33090781886.130573, "lr": 0.000345491502812526, "time_sec": 177.33181858062744 }, { "epoch": 91, "train_loss": 5.36617555480957, "train_acc": 0.0097, "test_loss": 4.973295672607422, "test_acc": 0.01, "lyapunov": 1.5924281744700868, "grad_norm": 0.42959416759344066, "grad_max_sv": 0.02529722950421274, "grad_min_sv": 0.0, "grad_condition": 25297229504.212738, "lr": 0.0003355666766307081, "time_sec": 177.29152536392212 }, { "epoch": 92, "train_loss": 5.3661282931518555, "train_acc": 0.0106, "test_loss": 4.874008221435547, "test_acc": 0.01, "lyapunov": 1.5923549528317074, "grad_norm": 0.4739333324657675, "grad_max_sv": 0.027486719330772756, "grad_min_sv": 0.0, "grad_condition": 27486719330.77276, "lr": 0.00032571397633909225, "time_sec": 177.3095293045044 }, { "epoch": 93, "train_loss": 5.36726612121582, "train_acc": 0.00952, "test_loss": 4.844555052947998, "test_acc": 0.01, "lyapunov": 1.5933535443547437, "grad_norm": 0.4489090651028355, "grad_max_sv": 0.027935726940631865, "grad_min_sv": 0.0, "grad_condition": 27935726940.631866, "lr": 0.00031593772365766094, "time_sec": 177.29880285263062 }, { "epoch": 94, "train_loss": 5.367507637634278, "train_acc": 0.00938, "test_loss": 4.85123999710083, "test_acc": 0.01, "lyapunov": 1.593514009509855, "grad_norm": 0.49488308768779743, "grad_max_sv": 0.03786678058095276, "grad_min_sv": 0.0, "grad_condition": 37866780580.95277, "lr": 0.0003062422067739483, "time_sec": 177.66627550125122 }, { "epoch": 95, "train_loss": 5.367161036987305, "train_acc": 0.01, "test_loss": 4.919075784301758, "test_acc": 0.01, "lyapunov": 1.593309577468716, "grad_norm": 0.49632556697910357, "grad_max_sv": 0.03764305226504803, "grad_min_sv": 0.0, "grad_condition": 37643052265.04803, "lr": 0.00029663167846209965, "time_sec": 177.35125970840454 }, { "epoch": 96, "train_loss": 5.368773625488282, "train_acc": 0.00952, "test_loss": 4.886889329528809, "test_acc": 0.01, "lyapunov": 1.5946083480439832, "grad_norm": 0.5634579068593676, "grad_max_sv": 0.033481535781174895, "grad_min_sv": 0.0, "grad_condition": 33481535781.174904, "lr": 0.00028711035421746345, "time_sec": 177.33729600906372 }, { "epoch": 97, "train_loss": 5.373278410797119, "train_acc": 0.0092, "test_loss": 4.919860540771484, "test_acc": 0.01, "lyapunov": 1.5970366150521866, "grad_norm": 0.5241288299265501, "grad_max_sv": 0.02991771958768368, "grad_min_sv": 0.0, "grad_condition": 29917719587.683678, "lr": 0.00027768241040753615, "time_sec": 177.3373203277588 }, { "epoch": 98, "train_loss": 5.367487851867676, "train_acc": 0.00984, "test_loss": 4.922154154968262, "test_acc": 0.01, "lyapunov": 1.5938531629874577, "grad_norm": 0.6102489153602656, "grad_max_sv": 0.02815253552980721, "grad_min_sv": 0.0, "grad_condition": 28152535529.807213, "lr": 0.00026835198244006903, "time_sec": 177.35172653198242 }, { "epoch": 99, "train_loss": 5.367893275756836, "train_acc": 0.01038, "test_loss": 4.930574498748779, "test_acc": 0.01, "lyapunov": 1.593941973908173, "grad_norm": 0.5921377439478998, "grad_max_sv": 0.03409935408271849, "grad_min_sv": 0.0, "grad_condition": 34099354082.718487, "lr": 0.0002591231629491421, "time_sec": 177.36736416816711 }, { "epoch": 100, "train_loss": 5.372079080200195, "train_acc": 0.01062, "test_loss": 4.915191829681397, "test_acc": 0.01, "lyapunov": 1.596833938832783, "grad_norm": 0.5930918441111938, "grad_max_sv": 0.033569992519915104, "grad_min_sv": 0.0, "grad_condition": 33569992519.915108, "lr": 0.0002499999999999997, "time_sec": 177.3853051662445 }, { "epoch": 101, "train_loss": 5.365807982940674, "train_acc": 0.00976, "test_loss": 4.926369466400146, "test_acc": 0.01, "lyapunov": 1.5920866029646696, "grad_norm": 1.2269794373451623, "grad_max_sv": 0.03278505662456155, "grad_min_sv": 0.0, "grad_condition": 32785056624.561546, "lr": 0.00024098649531343477, "time_sec": 177.41039776802063 }, { "epoch": 102, "train_loss": 5.3670011302185054, "train_acc": 0.00968, "test_loss": 5.182023647308349, "test_acc": 0.01, "lyapunov": 1.5932530469601722, "grad_norm": 0.5812477341116522, "grad_max_sv": 0.03314556856639683, "grad_min_sv": 0.0, "grad_condition": 33145568566.39683, "lr": 0.0002320866025105016, "time_sec": 177.37316060066223 }, { "epoch": 103, "train_loss": 5.371551856231689, "train_acc": 0.01004, "test_loss": 4.899476731109619, "test_acc": 0.01, "lyapunov": 1.5966654973261802, "grad_norm": 0.610767105839377, "grad_max_sv": 0.02582362242974341, "grad_min_sv": 0.0, "grad_condition": 25823622429.74341, "lr": 0.0002233042253783278, "time_sec": 177.36590600013733 }, { "epoch": 104, "train_loss": 5.368561768646241, "train_acc": 0.00946, "test_loss": 4.930848654174805, "test_acc": 0.01, "lyapunov": 1.5947173150908915, "grad_norm": 0.6422628015235555, "grad_max_sv": 0.025343496771529316, "grad_min_sv": 0.0, "grad_condition": 25343496771.529316, "lr": 0.000214643216157784, "time_sec": 177.3882737159729 }, { "epoch": 105, "train_loss": 5.36991615814209, "train_acc": 0.0091, "test_loss": 4.899362311553955, "test_acc": 0.01, "lyapunov": 1.5956382519753693, "grad_norm": 0.5876379942472394, "grad_max_sv": 0.02119842660613358, "grad_min_sv": 0.0, "grad_condition": 21198426606.133583, "lr": 0.00020610737385376332, "time_sec": 177.41758513450623 }, { "epoch": 106, "train_loss": 5.366515799407959, "train_acc": 0.01026, "test_loss": 4.887499784851074, "test_acc": 0.01, "lyapunov": 1.592897226743381, "grad_norm": 0.6201818264513558, "grad_max_sv": 0.0033281870651990174, "grad_min_sv": 0.0, "grad_condition": 3328187065.1990175, "lr": 0.00019770044256881242, "time_sec": 177.3366186618805 }, { "epoch": 107, "train_loss": 5.368152584533691, "train_acc": 0.00916, "test_loss": 4.894157613372803, "test_acc": 0.01, "lyapunov": 1.5942484835529571, "grad_norm": 0.7280576803690416, "grad_max_sv": 0.027869051974266767, "grad_min_sv": 0.0, "grad_condition": 27869051974.266766, "lr": 0.0001894261098608447, "time_sec": 177.37792563438416 }, { "epoch": 108, "train_loss": 5.3665059283447265, "train_acc": 0.00976, "test_loss": 4.915471728515625, "test_acc": 0.01, "lyapunov": 1.592840023662733, "grad_norm": 0.7424554492649038, "grad_max_sv": 0.026440556207671762, "grad_min_sv": 0.0, "grad_condition": 26440556207.67176, "lr": 0.000181288005125655, "time_sec": 177.35853958129883 }, { "epoch": 109, "train_loss": 5.376394969329834, "train_acc": 0.01022, "test_loss": 4.922409371948242, "test_acc": 0.01, "lyapunov": 1.6003244386609559, "grad_norm": 0.8040426103005965, "grad_max_sv": 0.024923838768154384, "grad_min_sv": 0.0, "grad_condition": 24923838768.15438, "lr": 0.0001732896980049473, "time_sec": 177.31202268600464 }, { "epoch": 110, "train_loss": 5.376544867401123, "train_acc": 0.01006, "test_loss": 4.9106194869995115, "test_acc": 0.01, "lyapunov": 1.5990420381736268, "grad_norm": 0.7808973134784486, "grad_max_sv": 0.023315236158668994, "grad_min_sv": 0.0, "grad_condition": 23315236158.668995, "lr": 0.00016543469682057076, "time_sec": 177.3295497894287 }, { "epoch": 111, "train_loss": 5.366748910522461, "train_acc": 0.01, "test_loss": 4.904478953552246, "test_acc": 0.01, "lyapunov": 1.5930900046282717, "grad_norm": 0.8315740534061841, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 177.3059582710266 }, { "epoch": 112, "train_loss": 5.365462461242676, "train_acc": 0.0097, "test_loss": 4.909817778778076, "test_acc": 0.01, "lyapunov": 1.591839042770893, "grad_norm": 1.0644316030188519, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 177.3259735107422 }, { "epoch": 113, "train_loss": 5.366983929290772, "train_acc": 0.01, "test_loss": 4.893335526275635, "test_acc": 0.01, "lyapunov": 1.5934227226335373, "grad_norm": 1.0331708046855217, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 177.29799342155457 }, { "epoch": 114, "train_loss": 5.367780682678223, "train_acc": 0.01, "test_loss": 4.896582912445068, "test_acc": 0.01, "lyapunov": 1.5942320003533912, "grad_norm": 1.09308769834869, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 177.33024215698242 }, { "epoch": 115, "train_loss": 5.367718472900391, "train_acc": 0.01, "test_loss": 4.895343659973144, "test_acc": 0.01, "lyapunov": 1.5940615042396213, "grad_norm": 1.2673802568939343, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 177.3362259864807 }, { "epoch": 116, "train_loss": 5.3657911352539065, "train_acc": 0.01, "test_loss": 4.906929530334473, "test_acc": 0.01, "lyapunov": 1.5921993859283758, "grad_norm": 1.2617224687326039, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 177.28457856178284 }, { "epoch": 117, "train_loss": 5.366755274505615, "train_acc": 0.00962, "test_loss": 4.891025592041015, "test_acc": 0.01, "lyapunov": 1.5932053120239922, "grad_norm": 1.3667828520013348, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 177.260840177536 }, { "epoch": 118, "train_loss": 5.369936829376221, "train_acc": 0.00938, "test_loss": 4.908762777709961, "test_acc": 0.01, "lyapunov": 1.5956426922927427, "grad_norm": 1.4737347393486513, "grad_max_sv": 0.002789213368669152, "grad_min_sv": 0.0, "grad_condition": 2789213368.6691523, "lr": 0.00010815327133708009, "time_sec": 177.28786754608154 }, { "epoch": 119, "train_loss": 5.367702166290283, "train_acc": 0.01006, "test_loss": 4.900025549316406, "test_acc": 0.01, "lyapunov": 1.5938852357742426, "grad_norm": 1.445693487120252, "grad_max_sv": 0.004225540207698941, "grad_min_sv": 0.0, "grad_condition": 4225540207.698941, "lr": 0.00010173504098790182, "time_sec": 177.32281279563904 }, { "epoch": 120, "train_loss": 5.366396225891113, "train_acc": 0.01, "test_loss": 4.875214715576172, "test_acc": 0.01, "lyapunov": 1.5928466237719408, "grad_norm": 1.5218270915127643, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 177.28257083892822 }, { "epoch": 121, "train_loss": 5.366784219818115, "train_acc": 0.01, "test_loss": 4.868653475952148, "test_acc": 0.01, "lyapunov": 1.5932423071483213, "grad_norm": 1.5915107890267433, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 177.2724094390869 }, { "epoch": 122, "train_loss": 5.3684937673950195, "train_acc": 0.0095, "test_loss": 4.872081127929688, "test_acc": 0.01, "lyapunov": 1.5947217929088855, "grad_norm": 1.7802951927894717, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 177.29115104675293 }, { "epoch": 123, "train_loss": 5.368383057250977, "train_acc": 0.00976, "test_loss": 4.865282067871094, "test_acc": 0.01, "lyapunov": 1.5946415565202914, "grad_norm": 1.8635884798014917, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 177.29619812965393 }, { "epoch": 124, "train_loss": 5.369555229797363, "train_acc": 0.01, "test_loss": 4.850182081604004, "test_acc": 0.01, "lyapunov": 1.595543795839295, "grad_norm": 1.9786412883932707, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 177.28673815727234 }, { "epoch": 125, "train_loss": 5.366839987792969, "train_acc": 0.0099, "test_loss": 4.863481466674805, "test_acc": 0.01, "lyapunov": 1.5933110564566024, "grad_norm": 1.981713372629457, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 177.54408073425293 }, { "epoch": 126, "train_loss": 5.367286334533691, "train_acc": 0.00978, "test_loss": 4.864164552307129, "test_acc": 0.01, "lyapunov": 1.593780165133269, "grad_norm": 2.0792063115884303, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 177.27722811698914 }, { "epoch": 127, "train_loss": 5.377017222900391, "train_acc": 0.00976, "test_loss": 4.867053485107422, "test_acc": 0.01, "lyapunov": 1.5985291836511752, "grad_norm": 1.8808489686841805, "grad_max_sv": 0.0020057843998074532, "grad_min_sv": 0.0, "grad_condition": 2005784399.8074532, "lr": 5.6898210384392595e-05, "time_sec": 177.32938599586487 }, { "epoch": 128, "train_loss": 5.3731236241149904, "train_acc": 0.0099, "test_loss": 4.862087628173828, "test_acc": 0.01, "lyapunov": 1.5972985928625707, "grad_norm": 2.0544715272998646, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 177.26091361045837 }, { "epoch": 129, "train_loss": 5.366952188110352, "train_acc": 0.00966, "test_loss": 4.87226043548584, "test_acc": 0.01, "lyapunov": 1.5934485755003323, "grad_norm": 2.0287817825331826, "grad_max_sv": 0.0008733986876904964, "grad_min_sv": 0.0, "grad_condition": 873398687.6904964, "lr": 4.7586473766990294e-05, "time_sec": 177.30408883094788 }, { "epoch": 130, "train_loss": 5.36849506149292, "train_acc": 0.01004, "test_loss": 4.863279203796386, "test_acc": 0.01, "lyapunov": 1.594751832735203, "grad_norm": 1.980669281269925, "grad_max_sv": 0.010736069735139608, "grad_min_sv": 0.0, "grad_condition": 10736069735.139608, "lr": 4.32272711786996e-05, "time_sec": 177.28869652748108 }, { "epoch": 131, "train_loss": 5.377595603637696, "train_acc": 0.01, "test_loss": 4.866737941741944, "test_acc": 0.01, "lyapunov": 1.5995000756305198, "grad_norm": 2.154727256033659, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 177.257958650589 }, { "epoch": 132, "train_loss": 5.369090413818359, "train_acc": 0.01, "test_loss": 4.858406136322022, "test_acc": 0.01, "lyapunov": 1.5953167524484113, "grad_norm": 2.191344847482899, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 177.27152252197266 }, { "epoch": 133, "train_loss": 5.3665374522399905, "train_acc": 0.01, "test_loss": 4.860008187866211, "test_acc": 0.01, "lyapunov": 1.5930466167152386, "grad_norm": 2.0841828503003916, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 177.28846549987793 }, { "epoch": 134, "train_loss": 5.366383743286133, "train_acc": 0.00974, "test_loss": 4.848487128448486, "test_acc": 0.01, "lyapunov": 1.592855043118567, "grad_norm": 2.195653914411608, "grad_max_sv": 0.0033036706037819384, "grad_min_sv": 0.0, "grad_condition": 3303670603.7819386, "lr": 2.7811814881259484e-05, "time_sec": 177.28988027572632 }, { "epoch": 135, "train_loss": 5.367761196746827, "train_acc": 0.00998, "test_loss": 4.859366925048828, "test_acc": 0.01, "lyapunov": 1.594165514802079, "grad_norm": 2.1904859959999126, "grad_max_sv": 0.0012543844059109688, "grad_min_sv": 0.0, "grad_condition": 1254384405.9109688, "lr": 2.4471741852423218e-05, "time_sec": 177.2780725955963 }, { "epoch": 136, "train_loss": 5.366510193634033, "train_acc": 0.01, "test_loss": 4.8595954734802245, "test_acc": 0.01, "lyapunov": 1.5930009638257039, "grad_norm": 2.1839168134099793, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 177.28521990776062 }, { "epoch": 137, "train_loss": 5.367833109741211, "train_acc": 0.01, "test_loss": 4.850632510375976, "test_acc": 0.01, "lyapunov": 1.5938955752745918, "grad_norm": 2.14228114693839, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 177.32584595680237 }, { "epoch": 138, "train_loss": 5.378068528137207, "train_acc": 0.01018, "test_loss": 4.858175395202637, "test_acc": 0.01, "lyapunov": 1.5998802581406615, "grad_norm": 2.218784068596557, "grad_max_sv": 0.0014573325868695974, "grad_min_sv": 0.0, "grad_condition": 1457332586.8695974, "lr": 1.570841943568445e-05, "time_sec": 177.31577253341675 }, { "epoch": 139, "train_loss": 5.367863772277832, "train_acc": 0.01034, "test_loss": 4.8480802886962895, "test_acc": 0.01, "lyapunov": 1.5942664253132424, "grad_norm": 2.2444364897318794, "grad_max_sv": 0.012257534638047218, "grad_min_sv": 0.0, "grad_condition": 12257534638.047218, "lr": 1.3210548563419845e-05, "time_sec": 177.30443215370178 }, { "epoch": 140, "train_loss": 5.366426722717285, "train_acc": 0.00962, "test_loss": 4.848219221496582, "test_acc": 0.01, "lyapunov": 1.5928701375756422, "grad_norm": 2.3192997356397203, "grad_max_sv": 0.006218939693644643, "grad_min_sv": 0.0, "grad_condition": 6218939693.644643, "lr": 1.0926199633097203e-05, "time_sec": 177.33384609222412 }, { "epoch": 141, "train_loss": 5.36580462097168, "train_acc": 0.00986, "test_loss": 4.850540889739991, "test_acc": 0.01, "lyapunov": 1.592248017830617, "grad_norm": 2.287220965288124, "grad_max_sv": 0.0013559065759181977, "grad_min_sv": 0.0, "grad_condition": 1355906575.9181976, "lr": 8.856374635655688e-06, "time_sec": 177.32693576812744 }, { "epoch": 142, "train_loss": 5.3662375875854496, "train_acc": 0.01, "test_loss": 4.853694881439209, "test_acc": 0.01, "lyapunov": 1.5927291526209058, "grad_norm": 2.302468482661773, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 177.3142066001892 }, { "epoch": 143, "train_loss": 5.372984427642822, "train_acc": 0.01004, "test_loss": 4.852922064208984, "test_acc": 0.01, "lyapunov": 1.597528722889893, "grad_norm": 2.348373340052694, "grad_max_sv": 0.0011802260298281908, "grad_min_sv": 0.0, "grad_condition": 1180226029.8281908, "lr": 5.3638335185058295e-06, "time_sec": 177.3356897830963 }, { "epoch": 144, "train_loss": 5.368205472106934, "train_acc": 0.00984, "test_loss": 4.849281020355225, "test_acc": 0.01, "lyapunov": 1.594479467252941, "grad_norm": 2.312922144804607, "grad_max_sv": 0.0006380858831107616, "grad_min_sv": 0.0, "grad_condition": 638085883.1107616, "lr": 3.942649342761114e-06, "time_sec": 177.28971314430237 }, { "epoch": 145, "train_loss": 5.366419898681641, "train_acc": 0.01006, "test_loss": 4.848984435272217, "test_acc": 0.01, "lyapunov": 1.592920510360347, "grad_norm": 2.317195419975272, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 177.31689953804016 }, { "epoch": 146, "train_loss": 5.373454104766846, "train_acc": 0.01, "test_loss": 4.849994027709961, "test_acc": 0.01, "lyapunov": 1.598964246642559, "grad_norm": 2.4233925402092833, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 177.32813477516174 }, { "epoch": 147, "train_loss": 5.3674054251098635, "train_acc": 0.01, "test_loss": 4.851546574401856, "test_acc": 0.01, "lyapunov": 1.5935643969289481, "grad_norm": 2.3247951305562196, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 177.28444719314575 }, { "epoch": 148, "train_loss": 5.3666025303649905, "train_acc": 0.01, "test_loss": 4.8515466201782225, "test_acc": 0.01, "lyapunov": 1.5931046256019026, "grad_norm": 2.3395920546004754, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 177.2980020046234 }, { "epoch": 149, "train_loss": 5.365688817749024, "train_acc": 0.01, "test_loss": 4.851546644592285, "test_acc": 0.01, "lyapunov": 1.5921499198659912, "grad_norm": 2.4070679367245766, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 177.28436994552612 }, { "epoch": 150, "train_loss": 5.363941977539063, "train_acc": 0.01, "test_loss": 4.851546675109863, "test_acc": 0.01, "lyapunov": 1.5903311498329769, "grad_norm": 2.3202323044197746, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 177.27790570259094 } ] } }