{ "vanilla": { "4": [ { "epoch": 1, "train_loss": 4.341291038284302, "train_acc": 0.09568, "test_loss": 3.5902228660583497, "test_acc": 0.1719, "lyapunov": null, "grad_norm": 6.233568552079335, "grad_max_sv": 4.7545679092407225, "grad_min_sv": 1.1250918028338219e-07, "grad_condition": 47144055.51418194, "lr": 0.0009998903417374227, "time_sec": 17.830737352371216 }, { "epoch": 2, "train_loss": 3.4833403620910643, "train_acc": 0.1875, "test_loss": 3.2125896770477294, "test_acc": 0.2413, "lyapunov": null, "grad_norm": 4.2883357141420815, "grad_max_sv": 3.0223524630069734, "grad_min_sv": 7.805360168200437e-08, "grad_condition": 68434745.79111826, "lr": 0.0009995614150494292, "time_sec": 15.740124702453613 }, { "epoch": 3, "train_loss": 3.014097664794922, "train_acc": 0.26054, "test_loss": 2.8822019165039063, "test_acc": 0.2889, "lyapunov": null, "grad_norm": 3.3688150071564396, "grad_max_sv": 2.1886239469051363, "grad_min_sv": 6.223103937719188e-08, "grad_condition": 42282037.7115659, "lr": 0.0009990133642141358, "time_sec": 15.473703145980835 }, { "epoch": 4, "train_loss": 2.7143693132019044, "train_acc": 0.31262, "test_loss": 2.702446311187744, "test_acc": 0.3208, "lyapunov": null, "grad_norm": 2.8785406038007317, "grad_max_sv": 1.7646001279354095, "grad_min_sv": 5.3701336399925025e-08, "grad_condition": 43554152.39164617, "lr": 0.0009982464296247522, "time_sec": 15.499403238296509 }, { "epoch": 5, "train_loss": 2.5030348071289064, "train_acc": 0.3554, "test_loss": 2.763942724990845, "test_acc": 0.329, "lyapunov": null, "grad_norm": 2.5897409787447465, "grad_max_sv": 1.5612378805875777, "grad_min_sv": 4.8854244893981046e-08, "grad_condition": 41333195.00893615, "lr": 0.0009972609476841367, "time_sec": 15.488951683044434 }, { "epoch": 6, "train_loss": 2.3269909496307375, "train_acc": 0.3938, "test_loss": 2.4710379989624025, "test_acc": 0.3761, "lyapunov": null, "grad_norm": 2.37414912310322, "grad_max_sv": 1.3197038874030114, "grad_min_sv": 4.5427973693196176e-08, "grad_condition": 185703885.27271265, "lr": 0.000996057350657239, "time_sec": 15.497607707977295 }, { "epoch": 7, "train_loss": 2.1854072467041017, "train_acc": 0.4216, "test_loss": 2.951163561248779, "test_acc": 0.323, "lyapunov": null, "grad_norm": 2.2068200870493837, "grad_max_sv": 1.2339675694704055, "grad_min_sv": 4.277283941478416e-08, "grad_condition": 52095598.918328084, "lr": 0.000994636166481494, "time_sec": 15.472023725509644 }, { "epoch": 8, "train_loss": 2.0716393295288085, "train_acc": 0.44928, "test_loss": 2.2887711679458618, "test_acc": 0.4114, "lyapunov": null, "grad_norm": 2.076990480510157, "grad_max_sv": 1.131314830482006, "grad_min_sv": 3.9886170205560846e-08, "grad_condition": 41939669.82744624, "lr": 0.0009929980185352525, "time_sec": 15.464510440826416 }, { "epoch": 9, "train_loss": 1.974085814552307, "train_acc": 0.47136, "test_loss": 2.672110557174683, "test_acc": 0.3601, "lyapunov": null, "grad_norm": 1.9761816566655848, "grad_max_sv": 1.0417343363165856, "grad_min_sv": 3.825020498116061e-08, "grad_condition": 39964162.48622004, "lr": 0.0009911436253643444, "time_sec": 15.494410037994385 }, { "epoch": 10, "train_loss": 1.8730941659545899, "train_acc": 0.49054, "test_loss": 2.5056158615112305, "test_acc": 0.3813, "lyapunov": null, "grad_norm": 1.8634099386367884, "grad_max_sv": 0.9600013196468353, "grad_min_sv": 3.579910488604732e-08, "grad_condition": 34060738.21798731, "lr": 0.0009890738003669028, "time_sec": 15.488292455673218 }, { "epoch": 11, "train_loss": 1.7812603790664674, "train_acc": 0.51462, "test_loss": 2.477180172729492, "test_acc": 0.3997, "lyapunov": null, "grad_norm": 1.7790099981650356, "grad_max_sv": 0.9072641983628273, "grad_min_sv": 3.4340940041621694e-08, "grad_condition": 36834828.42576877, "lr": 0.00098678945143658, "time_sec": 15.484249591827393 }, { "epoch": 12, "train_loss": 1.714907325401306, "train_acc": 0.52888, "test_loss": 2.226099481582642, "test_acc": 0.4353, "lyapunov": null, "grad_norm": 1.701538564781707, "grad_max_sv": 0.8431645318865776, "grad_min_sv": 3.240299342038844e-08, "grad_condition": 64109426.95331051, "lr": 0.0009842915805643154, "time_sec": 15.483522891998291 }, { "epoch": 13, "train_loss": 1.648736492576599, "train_acc": 0.5449, "test_loss": 2.1634216318130495, "test_acc": 0.4573, "lyapunov": null, "grad_norm": 1.6315158856421696, "grad_max_sv": 0.7919500142335891, "grad_min_sv": 3.0836463893457736e-08, "grad_condition": 50314317.689856075, "lr": 0.000981581283398829, "time_sec": 15.491243362426758 }, { "epoch": 14, "train_loss": 1.5916738232421874, "train_acc": 0.5591, "test_loss": 2.5368153831481934, "test_acc": 0.398, "lyapunov": null, "grad_norm": 1.579987574958028, "grad_max_sv": 0.7741283252835274, "grad_min_sv": 3.031987156898453e-08, "grad_condition": 33629215.75141786, "lr": 0.0009786597487660333, "time_sec": 15.476540565490723 }, { "epoch": 15, "train_loss": 1.5378693001937866, "train_acc": 0.57156, "test_loss": 1.9343770442962647, "test_acc": 0.4989, "lyapunov": null, "grad_norm": 1.5231234313765212, "grad_max_sv": 0.7179134920239448, "grad_min_sv": 2.8637837475031792e-08, "grad_condition": 49527050.380315706, "lr": 0.0009755282581475766, "time_sec": 15.486248970031738 }, { "epoch": 16, "train_loss": 1.478127024307251, "train_acc": 0.58584, "test_loss": 1.9563913166046143, "test_acc": 0.4922, "lyapunov": null, "grad_norm": 1.46325785921816, "grad_max_sv": 0.6841573119163513, "grad_min_sv": 2.716867457952521e-08, "grad_condition": 56699539.529558375, "lr": 0.0009721881851187403, "time_sec": 15.49137544631958 }, { "epoch": 17, "train_loss": 1.429626383972168, "train_acc": 0.59714, "test_loss": 2.326792067337036, "test_acc": 0.4336, "lyapunov": null, "grad_norm": 1.4242655219863833, "grad_max_sv": 0.6712241530418396, "grad_min_sv": 2.6996844360027695e-08, "grad_condition": 40189659.16617282, "lr": 0.0009686409947459456, "time_sec": 15.493090391159058 }, { "epoch": 18, "train_loss": 1.395352936630249, "train_acc": 0.6053, "test_loss": 1.8314157381057738, "test_acc": 0.5182, "lyapunov": null, "grad_norm": 1.3761305598419875, "grad_max_sv": 0.6385130822658539, "grad_min_sv": 2.6239096877211932e-08, "grad_condition": 63284929.054803826, "lr": 0.0009648882429441254, "time_sec": 15.477057695388794 }, { "epoch": 19, "train_loss": 1.340607022781372, "train_acc": 0.61952, "test_loss": 1.9038033363342286, "test_acc": 0.5042, "lyapunov": null, "grad_norm": 1.3323384681348491, "grad_max_sv": 0.613679239153862, "grad_min_sv": 2.4952525421112828e-08, "grad_condition": 1048659082.6601179, "lr": 0.00096093157579425, "time_sec": 15.483818292617798 }, { "epoch": 20, "train_loss": 1.2925908715438843, "train_acc": 0.62856, "test_loss": 2.031341696929932, "test_acc": 0.4835, "lyapunov": null, "grad_norm": 1.3034876314465462, "grad_max_sv": 0.5816340684890747, "grad_min_sv": 2.434145293522816e-08, "grad_condition": 45204778.74017582, "lr": 0.0009567727288213001, "time_sec": 15.512004375457764 }, { "epoch": 21, "train_loss": 1.278655789756775, "train_acc": 0.63278, "test_loss": 1.8846191581726075, "test_acc": 0.5135, "lyapunov": null, "grad_norm": 1.2776040716135673, "grad_max_sv": 0.5780372425913811, "grad_min_sv": 2.405527027016241e-08, "grad_condition": 42159114.019685745, "lr": 0.0009524135262330095, "time_sec": 15.499945878982544 }, { "epoch": 22, "train_loss": 1.2383485181427003, "train_acc": 0.64622, "test_loss": 1.8699242074966431, "test_acc": 0.518, "lyapunov": null, "grad_norm": 1.2460313700260512, "grad_max_sv": 0.5693550139665604, "grad_min_sv": 2.3625755932697724e-08, "grad_condition": 247459954.48036852, "lr": 0.0009478558801197061, "time_sec": 15.489409923553467 }, { "epoch": 23, "train_loss": 1.208611516494751, "train_acc": 0.6519, "test_loss": 1.8377874282836915, "test_acc": 0.526, "lyapunov": null, "grad_norm": 1.2268147245238885, "grad_max_sv": 0.5506495118141175, "grad_min_sv": 2.2982289769879482e-08, "grad_condition": 91532045.29729453, "lr": 0.000943101789615607, "time_sec": 15.503745555877686 }, { "epoch": 24, "train_loss": 1.1756799732208252, "train_acc": 0.66142, "test_loss": 1.8445790365219117, "test_acc": 0.5321, "lyapunov": null, "grad_norm": 1.1995646648047669, "grad_max_sv": 0.5362823188304902, "grad_min_sv": 2.227390833997589e-08, "grad_condition": 39000923.8470154, "lr": 0.0009381533400219313, "time_sec": 15.488165855407715 }, { "epoch": 25, "train_loss": 1.1402707249450683, "train_acc": 0.67004, "test_loss": 2.1079253253936767, "test_acc": 0.4853, "lyapunov": null, "grad_norm": 1.1685820076008453, "grad_max_sv": 0.500711290538311, "grad_min_sv": 2.1209413056388903e-08, "grad_condition": 37717541.68981, "lr": 0.0009330127018922189, "time_sec": 15.519190073013306 }, { "epoch": 26, "train_loss": 1.115832226486206, "train_acc": 0.67608, "test_loss": 1.7950333555221558, "test_acc": 0.5345, "lyapunov": null, "grad_norm": 1.1487591162708706, "grad_max_sv": 0.5033038355410099, "grad_min_sv": 2.1531226807036675e-08, "grad_condition": 34912719.99916558, "lr": 0.000927682130080253, "time_sec": 15.500119924545288 }, { "epoch": 27, "train_loss": 1.0897642765426636, "train_acc": 0.68058, "test_loss": 1.9983017498016358, "test_acc": 0.5014, "lyapunov": null, "grad_norm": 1.1397755659416107, "grad_max_sv": 0.5070834219455719, "grad_min_sv": 2.094801768229293e-08, "grad_condition": 112680773.02319674, "lr": 0.0009221639627510072, "time_sec": 15.487388610839844 }, { "epoch": 28, "train_loss": 1.0600782299995422, "train_acc": 0.6873, "test_loss": 1.7331308700561523, "test_acc": 0.552, "lyapunov": null, "grad_norm": 1.1194293581413437, "grad_max_sv": 0.49243925511837006, "grad_min_sv": 2.061250336264555e-08, "grad_condition": 2391098394.247443, "lr": 0.0009164606203550494, "time_sec": 15.49947738647461 }, { "epoch": 29, "train_loss": 1.0288162441635131, "train_acc": 0.6958, "test_loss": 1.7574676347732543, "test_acc": 0.5469, "lyapunov": null, "grad_norm": 1.0981602434296158, "grad_max_sv": 0.4940373159945011, "grad_min_sv": 2.0519680072120238e-08, "grad_condition": 152798003.85014075, "lr": 0.0009105746045668516, "time_sec": 15.519279956817627 }, { "epoch": 30, "train_loss": 1.0005281573104858, "train_acc": 0.70474, "test_loss": 1.7724915187835693, "test_acc": 0.5535, "lyapunov": null, "grad_norm": 1.0821209053569316, "grad_max_sv": 0.4882327690720558, "grad_min_sv": 2.040895886699923e-08, "grad_condition": 106754784.91270833, "lr": 0.0009045084971874733, "time_sec": 15.495746612548828 }, { "epoch": 31, "train_loss": 0.9887743633651733, "train_acc": 0.70736, "test_loss": 1.803389212989807, "test_acc": 0.5421, "lyapunov": null, "grad_norm": 1.0717360299018484, "grad_max_sv": 0.4644377827644348, "grad_min_sv": 1.9709001528034342e-08, "grad_condition": 35783294.580241755, "lr": 0.0008982649590120977, "time_sec": 15.506318807601929 }, { "epoch": 32, "train_loss": 0.9635560890579223, "train_acc": 0.71462, "test_loss": 1.7782361072540283, "test_acc": 0.5515, "lyapunov": null, "grad_norm": 1.0547768746381694, "grad_max_sv": 0.47287538424134257, "grad_min_sv": 1.9473239257217223e-08, "grad_condition": 36442794.53940544, "lr": 0.0008918467286629196, "time_sec": 15.525408744812012 }, { "epoch": 33, "train_loss": 0.9454534896087646, "train_acc": 0.71586, "test_loss": 1.8413972650527954, "test_acc": 0.5387, "lyapunov": null, "grad_norm": 1.0457002240106366, "grad_max_sv": 0.4636484496295452, "grad_min_sv": 1.9625483711760426e-08, "grad_condition": 124503449.94674742, "lr": 0.0008852566213878943, "time_sec": 15.658098459243774 }, { "epoch": 34, "train_loss": 0.926147558670044, "train_acc": 0.72194, "test_loss": 1.8227524955749512, "test_acc": 0.5492, "lyapunov": null, "grad_norm": 1.030398616328217, "grad_max_sv": 0.44984652400016784, "grad_min_sv": 1.8758673522856208e-08, "grad_condition": 63054578.90943961, "lr": 0.000878497527825878, "time_sec": 15.51594591140747 }, { "epoch": 35, "train_loss": 0.8910220455551148, "train_acc": 0.7339, "test_loss": 1.7336375022888184, "test_acc": 0.5649, "lyapunov": null, "grad_norm": 1.0076609346644876, "grad_max_sv": 0.44372819289565085, "grad_min_sv": 1.8551427522633945e-08, "grad_condition": 50611185.75714277, "lr": 0.000871572412738697, "time_sec": 15.497729539871216 }, { "epoch": 36, "train_loss": 0.8785494363021851, "train_acc": 0.73456, "test_loss": 1.7843629848480225, "test_acc": 0.5581, "lyapunov": null, "grad_norm": 0.9989169914835021, "grad_max_sv": 0.4366959437727928, "grad_min_sv": 1.8408271952943812e-08, "grad_condition": 85310005.79090494, "lr": 0.0008644843137107055, "time_sec": 15.490435123443604 }, { "epoch": 37, "train_loss": 0.856938405303955, "train_acc": 0.74212, "test_loss": 1.78583115940094, "test_acc": 0.5595, "lyapunov": null, "grad_norm": 0.9837943590828618, "grad_max_sv": 0.42913608700037004, "grad_min_sv": 1.799877897834534e-08, "grad_condition": 44955472.82427679, "lr": 0.0008572363398164014, "time_sec": 15.537626266479492 }, { "epoch": 38, "train_loss": 0.8304045977973938, "train_acc": 0.74954, "test_loss": 1.9540308137893676, "test_acc": 0.5338, "lyapunov": null, "grad_norm": 0.9705660429353747, "grad_max_sv": 0.41689482182264326, "grad_min_sv": 1.7790258101044177e-08, "grad_condition": 85624723.50661872, "lr": 0.0008498316702566826, "time_sec": 15.500178813934326 }, { "epoch": 39, "train_loss": 0.820258391494751, "train_acc": 0.74884, "test_loss": 1.8685070798873902, "test_acc": 0.5491, "lyapunov": null, "grad_norm": 0.9650066613971798, "grad_max_sv": 0.42203645706176757, "grad_min_sv": 1.7701675934789218e-08, "grad_condition": 38471919.31748825, "lr": 0.0008422735529643442, "time_sec": 15.50774359703064 }, { "epoch": 40, "train_loss": 0.8059215658950806, "train_acc": 0.75368, "test_loss": 1.7993948059082032, "test_acc": 0.5644, "lyapunov": null, "grad_norm": 0.9599648842149144, "grad_max_sv": 0.42296523600816727, "grad_min_sv": 1.7450433907606477e-08, "grad_condition": 48602019.20439266, "lr": 0.0008345653031794289, "time_sec": 15.5121328830719 }, { "epoch": 41, "train_loss": 0.7813009564971923, "train_acc": 0.76052, "test_loss": 1.8404800394058227, "test_acc": 0.5604, "lyapunov": null, "grad_norm": 0.9418789892686961, "grad_max_sv": 0.40448441356420517, "grad_min_sv": 1.731778200703138e-08, "grad_condition": 98318164.88521431, "lr": 0.0008267103019950526, "time_sec": 15.492136240005493 }, { "epoch": 42, "train_loss": 0.7671393407821655, "train_acc": 0.76604, "test_loss": 1.793884058380127, "test_acc": 0.5618, "lyapunov": null, "grad_norm": 0.9315468648605028, "grad_max_sv": 0.38932052329182626, "grad_min_sv": 1.6337376871483622e-08, "grad_condition": 62943904.80942075, "lr": 0.0008187119948743447, "time_sec": 15.521047592163086 }, { "epoch": 43, "train_loss": 0.7535210326766968, "train_acc": 0.76782, "test_loss": 1.7884279314041138, "test_acc": 0.5658, "lyapunov": null, "grad_norm": 0.9214199202766519, "grad_max_sv": 0.39339111372828484, "grad_min_sv": 1.6136958740434192e-08, "grad_condition": 115362103.47666125, "lr": 0.000810573890139155, "time_sec": 15.505242109298706 }, { "epoch": 44, "train_loss": 0.7410284707832336, "train_acc": 0.77312, "test_loss": 1.7518087032318115, "test_acc": 0.575, "lyapunov": null, "grad_norm": 0.9135862495102605, "grad_max_sv": 0.4029770277440548, "grad_min_sv": 1.6805088312935034e-08, "grad_condition": 94769472.27955042, "lr": 0.0008022995574311873, "time_sec": 15.517944812774658 }, { "epoch": 45, "train_loss": 0.7176916319656372, "train_acc": 0.77704, "test_loss": 2.0678364603042603, "test_acc": 0.5371, "lyapunov": null, "grad_norm": 0.9046856584920682, "grad_max_sv": 0.3983215056359768, "grad_min_sv": 1.613215366361165e-08, "grad_condition": 71122656.74298272, "lr": 0.0007938926261462363, "time_sec": 15.508166313171387 }, { "epoch": 46, "train_loss": 0.7069017255210877, "train_acc": 0.7811, "test_loss": 1.7433353471755981, "test_acc": 0.5852, "lyapunov": null, "grad_norm": 0.8978206260313095, "grad_max_sv": 0.3794424146413803, "grad_min_sv": 1.602237248293781e-08, "grad_condition": 54736720.76954285, "lr": 0.0007853567838422158, "time_sec": 15.502079725265503 }, { "epoch": 47, "train_loss": 0.6877984882736206, "train_acc": 0.7887, "test_loss": 1.818675978088379, "test_acc": 0.571, "lyapunov": null, "grad_norm": 0.8819975234594025, "grad_max_sv": 0.3825521655380726, "grad_min_sv": 1.5721361913863253e-08, "grad_condition": 205362522.60160935, "lr": 0.0007766957746216719, "time_sec": 15.509292840957642 }, { "epoch": 48, "train_loss": 0.6792054767608643, "train_acc": 0.78942, "test_loss": 1.8216966215133668, "test_acc": 0.5718, "lyapunov": null, "grad_norm": 0.8744607628160516, "grad_max_sv": 0.3726635776460171, "grad_min_sv": 1.5723771835604582e-08, "grad_condition": 93081917.25808936, "lr": 0.0007679133974894982, "time_sec": 15.525796890258789 }, { "epoch": 49, "train_loss": 0.6626561027145386, "train_acc": 0.79284, "test_loss": 1.772965872001648, "test_acc": 0.5863, "lyapunov": null, "grad_norm": 0.8660062343667397, "grad_max_sv": 0.3925539918243885, "grad_min_sv": 1.5532864388332138e-08, "grad_condition": 566473525.6824175, "lr": 0.000759013504686565, "time_sec": 15.50195598602295 }, { "epoch": 50, "train_loss": 0.6532552631759644, "train_acc": 0.79666, "test_loss": 1.8317417165756225, "test_acc": 0.5724, "lyapunov": null, "grad_norm": 0.860130500782199, "grad_max_sv": 0.3667507700622082, "grad_min_sv": 1.5443047825941526e-08, "grad_condition": 91486044.66793105, "lr": 0.0007499999999999998, "time_sec": 15.508357286453247 }, { "epoch": 51, "train_loss": 0.6380054843711853, "train_acc": 0.80084, "test_loss": 1.8737646755218507, "test_acc": 0.5686, "lyapunov": null, "grad_norm": 0.8524936007576276, "grad_max_sv": 0.3761135272681713, "grad_min_sv": 1.5451151683110177e-08, "grad_condition": 34353598.33829906, "lr": 0.0007408768370508575, "time_sec": 15.523806810379028 }, { "epoch": 52, "train_loss": 0.6237339858055114, "train_acc": 0.80636, "test_loss": 1.761890636062622, "test_acc": 0.5872, "lyapunov": null, "grad_norm": 0.8410504283608066, "grad_max_sv": 0.358472990244627, "grad_min_sv": 1.503268568618654e-08, "grad_condition": 136795884.7400892, "lr": 0.0007316480175599307, "time_sec": 15.495483636856079 }, { "epoch": 53, "train_loss": 0.6058457711982727, "train_acc": 0.80932, "test_loss": 1.9825311820983886, "test_acc": 0.5638, "lyapunov": null, "grad_norm": 0.8335328667900934, "grad_max_sv": 0.36334397196769713, "grad_min_sv": 1.5307615661760283e-08, "grad_condition": 250366089.5715099, "lr": 0.0007223175895924635, "time_sec": 15.514543771743774 }, { "epoch": 54, "train_loss": 0.6004596606063842, "train_acc": 0.81078, "test_loss": 1.8254186273574828, "test_acc": 0.5794, "lyapunov": null, "grad_norm": 0.8274523113635032, "grad_max_sv": 0.36342041566967964, "grad_min_sv": 1.4868843903077106e-08, "grad_condition": 300576728.02848065, "lr": 0.0007128896457825361, "time_sec": 15.540250062942505 }, { "epoch": 55, "train_loss": 0.5861557857704163, "train_acc": 0.8164, "test_loss": 1.824499238014221, "test_acc": 0.583, "lyapunov": null, "grad_norm": 0.8198101267614993, "grad_max_sv": 0.357354723662138, "grad_min_sv": 1.4506401982417039e-08, "grad_condition": 35029629.47074116, "lr": 0.0007033683215378998, "time_sec": 15.531729459762573 }, { "epoch": 56, "train_loss": 0.5844129343986512, "train_acc": 0.81744, "test_loss": 1.9169658557891847, "test_acc": 0.5711, "lyapunov": null, "grad_norm": 0.8204173814530821, "grad_max_sv": 0.35366991981863977, "grad_min_sv": 1.4835723899028764e-08, "grad_condition": 72623356.9140754, "lr": 0.0006937577932260512, "time_sec": 15.517155647277832 }, { "epoch": 57, "train_loss": 0.567106929988861, "train_acc": 0.82118, "test_loss": 1.872194965362549, "test_acc": 0.5783, "lyapunov": null, "grad_norm": 0.8144173645411016, "grad_max_sv": 0.3568101763725281, "grad_min_sv": 1.459230552047601e-08, "grad_condition": 479856948.8028302, "lr": 0.0006840622763423388, "time_sec": 15.499967098236084 }, { "epoch": 58, "train_loss": 0.5492036812782287, "train_acc": 0.82718, "test_loss": 1.9435380107879638, "test_acc": 0.5717, "lyapunov": null, "grad_norm": 0.8017437900627353, "grad_max_sv": 0.35105792358517646, "grad_min_sv": 1.4126277701753675e-08, "grad_condition": 43594921.05141826, "lr": 0.0006742860236609073, "time_sec": 15.517162084579468 }, { "epoch": 59, "train_loss": 0.5499647881126404, "train_acc": 0.82578, "test_loss": 1.9104221244812012, "test_acc": 0.5719, "lyapunov": null, "grad_norm": 0.8008754176084809, "grad_max_sv": 0.35147457346320155, "grad_min_sv": 1.4486321607987823e-08, "grad_condition": 183104197.19597444, "lr": 0.0006644333233692913, "time_sec": 15.51251220703125 }, { "epoch": 60, "train_loss": 0.534982263879776, "train_acc": 0.83032, "test_loss": 1.8654183416366577, "test_acc": 0.5849, "lyapunov": null, "grad_norm": 0.7872093874708191, "grad_max_sv": 0.3456037163734436, "grad_min_sv": 1.4336570289236833e-08, "grad_condition": 4249914917.2238555, "lr": 0.0006545084971874734, "time_sec": 15.505401134490967 }, { "epoch": 61, "train_loss": 0.5249415069770813, "train_acc": 0.83296, "test_loss": 1.8301967880249024, "test_acc": 0.5899, "lyapunov": null, "grad_norm": 0.7823659308548245, "grad_max_sv": 0.3372106350958347, "grad_min_sv": 1.3865955505228816e-08, "grad_condition": 252598095.01328754, "lr": 0.0006445158984722354, "time_sec": 15.503329277038574 }, { "epoch": 62, "train_loss": 0.510102439250946, "train_acc": 0.8393, "test_loss": 1.866330424118042, "test_acc": 0.5875, "lyapunov": null, "grad_norm": 0.7690765731453699, "grad_max_sv": 0.3254604462534189, "grad_min_sv": 1.3302552516816778e-08, "grad_condition": 201820413.1939206, "lr": 0.0006344599103076324, "time_sec": 15.51197862625122 }, { "epoch": 63, "train_loss": 0.5105279865837097, "train_acc": 0.83724, "test_loss": 1.901947551727295, "test_acc": 0.5827, "lyapunov": null, "grad_norm": 0.7774036231362129, "grad_max_sv": 0.3391082786023617, "grad_min_sv": 1.3618166180666413e-08, "grad_condition": 142624827.53962922, "lr": 0.0006243449435824269, "time_sec": 15.512575387954712 }, { "epoch": 64, "train_loss": 0.4943154125213623, "train_acc": 0.84368, "test_loss": 1.8720532272338868, "test_acc": 0.5871, "lyapunov": null, "grad_norm": 0.7622106739600653, "grad_max_sv": 0.3370689533650875, "grad_min_sv": 1.3509893057039868e-08, "grad_condition": 110330065.15549783, "lr": 0.0006141754350553275, "time_sec": 15.502142667770386 }, { "epoch": 65, "train_loss": 0.47654122495651247, "train_acc": 0.84812, "test_loss": 1.905906325340271, "test_acc": 0.5836, "lyapunov": null, "grad_norm": 0.7485726591566199, "grad_max_sv": 0.3178395930677652, "grad_min_sv": 1.3372613298992531e-08, "grad_condition": 61795906.83332411, "lr": 0.0006039558454088793, "time_sec": 15.515769243240356 }, { "epoch": 66, "train_loss": 0.4698985565757752, "train_acc": 0.85062, "test_loss": 1.9764730356216431, "test_acc": 0.5772, "lyapunov": null, "grad_norm": 0.742030695327052, "grad_max_sv": 0.32952211387455466, "grad_min_sv": 1.321727686021503e-08, "grad_condition": 4546159923.454214, "lr": 0.000593690657292862, "time_sec": 15.48769211769104 }, { "epoch": 67, "train_loss": 0.4604379980945587, "train_acc": 0.8524, "test_loss": 1.796267902946472, "test_acc": 0.6041, "lyapunov": null, "grad_norm": 0.740514981620189, "grad_max_sv": 0.33283664137125013, "grad_min_sv": 1.3323875688170395e-08, "grad_condition": 50110355.592218384, "lr": 0.0005833843733580507, "time_sec": 15.512935638427734 }, { "epoch": 68, "train_loss": 0.44513163749694823, "train_acc": 0.85782, "test_loss": 1.882637822341919, "test_acc": 0.5923, "lyapunov": null, "grad_norm": 0.728632370248676, "grad_max_sv": 0.3257355663925409, "grad_min_sv": 1.2869882924648746e-08, "grad_condition": 63884816.41740811, "lr": 0.0005730415142812054, "time_sec": 15.52915072441101 }, { "epoch": 69, "train_loss": 0.4467424920272827, "train_acc": 0.85622, "test_loss": 1.8523083587646485, "test_acc": 0.5958, "lyapunov": null, "grad_norm": 0.7288387711248852, "grad_max_sv": 0.322311682254076, "grad_min_sv": 1.291249293496055e-08, "grad_condition": 179204657.50522354, "lr": 0.0005626666167821517, "time_sec": 15.511183738708496 }, { "epoch": 70, "train_loss": 0.4350817290687561, "train_acc": 0.86062, "test_loss": 1.9277977352142335, "test_acc": 0.5905, "lyapunov": null, "grad_norm": 0.7211268163108158, "grad_max_sv": 0.3169262710958719, "grad_min_sv": 1.2573862395379165e-08, "grad_condition": 248234270.03092772, "lr": 0.0005522642316338265, "time_sec": 15.514695167541504 }, { "epoch": 71, "train_loss": 0.43583440225601194, "train_acc": 0.86066, "test_loss": 1.940795637512207, "test_acc": 0.59, "lyapunov": null, "grad_norm": 0.7218256453060395, "grad_max_sv": 0.3179506029933691, "grad_min_sv": 1.2854640636141001e-08, "grad_condition": 159315542.25023228, "lr": 0.0005418389216661573, "time_sec": 15.515326499938965 }, { "epoch": 72, "train_loss": 0.414209595451355, "train_acc": 0.86682, "test_loss": 1.9192114906311035, "test_acc": 0.5871, "lyapunov": null, "grad_norm": 0.7026800304062572, "grad_max_sv": 0.3194992933422327, "grad_min_sv": 1.2563614283167892e-08, "grad_condition": 438466879.2604634, "lr": 0.0005313952597646563, "time_sec": 15.508101224899292 }, { "epoch": 73, "train_loss": 0.41810142745018003, "train_acc": 0.86568, "test_loss": 1.9427220703125, "test_acc": 0.5871, "lyapunov": null, "grad_norm": 0.7107104457797438, "grad_max_sv": 0.3116331197321415, "grad_min_sv": 1.2560458482156755e-08, "grad_condition": 218040038.56003165, "lr": 0.0005209378268645994, "time_sec": 15.528023719787598 }, { "epoch": 74, "train_loss": 0.4033842642211914, "train_acc": 0.87, "test_loss": 1.9472733200073242, "test_acc": 0.5874, "lyapunov": null, "grad_norm": 0.6981925142164059, "grad_max_sv": 0.3173716105520725, "grad_min_sv": 1.260878115683789e-08, "grad_condition": 120156618.97368078, "lr": 0.0005104712099416781, "time_sec": 15.506508111953735 }, { "epoch": 75, "train_loss": 0.39077227040290835, "train_acc": 0.87468, "test_loss": 1.857486226272583, "test_acc": 0.598, "lyapunov": null, "grad_norm": 0.6856338799556791, "grad_max_sv": 0.30381867848336697, "grad_min_sv": 1.2063926282295315e-08, "grad_condition": 414020461.3005485, "lr": 0.0004999999999999996, "time_sec": 15.522391557693481 }, { "epoch": 76, "train_loss": 0.3836136112689972, "train_acc": 0.8757, "test_loss": 1.9512550479888917, "test_acc": 0.587, "lyapunov": null, "grad_norm": 0.6870816068446682, "grad_max_sv": 0.3084618851542473, "grad_min_sv": 1.2161173516388873e-08, "grad_condition": 299698503.7116597, "lr": 0.0004895287900583212, "time_sec": 15.51857614517212 }, { "epoch": 77, "train_loss": 0.38193485226631163, "train_acc": 0.87626, "test_loss": 1.8681373037338256, "test_acc": 0.5993, "lyapunov": null, "grad_norm": 0.6828844071671899, "grad_max_sv": 0.30646760389208794, "grad_min_sv": 1.2204253475693593e-08, "grad_condition": 272459180.1924466, "lr": 0.0004790621731353997, "time_sec": 15.519853591918945 }, { "epoch": 78, "train_loss": 0.37069116824150083, "train_acc": 0.88084, "test_loss": 1.875751858139038, "test_acc": 0.6043, "lyapunov": null, "grad_norm": 0.6706724909872018, "grad_max_sv": 0.30184795036911966, "grad_min_sv": 1.1925269455606569e-08, "grad_condition": 303963866.0557478, "lr": 0.000468604740235343, "time_sec": 15.520630836486816 }, { "epoch": 79, "train_loss": 0.3643507383155823, "train_acc": 0.88364, "test_loss": 1.9180334386825562, "test_acc": 0.5942, "lyapunov": null, "grad_norm": 0.6691117052818351, "grad_max_sv": 0.2972587738186121, "grad_min_sv": 1.1847118905870552e-08, "grad_condition": 4229198196.1638947, "lr": 0.00045816107833384175, "time_sec": 15.53023386001587 }, { "epoch": 80, "train_loss": 0.3633389077377319, "train_acc": 0.88294, "test_loss": 1.8658218830108642, "test_acc": 0.6003, "lyapunov": null, "grad_norm": 0.6700579474761854, "grad_max_sv": 0.2936097148805857, "grad_min_sv": 1.1731030144946502e-08, "grad_condition": 196324429.7051069, "lr": 0.0004477357683661729, "time_sec": 15.50595474243164 }, { "epoch": 81, "train_loss": 0.35195467962265015, "train_acc": 0.88632, "test_loss": 1.9072984680175782, "test_acc": 0.5985, "lyapunov": null, "grad_norm": 0.6558349942319918, "grad_max_sv": 0.2942222774028778, "grad_min_sv": 1.1174211227583247e-08, "grad_condition": 686453916.7723808, "lr": 0.00043733338321784746, "time_sec": 15.547033786773682 }, { "epoch": 82, "train_loss": 0.34602870296001437, "train_acc": 0.88766, "test_loss": 1.9684966739654541, "test_acc": 0.5914, "lyapunov": null, "grad_norm": 0.6555903608944951, "grad_max_sv": 0.29228324331343175, "grad_min_sv": 1.1487677028338903e-08, "grad_condition": 383534563.2338952, "lr": 0.0004269584857187939, "time_sec": 15.51542615890503 }, { "epoch": 83, "train_loss": 0.3428422933292389, "train_acc": 0.89108, "test_loss": 1.9337468532562256, "test_acc": 0.5993, "lyapunov": null, "grad_norm": 0.6492331544938933, "grad_max_sv": 0.28135959543287753, "grad_min_sv": 1.1496448484339673e-08, "grad_condition": 414922787.7095521, "lr": 0.0004166156266419484, "time_sec": 15.53177547454834 }, { "epoch": 84, "train_loss": 0.328343852148056, "train_acc": 0.89454, "test_loss": 1.9273885646820068, "test_acc": 0.6009, "lyapunov": null, "grad_norm": 0.6390681347680143, "grad_max_sv": 0.28590504080057144, "grad_min_sv": 1.1241013130221244e-08, "grad_condition": 433920435.0763866, "lr": 0.0004063093427071373, "time_sec": 15.530908346176147 }, { "epoch": 85, "train_loss": 0.3230694122695923, "train_acc": 0.89496, "test_loss": 1.9058713027954102, "test_acc": 0.5998, "lyapunov": null, "grad_norm": 0.6383613950635205, "grad_max_sv": 0.2902642168104649, "grad_min_sv": 1.141585580797036e-08, "grad_condition": 604353313.9340062, "lr": 0.0003960441545911199, "time_sec": 15.515930414199829 }, { "epoch": 86, "train_loss": 0.31695827428817747, "train_acc": 0.8967, "test_loss": 1.9341052951812745, "test_acc": 0.5998, "lyapunov": null, "grad_norm": 0.6323196704290217, "grad_max_sv": 0.30049107149243354, "grad_min_sv": 1.1364172216449253e-08, "grad_condition": 253780845.1911161, "lr": 0.0003858245649446718, "time_sec": 15.52891731262207 }, { "epoch": 87, "train_loss": 0.310550309715271, "train_acc": 0.8979, "test_loss": 1.9645798837661743, "test_acc": 0.5972, "lyapunov": null, "grad_norm": 0.6290293549615046, "grad_max_sv": 0.28168079666793344, "grad_min_sv": 1.1139878612566237e-08, "grad_condition": 3174828807.3372684, "lr": 0.00037565505641757235, "time_sec": 15.527303218841553 }, { "epoch": 88, "train_loss": 0.30801844054222105, "train_acc": 0.89982, "test_loss": 1.9113462907791137, "test_acc": 0.6061, "lyapunov": null, "grad_norm": 0.6261342549488306, "grad_max_sv": 0.2938710656017065, "grad_min_sv": 1.1276199778260943e-08, "grad_condition": 166623199.75638226, "lr": 0.00036554008969236695, "time_sec": 15.515942573547363 }, { "epoch": 89, "train_loss": 0.3031072138786316, "train_acc": 0.90226, "test_loss": 1.932079137611389, "test_acc": 0.6084, "lyapunov": null, "grad_norm": 0.6209363139222046, "grad_max_sv": 0.2818705204874277, "grad_min_sv": 1.0986600190287382e-08, "grad_condition": 235648712.41506353, "lr": 0.0003554841015277638, "time_sec": 15.523046731948853 }, { "epoch": 90, "train_loss": 0.295468587474823, "train_acc": 0.90442, "test_loss": 1.9561836023330688, "test_acc": 0.6029, "lyapunov": null, "grad_norm": 0.6134434549386554, "grad_max_sv": 0.28373970463871956, "grad_min_sv": 1.1000367631294056e-08, "grad_condition": 371761681.0452756, "lr": 0.000345491502812526, "time_sec": 15.52297592163086 }, { "epoch": 91, "train_loss": 0.29119554637908934, "train_acc": 0.90446, "test_loss": 1.993441968536377, "test_acc": 0.6049, "lyapunov": null, "grad_norm": 0.6105333020567495, "grad_max_sv": 0.27541381642222407, "grad_min_sv": 1.0823096196089371e-08, "grad_condition": 473734139.3827542, "lr": 0.0003355666766307081, "time_sec": 15.514235258102417 }, { "epoch": 92, "train_loss": 0.28460477176189425, "train_acc": 0.90876, "test_loss": 1.9682166564941406, "test_acc": 0.6057, "lyapunov": null, "grad_norm": 0.5988483508766865, "grad_max_sv": 0.27126791067421435, "grad_min_sv": 1.0722518893266364e-08, "grad_condition": 97668951.32032181, "lr": 0.00032571397633909225, "time_sec": 15.52116084098816 }, { "epoch": 93, "train_loss": 0.2825835990524292, "train_acc": 0.90854, "test_loss": 1.9348359714508057, "test_acc": 0.6041, "lyapunov": null, "grad_norm": 0.6011972747002627, "grad_max_sv": 0.2796713523566723, "grad_min_sv": 1.0827668426964532e-08, "grad_condition": 881127416.7703698, "lr": 0.00031593772365766094, "time_sec": 15.528529644012451 }, { "epoch": 94, "train_loss": 0.2801620689296722, "train_acc": 0.9097, "test_loss": 1.980628232383728, "test_acc": 0.6055, "lyapunov": null, "grad_norm": 0.5993074321032092, "grad_max_sv": 0.2800555154681206, "grad_min_sv": 1.0468388221378244e-08, "grad_condition": 140732695.72303194, "lr": 0.0003062422067739483, "time_sec": 15.532250165939331 }, { "epoch": 95, "train_loss": 0.26648273178100584, "train_acc": 0.9142, "test_loss": 2.0015383081436156, "test_acc": 0.6016, "lyapunov": null, "grad_norm": 0.5881453904576209, "grad_max_sv": 0.27579851634800434, "grad_min_sv": 1.0274321395227492e-08, "grad_condition": 201871276.47904783, "lr": 0.00029663167846209965, "time_sec": 15.681024551391602 }, { "epoch": 96, "train_loss": 0.26776352972984313, "train_acc": 0.91448, "test_loss": 2.0207461967468263, "test_acc": 0.6012, "lyapunov": null, "grad_norm": 0.5860462649686203, "grad_max_sv": 0.2698933105915785, "grad_min_sv": 1.0329826621857664e-08, "grad_condition": 76135409.2144176, "lr": 0.00028711035421746345, "time_sec": 15.536462545394897 }, { "epoch": 97, "train_loss": 0.25857464953899384, "train_acc": 0.91696, "test_loss": 1.9442026258468628, "test_acc": 0.6066, "lyapunov": null, "grad_norm": 0.579918050497587, "grad_max_sv": 0.28092321269214154, "grad_min_sv": 1.0451780512853865e-08, "grad_condition": 432604154.8635365, "lr": 0.00027768241040753615, "time_sec": 15.520632982254028 }, { "epoch": 98, "train_loss": 0.2567158591556549, "train_acc": 0.91576, "test_loss": 1.952080411529541, "test_acc": 0.6097, "lyapunov": null, "grad_norm": 0.5815827800021661, "grad_max_sv": 0.26784452944993975, "grad_min_sv": 9.97831211164979e-09, "grad_condition": 91061008.30272922, "lr": 0.00026835198244006903, "time_sec": 15.535520553588867 }, { "epoch": 99, "train_loss": 0.24892670249938964, "train_acc": 0.9202, "test_loss": 2.033794689941406, "test_acc": 0.6019, "lyapunov": null, "grad_norm": 0.5696851893969495, "grad_max_sv": 0.2726339440792799, "grad_min_sv": 9.946045926049683e-09, "grad_condition": 1696689541.1727843, "lr": 0.0002591231629491421, "time_sec": 15.538635969161987 }, { "epoch": 100, "train_loss": 0.24926711993694306, "train_acc": 0.91978, "test_loss": 1.9742811960220337, "test_acc": 0.6068, "lyapunov": null, "grad_norm": 0.5702583833389835, "grad_max_sv": 0.26799715869128704, "grad_min_sv": 9.895174417351438e-09, "grad_condition": 297572156.6297859, "lr": 0.0002499999999999997, "time_sec": 15.536820650100708 }, { "epoch": 101, "train_loss": 0.2401547999382019, "train_acc": 0.92344, "test_loss": 1.99689197101593, "test_acc": 0.6077, "lyapunov": null, "grad_norm": 0.5610283078331603, "grad_max_sv": 0.2691540464758873, "grad_min_sv": 9.99432525588921e-09, "grad_condition": 545457041.2762839, "lr": 0.00024098649531343477, "time_sec": 15.541125774383545 }, { "epoch": 102, "train_loss": 0.2366540629529953, "train_acc": 0.92332, "test_loss": 1.9686679859161378, "test_acc": 0.6043, "lyapunov": null, "grad_norm": 0.5596319863447712, "grad_max_sv": 0.2598999205976725, "grad_min_sv": 9.748093400801378e-09, "grad_condition": 280631646.0385326, "lr": 0.0002320866025105016, "time_sec": 15.642221689224243 }, { "epoch": 103, "train_loss": 0.23095350846290588, "train_acc": 0.92478, "test_loss": 1.9796740842819214, "test_acc": 0.6086, "lyapunov": null, "grad_norm": 0.5527105531261713, "grad_max_sv": 0.2648670017719269, "grad_min_sv": 1.0250657645751934e-08, "grad_condition": 501602567.1069907, "lr": 0.0002233042253783278, "time_sec": 15.533202886581421 }, { "epoch": 104, "train_loss": 0.23427851341247558, "train_acc": 0.92466, "test_loss": 1.9721594404220582, "test_acc": 0.6107, "lyapunov": null, "grad_norm": 0.5589041472139786, "grad_max_sv": 0.25932734124362466, "grad_min_sv": 9.605904077877003e-09, "grad_condition": 1031803946.0677515, "lr": 0.000214643216157784, "time_sec": 15.51241683959961 }, { "epoch": 105, "train_loss": 0.219517624874115, "train_acc": 0.9293, "test_loss": 2.0007881326675414, "test_acc": 0.6035, "lyapunov": null, "grad_norm": 0.5422594048752922, "grad_max_sv": 0.2685978960245848, "grad_min_sv": 9.883629456617499e-09, "grad_condition": 224740616.11832863, "lr": 0.00020610737385376332, "time_sec": 15.537052392959595 }, { "epoch": 106, "train_loss": 0.2232757794523239, "train_acc": 0.92674, "test_loss": 2.0058324546813964, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.5472900635805251, "grad_max_sv": 0.2613681871443987, "grad_min_sv": 9.819886173656478e-09, "grad_condition": 176319742.57465333, "lr": 0.00019770044256881242, "time_sec": 15.542799949645996 }, { "epoch": 107, "train_loss": 0.21997562067031862, "train_acc": 0.92926, "test_loss": 1.989624990081787, "test_acc": 0.6099, "lyapunov": null, "grad_norm": 0.5414473725256549, "grad_max_sv": 0.2557095166295767, "grad_min_sv": 9.448845216301038e-09, "grad_condition": 1407753979.8512912, "lr": 0.0001894261098608447, "time_sec": 15.52652359008789 }, { "epoch": 108, "train_loss": 0.2132127531719208, "train_acc": 0.93122, "test_loss": 2.043244864463806, "test_acc": 0.6013, "lyapunov": null, "grad_norm": 0.5380471333664735, "grad_max_sv": 0.255327982082963, "grad_min_sv": 9.992253989770521e-09, "grad_condition": 429655462.4469593, "lr": 0.000181288005125655, "time_sec": 15.52126145362854 }, { "epoch": 109, "train_loss": 0.21187591857910157, "train_acc": 0.93122, "test_loss": 1.9954864723205565, "test_acc": 0.6098, "lyapunov": null, "grad_norm": 0.5380204381544875, "grad_max_sv": 0.26441522017121316, "grad_min_sv": 9.557367238854226e-09, "grad_condition": 237566723.1979712, "lr": 0.0001732896980049473, "time_sec": 15.548521995544434 }, { "epoch": 110, "train_loss": 0.20928363649368287, "train_acc": 0.9326, "test_loss": 1.9480315828323365, "test_acc": 0.6146, "lyapunov": null, "grad_norm": 0.5298971206452113, "grad_max_sv": 0.26398450396955014, "grad_min_sv": 9.874217052428108e-09, "grad_condition": 197519783.8891028, "lr": 0.00016543469682057076, "time_sec": 15.51990032196045 }, { "epoch": 111, "train_loss": 0.20472501375198365, "train_acc": 0.93442, "test_loss": 1.9880135498046876, "test_acc": 0.6114, "lyapunov": null, "grad_norm": 0.5226715722616327, "grad_max_sv": 0.25575212091207505, "grad_min_sv": 9.559482279462156e-09, "grad_condition": 213563040.67873913, "lr": 0.00015772644703565552, "time_sec": 15.518001079559326 }, { "epoch": 112, "train_loss": 0.20579987778663636, "train_acc": 0.93296, "test_loss": 2.016691120529175, "test_acc": 0.6117, "lyapunov": null, "grad_norm": 0.5297683532569843, "grad_max_sv": 0.25805489346385, "grad_min_sv": 9.560597037899625e-09, "grad_condition": 1064723629.28162, "lr": 0.00015016832974331713, "time_sec": 15.522767305374146 }, { "epoch": 113, "train_loss": 0.20068273310422896, "train_acc": 0.93668, "test_loss": 2.0594107456207276, "test_acc": 0.6086, "lyapunov": null, "grad_norm": 0.5184460551642818, "grad_max_sv": 0.24561816416680812, "grad_min_sv": 9.581332657826458e-09, "grad_condition": 364510178.3461688, "lr": 0.00014276366018359834, "time_sec": 15.533010005950928 }, { "epoch": 114, "train_loss": 0.19722092057228088, "train_acc": 0.93788, "test_loss": 2.008504161453247, "test_acc": 0.6083, "lyapunov": null, "grad_norm": 0.5143544627139274, "grad_max_sv": 0.26034388653934004, "grad_min_sv": 9.650303647423114e-09, "grad_condition": 3361687889.542286, "lr": 0.00013551568628929425, "time_sec": 15.531035661697388 }, { "epoch": 115, "train_loss": 0.19389657697677612, "train_acc": 0.93868, "test_loss": 2.0233098300933836, "test_acc": 0.6117, "lyapunov": null, "grad_norm": 0.5104261903820102, "grad_max_sv": 0.24447884745895862, "grad_min_sv": 9.077133606870055e-09, "grad_condition": 461064774.41410434, "lr": 0.00012842758726130276, "time_sec": 15.524327993392944 }, { "epoch": 116, "train_loss": 0.19362226080417633, "train_acc": 0.93796, "test_loss": 2.053111413192749, "test_acc": 0.6054, "lyapunov": null, "grad_norm": 0.5131743880915615, "grad_max_sv": 0.2492377854883671, "grad_min_sv": 9.515753446841246e-09, "grad_condition": 206396866.4016946, "lr": 0.0001215024721741218, "time_sec": 15.513204574584961 }, { "epoch": 117, "train_loss": 0.18898310523986817, "train_acc": 0.93976, "test_loss": 2.015893176269531, "test_acc": 0.6127, "lyapunov": null, "grad_norm": 0.5048514988009624, "grad_max_sv": 0.23975766226649284, "grad_min_sv": 9.193109389200611e-09, "grad_condition": 1880002960.4112122, "lr": 0.00011474337861210538, "time_sec": 15.531865119934082 }, { "epoch": 118, "train_loss": 0.18859933629989625, "train_acc": 0.93992, "test_loss": 2.0275477882385253, "test_acc": 0.613, "lyapunov": null, "grad_norm": 0.5070579132326548, "grad_max_sv": 0.2569826778024435, "grad_min_sv": 9.573198521970264e-09, "grad_condition": 946919734.9405922, "lr": 0.00010815327133708009, "time_sec": 15.528860330581665 }, { "epoch": 119, "train_loss": 0.18436414319992064, "train_acc": 0.9409, "test_loss": 2.035816400527954, "test_acc": 0.6094, "lyapunov": null, "grad_norm": 0.49869022882133546, "grad_max_sv": 0.24773051403462887, "grad_min_sv": 9.154285843075704e-09, "grad_condition": 330957531.4847302, "lr": 0.00010173504098790182, "time_sec": 15.546629190444946 }, { "epoch": 120, "train_loss": 0.18639450643777847, "train_acc": 0.94082, "test_loss": 2.0497810037612916, "test_acc": 0.6101, "lyapunov": null, "grad_norm": 0.5054264593475204, "grad_max_sv": 0.24650247804820538, "grad_min_sv": 9.350194245597021e-09, "grad_condition": 546741093.3651453, "lr": 9.549150281252629e-05, "time_sec": 15.52673053741455 }, { "epoch": 121, "train_loss": 0.18135397327423095, "train_acc": 0.94364, "test_loss": 2.0228085262298583, "test_acc": 0.6112, "lyapunov": null, "grad_norm": 0.49196950746055856, "grad_max_sv": 0.25292878448963163, "grad_min_sv": 9.245442955446368e-09, "grad_condition": 345415022.7201654, "lr": 8.942539543314794e-05, "time_sec": 15.530716180801392 }, { "epoch": 122, "train_loss": 0.17821871382713317, "train_acc": 0.94288, "test_loss": 2.015850890350342, "test_acc": 0.6127, "lyapunov": null, "grad_norm": 0.4943397097989714, "grad_max_sv": 0.2537323322147131, "grad_min_sv": 9.237968556525395e-09, "grad_condition": 263035591.43015513, "lr": 8.353937964495024e-05, "time_sec": 15.536164045333862 }, { "epoch": 123, "train_loss": 0.17632093348026276, "train_acc": 0.9444, "test_loss": 2.029286048698425, "test_acc": 0.6089, "lyapunov": null, "grad_norm": 0.48806288568095135, "grad_max_sv": 0.2458991575986147, "grad_min_sv": 9.06146269260763e-09, "grad_condition": 386283353.8532323, "lr": 7.783603724899243e-05, "time_sec": 15.518115997314453 }, { "epoch": 124, "train_loss": 0.1732941804933548, "train_acc": 0.94456, "test_loss": 2.099158185958862, "test_acc": 0.6025, "lyapunov": null, "grad_norm": 0.4868912892942884, "grad_max_sv": 0.24448585212230683, "grad_min_sv": 8.980524343182167e-09, "grad_condition": 336891094.31355625, "lr": 7.231786991974666e-05, "time_sec": 15.542467832565308 }, { "epoch": 125, "train_loss": 0.17837541491031647, "train_acc": 0.94274, "test_loss": 2.0764820568084716, "test_acc": 0.61, "lyapunov": null, "grad_norm": 0.4948203710715524, "grad_max_sv": 0.24412455931305885, "grad_min_sv": 9.184420232503931e-09, "grad_condition": 716346437.4859622, "lr": 6.698729810778072e-05, "time_sec": 15.55189299583435 }, { "epoch": 126, "train_loss": 0.1735024337530136, "train_acc": 0.94474, "test_loss": 2.0553098888397217, "test_acc": 0.6111, "lyapunov": null, "grad_norm": 0.4854349633437902, "grad_max_sv": 0.2419682189822197, "grad_min_sv": 8.905077519393705e-09, "grad_condition": 839365296.5454277, "lr": 6.184665997806817e-05, "time_sec": 15.54058313369751 }, { "epoch": 127, "train_loss": 0.1715146116065979, "train_acc": 0.94478, "test_loss": 2.0106375900268554, "test_acc": 0.6128, "lyapunov": null, "grad_norm": 0.4816957588601112, "grad_max_sv": 0.23674072176218033, "grad_min_sv": 8.675588131831085e-09, "grad_condition": 478973714.0473558, "lr": 5.6898210384392595e-05, "time_sec": 15.529821157455444 }, { "epoch": 128, "train_loss": 0.1660640141773224, "train_acc": 0.9478, "test_loss": 2.0750678112030028, "test_acc": 0.6111, "lyapunov": null, "grad_norm": 0.4757528664416431, "grad_max_sv": 0.244390731677413, "grad_min_sv": 8.79119548703039e-09, "grad_condition": 457083152.2974655, "lr": 5.214411988029363e-05, "time_sec": 15.54984712600708 }, { "epoch": 129, "train_loss": 0.1666716690993309, "train_acc": 0.94686, "test_loss": 2.0469725986480714, "test_acc": 0.6123, "lyapunov": null, "grad_norm": 0.478310500713372, "grad_max_sv": 0.23569908998906614, "grad_min_sv": 8.542899999821468e-09, "grad_condition": 598853903.3316209, "lr": 4.7586473766990294e-05, "time_sec": 15.545772552490234 }, { "epoch": 130, "train_loss": 0.16598962943553924, "train_acc": 0.94712, "test_loss": 1.9995166748046875, "test_acc": 0.6146, "lyapunov": null, "grad_norm": 0.4758526221040286, "grad_max_sv": 0.23986518271267415, "grad_min_sv": 8.749124542689266e-09, "grad_condition": 608746268.1362782, "lr": 4.32272711786996e-05, "time_sec": 15.54599404335022 }, { "epoch": 131, "train_loss": 0.16668007793426515, "train_acc": 0.9479, "test_loss": 2.0491572677612306, "test_acc": 0.6109, "lyapunov": null, "grad_norm": 0.4755344205180913, "grad_max_sv": 0.23323244228959084, "grad_min_sv": 8.472622621633757e-09, "grad_condition": 233979199.2625857, "lr": 3.906842420574966e-05, "time_sec": 15.524599552154541 }, { "epoch": 132, "train_loss": 0.16224975943565367, "train_acc": 0.94862, "test_loss": 2.0500082311630248, "test_acc": 0.6134, "lyapunov": null, "grad_norm": 0.46871867660355254, "grad_max_sv": 0.2372895274311304, "grad_min_sv": 8.64411044331978e-09, "grad_condition": 287263322.167899, "lr": 3.5111757055874305e-05, "time_sec": 15.527011156082153 }, { "epoch": 133, "train_loss": 0.16492341012477874, "train_acc": 0.94736, "test_loss": 2.0346584928512574, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.47534738241769, "grad_max_sv": 0.24461643844842912, "grad_min_sv": 9.178972258834517e-09, "grad_condition": 500309812.0406585, "lr": 3.1359005254054254e-05, "time_sec": 15.547746658325195 }, { "epoch": 134, "train_loss": 0.16421831488609315, "train_acc": 0.94756, "test_loss": 2.0132702159881593, "test_acc": 0.6162, "lyapunov": null, "grad_norm": 0.4772419829809968, "grad_max_sv": 0.23413821049034594, "grad_min_sv": 9.002530253383878e-09, "grad_condition": 363205059.0549506, "lr": 2.7811814881259484e-05, "time_sec": 15.531517505645752 }, { "epoch": 135, "train_loss": 0.16381137976646423, "train_acc": 0.94842, "test_loss": 2.0648642013549803, "test_acc": 0.6083, "lyapunov": null, "grad_norm": 0.4736658227067323, "grad_max_sv": 0.23049395270645617, "grad_min_sv": 8.56864400186879e-09, "grad_condition": 1442465508.733611, "lr": 2.4471741852423218e-05, "time_sec": 15.541293859481812 }, { "epoch": 136, "train_loss": 0.16108462400436402, "train_acc": 0.94976, "test_loss": 2.0012967403411865, "test_acc": 0.6119, "lyapunov": null, "grad_norm": 0.465643715209168, "grad_max_sv": 0.23518772274255753, "grad_min_sv": 8.637825488558292e-09, "grad_condition": 243388926.8874995, "lr": 2.1340251233966362e-05, "time_sec": 15.512713193893433 }, { "epoch": 137, "train_loss": 0.1584918847179413, "train_acc": 0.94912, "test_loss": 2.050839980697632, "test_acc": 0.6104, "lyapunov": null, "grad_norm": 0.46730923038258504, "grad_max_sv": 0.23510748259723185, "grad_min_sv": 8.813612497248977e-09, "grad_condition": 1210234116.5017686, "lr": 1.8418716601170932e-05, "time_sec": 15.537960052490234 }, { "epoch": 138, "train_loss": 0.15678886548519136, "train_acc": 0.9508, "test_loss": 2.0579080810546877, "test_acc": 0.6137, "lyapunov": null, "grad_norm": 0.46202513180941285, "grad_max_sv": 0.22975999489426613, "grad_min_sv": 8.437959897781514e-09, "grad_condition": 1365594635.574403, "lr": 1.570841943568445e-05, "time_sec": 15.53256607055664 }, { "epoch": 139, "train_loss": 0.15868934306621552, "train_acc": 0.95058, "test_loss": 2.0891008211135866, "test_acc": 0.607, "lyapunov": null, "grad_norm": 0.46370376954923076, "grad_max_sv": 0.239790453761816, "grad_min_sv": 8.653809858939418e-09, "grad_condition": 751331866.6462338, "lr": 1.3210548563419845e-05, "time_sec": 15.542593002319336 }, { "epoch": 140, "train_loss": 0.16018940447807312, "train_acc": 0.94944, "test_loss": 2.0365436012268066, "test_acc": 0.6134, "lyapunov": null, "grad_norm": 0.46850944550951273, "grad_max_sv": 0.24336591213941575, "grad_min_sv": 8.69392097297767e-09, "grad_condition": 6372417042.7504635, "lr": 1.0926199633097203e-05, "time_sec": 15.530508279800415 }, { "epoch": 141, "train_loss": 0.1577048332262039, "train_acc": 0.95192, "test_loss": 2.048553763961792, "test_acc": 0.6177, "lyapunov": null, "grad_norm": 0.46173934960898333, "grad_max_sv": 0.2323433578014374, "grad_min_sv": 8.582540832018093e-09, "grad_condition": 374128300.47680604, "lr": 8.856374635655688e-06, "time_sec": 15.53349781036377 }, { "epoch": 142, "train_loss": 0.15599479459762572, "train_acc": 0.95136, "test_loss": 2.0303194038391115, "test_acc": 0.6141, "lyapunov": null, "grad_norm": 0.46112847461678763, "grad_max_sv": 0.23407747074961663, "grad_min_sv": 8.815537186779992e-09, "grad_condition": 888764932.2294099, "lr": 7.001981464747503e-06, "time_sec": 15.521865129470825 }, { "epoch": 143, "train_loss": 0.1572772634601593, "train_acc": 0.95076, "test_loss": 2.015152719116211, "test_acc": 0.6117, "lyapunov": null, "grad_norm": 0.46482832090967446, "grad_max_sv": 0.23328317552804947, "grad_min_sv": 8.496040210356943e-09, "grad_condition": 794958780.6842709, "lr": 5.3638335185058295e-06, "time_sec": 15.530633926391602 }, { "epoch": 144, "train_loss": 0.1607058820438385, "train_acc": 0.94982, "test_loss": 2.028663912010193, "test_acc": 0.6144, "lyapunov": null, "grad_norm": 0.46757658167064325, "grad_max_sv": 0.23105027191340924, "grad_min_sv": 8.55830176145836e-09, "grad_condition": 1653881177.8200665, "lr": 3.942649342761114e-06, "time_sec": 15.53608751296997 }, { "epoch": 145, "train_loss": 0.1565204811191559, "train_acc": 0.95166, "test_loss": 2.0279767280578613, "test_acc": 0.6155, "lyapunov": null, "grad_norm": 0.4638655873772094, "grad_max_sv": 0.23327881954610347, "grad_min_sv": 8.597103550930796e-09, "grad_condition": 316875488.0827421, "lr": 2.7390523158633524e-06, "time_sec": 15.526829719543457 }, { "epoch": 146, "train_loss": 0.15728166580677033, "train_acc": 0.95086, "test_loss": 1.9891761138916015, "test_acc": 0.6145, "lyapunov": null, "grad_norm": 0.46488895344189896, "grad_max_sv": 0.24002570435404777, "grad_min_sv": 8.740120454957777e-09, "grad_condition": 455470499.4939662, "lr": 1.7535703752478133e-06, "time_sec": 15.529450178146362 }, { "epoch": 147, "train_loss": 0.15490476808547973, "train_acc": 0.95148, "test_loss": 2.058331818771362, "test_acc": 0.61, "lyapunov": null, "grad_norm": 0.46221701830974254, "grad_max_sv": 0.2296001013368368, "grad_min_sv": 8.541372666505225e-09, "grad_condition": 659563768.7689784, "lr": 9.866357858642196e-07, "time_sec": 15.537895441055298 }, { "epoch": 148, "train_loss": 0.15796600056648255, "train_acc": 0.94986, "test_loss": 2.0414266393661498, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.46494816666423244, "grad_max_sv": 0.2453433360904455, "grad_min_sv": 8.874223652883401e-09, "grad_condition": 791324939.5663835, "lr": 4.38584950570808e-07, "time_sec": 15.552018165588379 }, { "epoch": 149, "train_loss": 0.1572165874862671, "train_acc": 0.9503, "test_loss": 2.0304482383728026, "test_acc": 0.6163, "lyapunov": null, "grad_norm": 0.46454324009038384, "grad_max_sv": 0.23642796650528908, "grad_min_sv": 8.51550397435591e-09, "grad_condition": 463955776.24121666, "lr": 1.096582625772501e-07, "time_sec": 15.526931762695312 }, { "epoch": 150, "train_loss": 0.15873465202331544, "train_acc": 0.94998, "test_loss": 2.0263592735290525, "test_acc": 0.6123, "lyapunov": null, "grad_norm": 0.46823921364683874, "grad_max_sv": 0.24224489107728003, "grad_min_sv": 8.409305788867338e-09, "grad_condition": 491457160.41681844, "lr": 0.0, "time_sec": 15.518765687942505 } ], "8": [ { "epoch": 1, "train_loss": 4.593809753570556, "train_acc": 0.06056, "test_loss": 4.250240661239624, "test_acc": 0.0724, "lyapunov": null, "grad_norm": 6.28680857536701, "grad_max_sv": 5.32494820356369, "grad_min_sv": 1.0926536573307998e-07, "grad_condition": 75430538.96608621, "lr": 0.0009998903417374227, "time_sec": 32.64524722099304 }, { "epoch": 2, "train_loss": 3.8781360272216796, "train_acc": 0.12202, "test_loss": 3.828091265106201, "test_acc": 0.1187, "lyapunov": null, "grad_norm": 4.685766976401904, "grad_max_sv": 3.971551901102066, "grad_min_sv": 8.512232171353773e-08, "grad_condition": 73925683.02884856, "lr": 0.0009995614150494292, "time_sec": 32.55369710922241 }, { "epoch": 3, "train_loss": 3.5183256304931643, "train_acc": 0.16986, "test_loss": 3.603372495651245, "test_acc": 0.1458, "lyapunov": null, "grad_norm": 3.857816495796443, "grad_max_sv": 3.131850999593735, "grad_min_sv": 7.069926738628718e-08, "grad_condition": 597358447.7631978, "lr": 0.0009990133642141358, "time_sec": 32.61470580101013 }, { "epoch": 4, "train_loss": 3.2580047064208983, "train_acc": 0.21016, "test_loss": 3.3982357917785646, "test_acc": 0.1898, "lyapunov": null, "grad_norm": 3.25322967284326, "grad_max_sv": 2.4588119089603424, "grad_min_sv": 6.045808895738247e-08, "grad_condition": 47197928.09495263, "lr": 0.0009982464296247522, "time_sec": 32.569292306900024 }, { "epoch": 5, "train_loss": 3.0406500122070312, "train_acc": 0.24896, "test_loss": 3.1738818031311036, "test_acc": 0.2326, "lyapunov": null, "grad_norm": 2.772030407825626, "grad_max_sv": 1.9638817846775054, "grad_min_sv": 5.119714804324715e-08, "grad_condition": 73515114.69409783, "lr": 0.0009972609476841367, "time_sec": 32.59326457977295 }, { "epoch": 6, "train_loss": 2.8603873377227784, "train_acc": 0.28122, "test_loss": 3.040658945083618, "test_acc": 0.2441, "lyapunov": null, "grad_norm": 2.406511937670546, "grad_max_sv": 1.6028138607740403, "grad_min_sv": 4.437380299870952e-08, "grad_condition": 42435152.16608156, "lr": 0.000996057350657239, "time_sec": 32.59000778198242 }, { "epoch": 7, "train_loss": 2.696464497909546, "train_acc": 0.3124, "test_loss": 2.7883455558776857, "test_acc": 0.3055, "lyapunov": null, "grad_norm": 2.1276389781637293, "grad_max_sv": 1.321936309337616, "grad_min_sv": 3.9740869406390546e-08, "grad_condition": 38077617.12004892, "lr": 0.000994636166481494, "time_sec": 32.58612537384033 }, { "epoch": 8, "train_loss": 2.5476934342956543, "train_acc": 0.34226, "test_loss": 2.7284567352294924, "test_acc": 0.3201, "lyapunov": null, "grad_norm": 1.9443800586445228, "grad_max_sv": 1.1562949120998383, "grad_min_sv": 3.6514397544484825e-08, "grad_condition": 50793777.88100208, "lr": 0.0009929980185352525, "time_sec": 32.609519958496094 }, { "epoch": 9, "train_loss": 2.420484928741455, "train_acc": 0.37, "test_loss": 2.5651690574645998, "test_acc": 0.3474, "lyapunov": null, "grad_norm": 1.7908327823271384, "grad_max_sv": 0.9936118766665458, "grad_min_sv": 3.386289501583484e-08, "grad_condition": 38337683.052389994, "lr": 0.0009911436253643444, "time_sec": 32.608171224594116 }, { "epoch": 10, "train_loss": 2.3262426779937746, "train_acc": 0.38734, "test_loss": 2.4693000373840333, "test_acc": 0.3722, "lyapunov": null, "grad_norm": 1.6585340858173223, "grad_max_sv": 0.8407874166965484, "grad_min_sv": 3.068910873760267e-08, "grad_condition": 34328942.84679211, "lr": 0.0009890738003669028, "time_sec": 32.64034914970398 }, { "epoch": 11, "train_loss": 2.2108732919311525, "train_acc": 0.41382, "test_loss": 2.465538624572754, "test_acc": 0.3705, "lyapunov": null, "grad_norm": 1.5729603360376456, "grad_max_sv": 0.778350618481636, "grad_min_sv": 2.959336372621024e-08, "grad_condition": 73499461.7080038, "lr": 0.00098678945143658, "time_sec": 32.57490301132202 }, { "epoch": 12, "train_loss": 2.1315050006103515, "train_acc": 0.4307, "test_loss": 2.3204302642822268, "test_acc": 0.3954, "lyapunov": null, "grad_norm": 1.5011321305083667, "grad_max_sv": 0.699262747168541, "grad_min_sv": 2.8460571517563427e-08, "grad_condition": 48774252.99057761, "lr": 0.0009842915805643154, "time_sec": 32.6048150062561 }, { "epoch": 13, "train_loss": 2.0442165532684324, "train_acc": 0.44988, "test_loss": 2.376241368865967, "test_acc": 0.3938, "lyapunov": null, "grad_norm": 1.4288710226212364, "grad_max_sv": 0.651852785050869, "grad_min_sv": 2.6736829209427978e-08, "grad_condition": 911183246.0701777, "lr": 0.000981581283398829, "time_sec": 32.5588493347168 }, { "epoch": 14, "train_loss": 1.9779467534637452, "train_acc": 0.46564, "test_loss": 2.3095103010177613, "test_acc": 0.3997, "lyapunov": null, "grad_norm": 1.3745196502469326, "grad_max_sv": 0.6157992795109749, "grad_min_sv": 2.619163226788568e-08, "grad_condition": 133496832.32967322, "lr": 0.0009786597487660333, "time_sec": 32.544082164764404 }, { "epoch": 15, "train_loss": 1.9085535586547853, "train_acc": 0.48116, "test_loss": 2.277028215789795, "test_acc": 0.4192, "lyapunov": null, "grad_norm": 1.3371637415095632, "grad_max_sv": 0.6050588846206665, "grad_min_sv": 2.4948501375562925e-08, "grad_condition": 111100134.80615222, "lr": 0.0009755282581475766, "time_sec": 32.55138826370239 }, { "epoch": 16, "train_loss": 1.8528347210693359, "train_acc": 0.49492, "test_loss": 2.1695428279876707, "test_acc": 0.4331, "lyapunov": null, "grad_norm": 1.2814778531944382, "grad_max_sv": 0.5591228373348713, "grad_min_sv": 2.4496722306199815e-08, "grad_condition": 25867184.37629143, "lr": 0.0009721881851187403, "time_sec": 32.59131908416748 }, { "epoch": 17, "train_loss": 1.7864885725402833, "train_acc": 0.5083, "test_loss": 2.2167986530303954, "test_acc": 0.428, "lyapunov": null, "grad_norm": 1.2365928586283268, "grad_max_sv": 0.5188852399587631, "grad_min_sv": 2.3400686853525254e-08, "grad_condition": 39202676.90349869, "lr": 0.0009686409947459456, "time_sec": 32.55093550682068 }, { "epoch": 18, "train_loss": 1.7305231869888307, "train_acc": 0.52088, "test_loss": 2.1779684148788454, "test_acc": 0.4405, "lyapunov": null, "grad_norm": 1.2047689336699439, "grad_max_sv": 0.5065509222447873, "grad_min_sv": 2.279239488256479e-08, "grad_condition": 28341315.825680755, "lr": 0.0009648882429441254, "time_sec": 32.556524991989136 }, { "epoch": 19, "train_loss": 1.6774425074768067, "train_acc": 0.53444, "test_loss": 2.22588055267334, "test_acc": 0.4357, "lyapunov": null, "grad_norm": 1.1702937955790653, "grad_max_sv": 0.4866269282996655, "grad_min_sv": 2.1823409551702255e-08, "grad_condition": 34695081.35711311, "lr": 0.00096093157579425, "time_sec": 32.57441163063049 }, { "epoch": 20, "train_loss": 1.6186258012771606, "train_acc": 0.54752, "test_loss": 2.1861088802337645, "test_acc": 0.4422, "lyapunov": null, "grad_norm": 1.1434442793867807, "grad_max_sv": 0.4658520080149174, "grad_min_sv": 2.124641216849632e-08, "grad_condition": 35023634.55777504, "lr": 0.0009567727288213001, "time_sec": 32.563255071640015 }, { "epoch": 21, "train_loss": 1.5804412273406983, "train_acc": 0.5552, "test_loss": 2.116827065849304, "test_acc": 0.4608, "lyapunov": null, "grad_norm": 1.1174809929853884, "grad_max_sv": 0.4587864212691784, "grad_min_sv": 2.115127252788618e-08, "grad_condition": 25409623.926622026, "lr": 0.0009524135262330095, "time_sec": 32.548664808273315 }, { "epoch": 22, "train_loss": 1.5373576833343505, "train_acc": 0.56826, "test_loss": 2.188752991104126, "test_acc": 0.4488, "lyapunov": null, "grad_norm": 1.0855473101193578, "grad_max_sv": 0.43056059926748275, "grad_min_sv": 2.025934667526652e-08, "grad_condition": 28615900.007624805, "lr": 0.0009478558801197061, "time_sec": 32.611814737319946 }, { "epoch": 23, "train_loss": 1.506667826461792, "train_acc": 0.57494, "test_loss": 2.174818174743652, "test_acc": 0.4577, "lyapunov": null, "grad_norm": 1.0696030802642686, "grad_max_sv": 0.43318344950675963, "grad_min_sv": 2.0166759195916484e-08, "grad_condition": 43974441.149682686, "lr": 0.000943101789615607, "time_sec": 32.57555532455444 }, { "epoch": 24, "train_loss": 1.47097098236084, "train_acc": 0.5857, "test_loss": 2.0404002576828004, "test_acc": 0.4847, "lyapunov": null, "grad_norm": 1.0479522200281932, "grad_max_sv": 0.4198159731924534, "grad_min_sv": 1.9698220292407863e-08, "grad_condition": 45870756.831042506, "lr": 0.0009381533400219313, "time_sec": 32.5772430896759 }, { "epoch": 25, "train_loss": 1.4312325327301025, "train_acc": 0.59378, "test_loss": 2.106845015716553, "test_acc": 0.4767, "lyapunov": null, "grad_norm": 1.0240308878342053, "grad_max_sv": 0.41350489780306815, "grad_min_sv": 1.9328133177981543e-08, "grad_condition": 69115062.26987141, "lr": 0.0009330127018922189, "time_sec": 32.557268142700195 }, { "epoch": 26, "train_loss": 1.3932979926300049, "train_acc": 0.60466, "test_loss": 2.0442503452301026, "test_acc": 0.4874, "lyapunov": null, "grad_norm": 1.0080444681764495, "grad_max_sv": 0.39995783641934396, "grad_min_sv": 1.8682676014569743e-08, "grad_condition": 33480939.457173, "lr": 0.000927682130080253, "time_sec": 32.54329538345337 }, { "epoch": 27, "train_loss": 1.3626447483444213, "train_acc": 0.61088, "test_loss": 2.1529213762283326, "test_acc": 0.4772, "lyapunov": null, "grad_norm": 0.9916083960305544, "grad_max_sv": 0.38913136497139933, "grad_min_sv": 1.803411719611403e-08, "grad_condition": 125553964.7328368, "lr": 0.0009221639627510072, "time_sec": 32.55648422241211 }, { "epoch": 28, "train_loss": 1.332198992652893, "train_acc": 0.6166, "test_loss": 2.2807082765579225, "test_acc": 0.4558, "lyapunov": null, "grad_norm": 0.9771496174881384, "grad_max_sv": 0.39622113704681394, "grad_min_sv": 1.8371455795529455e-08, "grad_condition": 25402444.150790665, "lr": 0.0009164606203550494, "time_sec": 32.56743788719177 }, { "epoch": 29, "train_loss": 1.3056928281402589, "train_acc": 0.62548, "test_loss": 2.3650270275115965, "test_acc": 0.4494, "lyapunov": null, "grad_norm": 0.9678089971160496, "grad_max_sv": 0.3883704259991646, "grad_min_sv": 1.808786349449809e-08, "grad_condition": 34866235.35928585, "lr": 0.0009105746045668516, "time_sec": 32.53697896003723 }, { "epoch": 30, "train_loss": 1.2669909148025513, "train_acc": 0.63598, "test_loss": 2.194760869216919, "test_acc": 0.4794, "lyapunov": null, "grad_norm": 0.9467141888064133, "grad_max_sv": 0.3744235411286354, "grad_min_sv": 1.7651215561236e-08, "grad_condition": 139376880.96042347, "lr": 0.0009045084971874733, "time_sec": 32.55838894844055 }, { "epoch": 31, "train_loss": 1.2365936059951783, "train_acc": 0.64152, "test_loss": 2.251469213104248, "test_acc": 0.4728, "lyapunov": null, "grad_norm": 0.9363746920375892, "grad_max_sv": 0.3752880610525608, "grad_min_sv": 1.7496447651810243e-08, "grad_condition": 33435292.843927078, "lr": 0.0008982649590120977, "time_sec": 32.56987476348877 }, { "epoch": 32, "train_loss": 1.2132414292144775, "train_acc": 0.6457, "test_loss": 2.155212931251526, "test_acc": 0.4953, "lyapunov": null, "grad_norm": 0.9198517753600641, "grad_max_sv": 0.3622582726180553, "grad_min_sv": 1.7169938390428767e-08, "grad_condition": 301357597.1554047, "lr": 0.0008918467286629196, "time_sec": 32.644938468933105 }, { "epoch": 33, "train_loss": 1.184193948135376, "train_acc": 0.654, "test_loss": 2.2338722274780274, "test_acc": 0.4833, "lyapunov": null, "grad_norm": 0.9078833042188178, "grad_max_sv": 0.3615180656313896, "grad_min_sv": 1.6779444181325154e-08, "grad_condition": 31157779.01941774, "lr": 0.0008852566213878943, "time_sec": 32.592013359069824 }, { "epoch": 34, "train_loss": 1.1604648839569092, "train_acc": 0.6605, "test_loss": 2.144485057640076, "test_acc": 0.4963, "lyapunov": null, "grad_norm": 0.8972811549201535, "grad_max_sv": 0.34557069540023805, "grad_min_sv": 1.606287251786076e-08, "grad_condition": 75723670.78622702, "lr": 0.000878497527825878, "time_sec": 32.58034062385559 }, { "epoch": 35, "train_loss": 1.1375362993240357, "train_acc": 0.66418, "test_loss": 2.181222864341736, "test_acc": 0.4898, "lyapunov": null, "grad_norm": 0.8889790406396809, "grad_max_sv": 0.35035020038485526, "grad_min_sv": 1.6642615324746756e-08, "grad_condition": 30786547.22695731, "lr": 0.000871572412738697, "time_sec": 32.54904317855835 }, { "epoch": 36, "train_loss": 1.1133264205932618, "train_acc": 0.67238, "test_loss": 2.1131927043914795, "test_acc": 0.5058, "lyapunov": null, "grad_norm": 0.8832491549304202, "grad_max_sv": 0.34634757712483405, "grad_min_sv": 1.6018088946911922e-08, "grad_condition": 49284260.37621014, "lr": 0.0008644843137107055, "time_sec": 32.58738970756531 }, { "epoch": 37, "train_loss": 1.0785640783309935, "train_acc": 0.67878, "test_loss": 2.2109802129745484, "test_acc": 0.4946, "lyapunov": null, "grad_norm": 0.8741999013148335, "grad_max_sv": 0.3421505123376846, "grad_min_sv": 1.5883508850886296e-08, "grad_condition": 147125609.85023776, "lr": 0.0008572363398164014, "time_sec": 32.6028311252594 }, { "epoch": 38, "train_loss": 1.0444296839141847, "train_acc": 0.68996, "test_loss": 2.2259356287002565, "test_acc": 0.4923, "lyapunov": null, "grad_norm": 0.8523318198837474, "grad_max_sv": 0.33938159644603727, "grad_min_sv": 1.5807346684382218e-08, "grad_condition": 34226370.63225422, "lr": 0.0008498316702566826, "time_sec": 32.560999393463135 }, { "epoch": 39, "train_loss": 1.023456362953186, "train_acc": 0.69698, "test_loss": 2.1364882369995115, "test_acc": 0.5049, "lyapunov": null, "grad_norm": 0.8498222777562341, "grad_max_sv": 0.3415807694196701, "grad_min_sv": 1.5869645431099144e-08, "grad_condition": 27853151.39901676, "lr": 0.0008422735529643442, "time_sec": 32.56105279922485 }, { "epoch": 40, "train_loss": 1.0050300610351564, "train_acc": 0.7014, "test_loss": 2.150569340324402, "test_acc": 0.5071, "lyapunov": null, "grad_norm": 0.8356269441634138, "grad_max_sv": 0.3239683095365763, "grad_min_sv": 1.5381535548204818e-08, "grad_condition": 155224453.46718103, "lr": 0.0008345653031794289, "time_sec": 32.59518837928772 }, { "epoch": 41, "train_loss": 0.9930689501571656, "train_acc": 0.7026, "test_loss": 2.154064438056946, "test_acc": 0.5136, "lyapunov": null, "grad_norm": 0.8262418740899825, "grad_max_sv": 0.3324408046901226, "grad_min_sv": 1.5276669600161607e-08, "grad_condition": 51863928.79048334, "lr": 0.0008267103019950526, "time_sec": 32.57974171638489 }, { "epoch": 42, "train_loss": 0.957993507232666, "train_acc": 0.7135, "test_loss": 2.1310552421569824, "test_acc": 0.5193, "lyapunov": null, "grad_norm": 0.8217377307572092, "grad_max_sv": 0.31569988913834096, "grad_min_sv": 1.4821617464605419e-08, "grad_condition": 57225046.557756186, "lr": 0.0008187119948743447, "time_sec": 32.74825191497803 }, { "epoch": 43, "train_loss": 0.9496447095489502, "train_acc": 0.71474, "test_loss": 2.1654404600143433, "test_acc": 0.5088, "lyapunov": null, "grad_norm": 0.8130839223264894, "grad_max_sv": 0.32253594174981115, "grad_min_sv": 1.506773582987675e-08, "grad_condition": 93723846.88549985, "lr": 0.000810573890139155, "time_sec": 32.602092027664185 }, { "epoch": 44, "train_loss": 0.9342586210250855, "train_acc": 0.71974, "test_loss": 2.290501368904114, "test_acc": 0.5013, "lyapunov": null, "grad_norm": 0.8096736459411619, "grad_max_sv": 0.32218324691057204, "grad_min_sv": 1.5053544679538565e-08, "grad_condition": 44430049.08800385, "lr": 0.0008022995574311873, "time_sec": 32.594489097595215 }, { "epoch": 45, "train_loss": 0.9010325805664062, "train_acc": 0.72686, "test_loss": 2.4134263542175294, "test_acc": 0.4913, "lyapunov": null, "grad_norm": 0.799116269115145, "grad_max_sv": 0.31640069633722306, "grad_min_sv": 1.5047001319934415e-08, "grad_condition": 50608547.42886399, "lr": 0.0007938926261462363, "time_sec": 32.557663917541504 }, { "epoch": 46, "train_loss": 0.8911659923553467, "train_acc": 0.73008, "test_loss": 2.2884033529281615, "test_acc": 0.5057, "lyapunov": null, "grad_norm": 0.7934582132141624, "grad_max_sv": 0.31383398175239563, "grad_min_sv": 1.4469329700584135e-08, "grad_condition": 467744144.1725038, "lr": 0.0007853567838422158, "time_sec": 32.56327676773071 }, { "epoch": 47, "train_loss": 0.8638532521438599, "train_acc": 0.73696, "test_loss": 2.2446172203063965, "test_acc": 0.5076, "lyapunov": null, "grad_norm": 0.7837979602809746, "grad_max_sv": 0.31239640712738037, "grad_min_sv": 1.4274264739655428e-08, "grad_condition": 50193793.36053495, "lr": 0.0007766957746216719, "time_sec": 32.57334923744202 }, { "epoch": 48, "train_loss": 0.8375042049598694, "train_acc": 0.74282, "test_loss": 2.227299571418762, "test_acc": 0.5202, "lyapunov": null, "grad_norm": 0.77427016194081, "grad_max_sv": 0.31100503690540793, "grad_min_sv": 1.4236399661915477e-08, "grad_condition": 50469567.486968085, "lr": 0.0007679133974894982, "time_sec": 32.569188356399536 }, { "epoch": 49, "train_loss": 0.8221629112625122, "train_acc": 0.74886, "test_loss": 2.3033808235168456, "test_acc": 0.5082, "lyapunov": null, "grad_norm": 0.7673158740604195, "grad_max_sv": 0.2993927221745253, "grad_min_sv": 1.3854600900906066e-08, "grad_condition": 304920112.4622501, "lr": 0.000759013504686565, "time_sec": 32.584622621536255 }, { "epoch": 50, "train_loss": 0.8111858353424072, "train_acc": 0.75248, "test_loss": 2.386407151031494, "test_acc": 0.5007, "lyapunov": null, "grad_norm": 0.7677657118676934, "grad_max_sv": 0.3098601832985878, "grad_min_sv": 1.3993020677935397e-08, "grad_condition": 150857500.73279318, "lr": 0.0007499999999999998, "time_sec": 32.59726119041443 }, { "epoch": 51, "train_loss": 0.8006631660461426, "train_acc": 0.7542, "test_loss": 2.322489023399353, "test_acc": 0.5061, "lyapunov": null, "grad_norm": 0.7571398534411352, "grad_max_sv": 0.3029158480465412, "grad_min_sv": 1.366701978661438e-08, "grad_condition": 1198508278.0301957, "lr": 0.0007408768370508575, "time_sec": 32.566423654556274 }, { "epoch": 52, "train_loss": 0.7743014498138427, "train_acc": 0.7611, "test_loss": 2.446239744186401, "test_acc": 0.5001, "lyapunov": null, "grad_norm": 0.7494625172701129, "grad_max_sv": 0.30184583105146884, "grad_min_sv": 1.3538439711142935e-08, "grad_condition": 454382825.5364168, "lr": 0.0007316480175599307, "time_sec": 32.606823205947876 }, { "epoch": 53, "train_loss": 0.7602159348106384, "train_acc": 0.76546, "test_loss": 2.3079547737121584, "test_acc": 0.5179, "lyapunov": null, "grad_norm": 0.743347450494438, "grad_max_sv": 0.3061353128403425, "grad_min_sv": 1.348931551216348e-08, "grad_condition": 80924083.81225905, "lr": 0.0007223175895924635, "time_sec": 32.580427408218384 }, { "epoch": 54, "train_loss": 0.7339858147239685, "train_acc": 0.77348, "test_loss": 2.388110917472839, "test_acc": 0.5122, "lyapunov": null, "grad_norm": 0.7398005246039192, "grad_max_sv": 0.2995276223868132, "grad_min_sv": 1.3313009213089532e-08, "grad_condition": 46213404.23441851, "lr": 0.0007128896457825361, "time_sec": 32.57850360870361 }, { "epoch": 55, "train_loss": 0.7361176003837585, "train_acc": 0.77096, "test_loss": 2.3849290475845337, "test_acc": 0.5096, "lyapunov": null, "grad_norm": 0.7355302680365016, "grad_max_sv": 0.2989551298320293, "grad_min_sv": 1.3770161400267037e-08, "grad_condition": 1196071659.3025665, "lr": 0.0007033683215378998, "time_sec": 32.57127046585083 }, { "epoch": 56, "train_loss": 0.7056646187782287, "train_acc": 0.78266, "test_loss": 2.5353955261230467, "test_acc": 0.5094, "lyapunov": null, "grad_norm": 0.7263545559812212, "grad_max_sv": 0.29214551076292994, "grad_min_sv": 1.2961420287754821e-08, "grad_condition": 55296196.635770574, "lr": 0.0006937577932260512, "time_sec": 32.6073100566864 }, { "epoch": 57, "train_loss": 0.6901627484321594, "train_acc": 0.78498, "test_loss": 2.424652412033081, "test_acc": 0.515, "lyapunov": null, "grad_norm": 0.7255525918000217, "grad_max_sv": 0.2947526901960373, "grad_min_sv": 1.3273521161719094e-08, "grad_condition": 81805484.33683524, "lr": 0.0006840622763423388, "time_sec": 32.587172746658325 }, { "epoch": 58, "train_loss": 0.6748793490219116, "train_acc": 0.79032, "test_loss": 2.4186749195098876, "test_acc": 0.5152, "lyapunov": null, "grad_norm": 0.7152761560999475, "grad_max_sv": 0.2920954205095768, "grad_min_sv": 1.3006854693124736e-08, "grad_condition": 92386117.68065517, "lr": 0.0006742860236609073, "time_sec": 32.59625577926636 }, { "epoch": 59, "train_loss": 0.6585909474945069, "train_acc": 0.79492, "test_loss": 2.423396731376648, "test_acc": 0.5147, "lyapunov": null, "grad_norm": 0.7000734196662035, "grad_max_sv": 0.27961262725293634, "grad_min_sv": 1.2433090768732002e-08, "grad_condition": 44055598.930747576, "lr": 0.0006644333233692913, "time_sec": 32.56940460205078 }, { "epoch": 60, "train_loss": 0.6509319092178345, "train_acc": 0.7971, "test_loss": 2.4439749031066893, "test_acc": 0.5172, "lyapunov": null, "grad_norm": 0.7014808778975755, "grad_max_sv": 0.279667991027236, "grad_min_sv": 1.213204634045728e-08, "grad_condition": 71422713.53211066, "lr": 0.0006545084971874734, "time_sec": 32.592474699020386 }, { "epoch": 61, "train_loss": 0.6274669117927552, "train_acc": 0.80326, "test_loss": 2.6459867664337158, "test_acc": 0.4988, "lyapunov": null, "grad_norm": 0.6875040317915668, "grad_max_sv": 0.2785758938640356, "grad_min_sv": 1.2619559043233753e-08, "grad_condition": 171857029.8323717, "lr": 0.0006445158984722354, "time_sec": 32.630576610565186 }, { "epoch": 62, "train_loss": 0.6170748471164703, "train_acc": 0.80476, "test_loss": 2.5383020797729494, "test_acc": 0.507, "lyapunov": null, "grad_norm": 0.6898214493116677, "grad_max_sv": 0.27117876932024954, "grad_min_sv": 1.216634772142032e-08, "grad_condition": 368391230.9870256, "lr": 0.0006344599103076324, "time_sec": 32.61634922027588 }, { "epoch": 63, "train_loss": 0.6143111569595336, "train_acc": 0.80454, "test_loss": 2.4434647581100464, "test_acc": 0.5183, "lyapunov": null, "grad_norm": 0.6875312632959335, "grad_max_sv": 0.28126552477478983, "grad_min_sv": 1.246990521854962e-08, "grad_condition": 798988222.1191355, "lr": 0.0006243449435824269, "time_sec": 32.61603879928589 }, { "epoch": 64, "train_loss": 0.593730930519104, "train_acc": 0.81294, "test_loss": 2.4702172830581666, "test_acc": 0.5204, "lyapunov": null, "grad_norm": 0.6805278132405531, "grad_max_sv": 0.27184186428785323, "grad_min_sv": 1.2160773926804362e-08, "grad_condition": 897317916.9202541, "lr": 0.0006141754350553275, "time_sec": 32.62076783180237 }, { "epoch": 65, "train_loss": 0.5915982696533203, "train_acc": 0.81346, "test_loss": 2.5983056301116942, "test_acc": 0.5091, "lyapunov": null, "grad_norm": 0.6786733542651691, "grad_max_sv": 0.2730319045484066, "grad_min_sv": 1.195807074368116e-08, "grad_condition": 100225768.74912949, "lr": 0.0006039558454088793, "time_sec": 32.57223296165466 }, { "epoch": 66, "train_loss": 0.5778841704368591, "train_acc": 0.8164, "test_loss": 2.5375493215560914, "test_acc": 0.5166, "lyapunov": null, "grad_norm": 0.6661254148265577, "grad_max_sv": 0.27218331433832643, "grad_min_sv": 1.21305288360192e-08, "grad_condition": 409516154.47474587, "lr": 0.000593690657292862, "time_sec": 32.60103678703308 }, { "epoch": 67, "train_loss": 0.5534152274894715, "train_acc": 0.82388, "test_loss": 2.525739343261719, "test_acc": 0.5172, "lyapunov": null, "grad_norm": 0.66286867140097, "grad_max_sv": 0.27192877791821957, "grad_min_sv": 1.1918128833138253e-08, "grad_condition": 43219144.55143875, "lr": 0.0005833843733580507, "time_sec": 32.570470571517944 }, { "epoch": 68, "train_loss": 0.5373673023986817, "train_acc": 0.82976, "test_loss": 2.5977006465911865, "test_acc": 0.517, "lyapunov": null, "grad_norm": 0.6509079409235867, "grad_max_sv": 0.26122898012399676, "grad_min_sv": 1.1391138144897784e-08, "grad_condition": 68515123.47894785, "lr": 0.0005730415142812054, "time_sec": 32.60091519355774 }, { "epoch": 69, "train_loss": 0.5234087624740601, "train_acc": 0.83328, "test_loss": 2.5398946479797364, "test_acc": 0.5195, "lyapunov": null, "grad_norm": 0.6514320709102108, "grad_max_sv": 0.2681581676006317, "grad_min_sv": 1.1655683266427116e-08, "grad_condition": 706218189.6988381, "lr": 0.0005626666167821517, "time_sec": 32.60088515281677 }, { "epoch": 70, "train_loss": 0.5105544789123535, "train_acc": 0.83858, "test_loss": 2.6386670696258543, "test_acc": 0.5124, "lyapunov": null, "grad_norm": 0.6433463540817135, "grad_max_sv": 0.2647452913224697, "grad_min_sv": 1.1366260942169416e-08, "grad_condition": 65156065.92607037, "lr": 0.0005522642316338265, "time_sec": 32.64759874343872 }, { "epoch": 71, "train_loss": 0.5010787317276001, "train_acc": 0.83912, "test_loss": 2.6461667497634886, "test_acc": 0.5113, "lyapunov": null, "grad_norm": 0.6437656983932116, "grad_max_sv": 0.27069182582199575, "grad_min_sv": 1.1655098845937683e-08, "grad_condition": 152350561.59014112, "lr": 0.0005418389216661573, "time_sec": 32.59350061416626 }, { "epoch": 72, "train_loss": 0.48393970026969907, "train_acc": 0.84504, "test_loss": 2.714662640762329, "test_acc": 0.5138, "lyapunov": null, "grad_norm": 0.6380630437719501, "grad_max_sv": 0.2641098305583, "grad_min_sv": 1.1268197760809507e-08, "grad_condition": 120257137.75772035, "lr": 0.0005313952597646563, "time_sec": 32.596872329711914 }, { "epoch": 73, "train_loss": 0.48754292858123777, "train_acc": 0.84344, "test_loss": 2.7237933948516844, "test_acc": 0.5121, "lyapunov": null, "grad_norm": 0.6383299877925953, "grad_max_sv": 0.26338610500097276, "grad_min_sv": 1.1300838716199468e-08, "grad_condition": 111884472.4678097, "lr": 0.0005209378268645994, "time_sec": 32.5793662071228 }, { "epoch": 74, "train_loss": 0.47278374366760256, "train_acc": 0.84774, "test_loss": 2.6715963176727295, "test_acc": 0.5175, "lyapunov": null, "grad_norm": 0.6274777670934027, "grad_max_sv": 0.2674501951783895, "grad_min_sv": 1.1504576969084777e-08, "grad_condition": 1355085877.4304867, "lr": 0.0005104712099416781, "time_sec": 32.57535362243652 }, { "epoch": 75, "train_loss": 0.46160235664367677, "train_acc": 0.8514, "test_loss": 2.648087367248535, "test_acc": 0.5256, "lyapunov": null, "grad_norm": 0.6267372816019459, "grad_max_sv": 0.2574677299708128, "grad_min_sv": 1.0966666171572172e-08, "grad_condition": 334727656.01781523, "lr": 0.0004999999999999996, "time_sec": 32.610466957092285 }, { "epoch": 76, "train_loss": 0.4535921633911133, "train_acc": 0.85614, "test_loss": 2.6602814262390138, "test_acc": 0.523, "lyapunov": null, "grad_norm": 0.6107123792245788, "grad_max_sv": 0.2529071237891912, "grad_min_sv": 1.1059093659587793e-08, "grad_condition": 120836694.63569286, "lr": 0.0004895287900583212, "time_sec": 32.60012149810791 }, { "epoch": 77, "train_loss": 0.4353150751876831, "train_acc": 0.85868, "test_loss": 2.704223956680298, "test_acc": 0.515, "lyapunov": null, "grad_norm": 0.6089035015325723, "grad_max_sv": 0.26519037671387197, "grad_min_sv": 1.1131827913862629e-08, "grad_condition": 731888345.2288473, "lr": 0.0004790621731353997, "time_sec": 32.5684015750885 }, { "epoch": 78, "train_loss": 0.4266960339736938, "train_acc": 0.86162, "test_loss": 2.621325074005127, "test_acc": 0.5293, "lyapunov": null, "grad_norm": 0.6005077005692222, "grad_max_sv": 0.24986533373594283, "grad_min_sv": 1.066437155744851e-08, "grad_condition": 323621690.1204275, "lr": 0.000468604740235343, "time_sec": 32.593501567840576 }, { "epoch": 79, "train_loss": 0.40983675064086916, "train_acc": 0.86828, "test_loss": 2.654561376953125, "test_acc": 0.5278, "lyapunov": null, "grad_norm": 0.5926958478419567, "grad_max_sv": 0.253178546205163, "grad_min_sv": 1.0804884827174745e-08, "grad_condition": 432601908.1535362, "lr": 0.00045816107833384175, "time_sec": 32.603999376297 }, { "epoch": 80, "train_loss": 0.4048340177345276, "train_acc": 0.86952, "test_loss": 2.7457454587936403, "test_acc": 0.5169, "lyapunov": null, "grad_norm": 0.5908548576457587, "grad_max_sv": 0.25038131698966026, "grad_min_sv": 1.0512154793168581e-08, "grad_condition": 130905588.43349023, "lr": 0.0004477357683661729, "time_sec": 32.603445053100586 }, { "epoch": 81, "train_loss": 0.3956010137653351, "train_acc": 0.87362, "test_loss": 2.6873944789886473, "test_acc": 0.5209, "lyapunov": null, "grad_norm": 0.584388729391549, "grad_max_sv": 0.24884492233395578, "grad_min_sv": 1.0513768951801727e-08, "grad_condition": 247213360.42633313, "lr": 0.00043733338321784746, "time_sec": 32.59891176223755 }, { "epoch": 82, "train_loss": 0.39998871772766115, "train_acc": 0.87126, "test_loss": 2.7860556625366213, "test_acc": 0.5159, "lyapunov": null, "grad_norm": 0.5914248649657466, "grad_max_sv": 0.2658348709344864, "grad_min_sv": 1.082797196690511e-08, "grad_condition": 1133342480.7967758, "lr": 0.0004269584857187939, "time_sec": 32.59586429595947 }, { "epoch": 83, "train_loss": 0.3816492418861389, "train_acc": 0.877, "test_loss": 2.7754603567123413, "test_acc": 0.5172, "lyapunov": null, "grad_norm": 0.5821106701045357, "grad_max_sv": 0.2504717506468296, "grad_min_sv": 1.0313228220211468e-08, "grad_condition": 79983143.9616401, "lr": 0.0004166156266419484, "time_sec": 32.61333727836609 }, { "epoch": 84, "train_loss": 0.3718857811355591, "train_acc": 0.88052, "test_loss": 2.711159196472168, "test_acc": 0.5308, "lyapunov": null, "grad_norm": 0.5753178111464781, "grad_max_sv": 0.24524039030075073, "grad_min_sv": 1.0231703595139919e-08, "grad_condition": 185067792.66451305, "lr": 0.0004063093427071373, "time_sec": 32.58551812171936 }, { "epoch": 85, "train_loss": 0.3627623717498779, "train_acc": 0.8827, "test_loss": 2.7379925659179687, "test_acc": 0.5259, "lyapunov": null, "grad_norm": 0.5629491927418928, "grad_max_sv": 0.24136969707906247, "grad_min_sv": 9.91763398714568e-09, "grad_condition": 152636209.94255581, "lr": 0.0003960441545911199, "time_sec": 32.603590965270996 }, { "epoch": 86, "train_loss": 0.346252275390625, "train_acc": 0.88882, "test_loss": 2.766578482246399, "test_acc": 0.5312, "lyapunov": null, "grad_norm": 0.5515259268132012, "grad_max_sv": 0.24355790987610818, "grad_min_sv": 1.0009752546454032e-08, "grad_condition": 97406517.6245994, "lr": 0.0003858245649446718, "time_sec": 32.584232807159424 }, { "epoch": 87, "train_loss": 0.34051946352005, "train_acc": 0.89098, "test_loss": 2.779722568702698, "test_acc": 0.528, "lyapunov": null, "grad_norm": 0.5519101007375313, "grad_max_sv": 0.24400133974850177, "grad_min_sv": 9.877336406855648e-09, "grad_condition": 712710697.5623571, "lr": 0.00037565505641757235, "time_sec": 32.6142373085022 }, { "epoch": 88, "train_loss": 0.33136254326820375, "train_acc": 0.89032, "test_loss": 2.719365368270874, "test_acc": 0.535, "lyapunov": null, "grad_norm": 0.5511773242388698, "grad_max_sv": 0.23767127953469752, "grad_min_sv": 9.902577505389865e-09, "grad_condition": 127351733.7757211, "lr": 0.00036554008969236695, "time_sec": 32.62907528877258 }, { "epoch": 89, "train_loss": 0.32775797492980957, "train_acc": 0.89324, "test_loss": 2.790045444488525, "test_acc": 0.5299, "lyapunov": null, "grad_norm": 0.5479128041042186, "grad_max_sv": 0.2417389802634716, "grad_min_sv": 9.801050153543031e-09, "grad_condition": 342834303.4129317, "lr": 0.0003554841015277638, "time_sec": 32.58039617538452 }, { "epoch": 90, "train_loss": 0.32945220873832703, "train_acc": 0.8918, "test_loss": 2.922000147628784, "test_acc": 0.5182, "lyapunov": null, "grad_norm": 0.5550461625192047, "grad_max_sv": 0.24011647067964076, "grad_min_sv": 9.800379771726567e-09, "grad_condition": 1256581334.5865822, "lr": 0.000345491502812526, "time_sec": 32.59003448486328 }, { "epoch": 91, "train_loss": 0.3192555838537216, "train_acc": 0.89716, "test_loss": 2.8951302070617677, "test_acc": 0.5263, "lyapunov": null, "grad_norm": 0.5399705873184968, "grad_max_sv": 0.2398311447352171, "grad_min_sv": 9.757036307719846e-09, "grad_condition": 127427759.95651396, "lr": 0.0003355666766307081, "time_sec": 32.6045126914978 }, { "epoch": 92, "train_loss": 0.3078860513591766, "train_acc": 0.90134, "test_loss": 2.8668867027282716, "test_acc": 0.5242, "lyapunov": null, "grad_norm": 0.529771320174461, "grad_max_sv": 0.24304427802562714, "grad_min_sv": 9.90028982024438e-09, "grad_condition": 134692222.21263316, "lr": 0.00032571397633909225, "time_sec": 32.59454321861267 }, { "epoch": 93, "train_loss": 0.2954711162376404, "train_acc": 0.90374, "test_loss": 2.8291058578491213, "test_acc": 0.5338, "lyapunov": null, "grad_norm": 0.5270179348539408, "grad_max_sv": 0.23493569679558277, "grad_min_sv": 9.681322873239529e-09, "grad_condition": 154310830.71851045, "lr": 0.00031593772365766094, "time_sec": 32.637152433395386 }, { "epoch": 94, "train_loss": 0.29190866079330446, "train_acc": 0.90516, "test_loss": 2.8675409421920777, "test_acc": 0.5267, "lyapunov": null, "grad_norm": 0.5236741934845208, "grad_max_sv": 0.23337335288524627, "grad_min_sv": 9.406507730548574e-09, "grad_condition": 172022555.775852, "lr": 0.0003062422067739483, "time_sec": 32.615885496139526 }, { "epoch": 95, "train_loss": 0.2843532346916199, "train_acc": 0.90826, "test_loss": 2.9124584104537963, "test_acc": 0.5294, "lyapunov": null, "grad_norm": 0.5141183140073359, "grad_max_sv": 0.22986465878784657, "grad_min_sv": 9.210905181113172e-09, "grad_condition": 336375534.72882974, "lr": 0.00029663167846209965, "time_sec": 32.62099742889404 }, { "epoch": 96, "train_loss": 0.28095845563411714, "train_acc": 0.90888, "test_loss": 2.9585642152786256, "test_acc": 0.5188, "lyapunov": null, "grad_norm": 0.5209337851609864, "grad_max_sv": 0.24165461957454681, "grad_min_sv": 9.822391551029056e-09, "grad_condition": 3734850942.353486, "lr": 0.00028711035421746345, "time_sec": 32.606362104415894 }, { "epoch": 97, "train_loss": 0.270245605134964, "train_acc": 0.91376, "test_loss": 2.8790921213150025, "test_acc": 0.535, "lyapunov": null, "grad_norm": 0.5018050404070028, "grad_max_sv": 0.2287111472338438, "grad_min_sv": 9.100506417479732e-09, "grad_condition": 1286046088.0897596, "lr": 0.00027768241040753615, "time_sec": 32.605376958847046 }, { "epoch": 98, "train_loss": 0.26737561470508575, "train_acc": 0.91348, "test_loss": 2.9673530891418456, "test_acc": 0.52, "lyapunov": null, "grad_norm": 0.5026625596288345, "grad_max_sv": 0.22773091793060302, "grad_min_sv": 9.130605362089221e-09, "grad_condition": 2561536325.8505445, "lr": 0.00026835198244006903, "time_sec": 32.61582803726196 }, { "epoch": 99, "train_loss": 0.25649453671455386, "train_acc": 0.91706, "test_loss": 2.960128957557678, "test_acc": 0.5285, "lyapunov": null, "grad_norm": 0.4959587348752051, "grad_max_sv": 0.22662512063980103, "grad_min_sv": 9.021708526762983e-09, "grad_condition": 2170055259.576285, "lr": 0.0002591231629491421, "time_sec": 32.59518361091614 }, { "epoch": 100, "train_loss": 0.25298852029800417, "train_acc": 0.91614, "test_loss": 2.999088920211792, "test_acc": 0.5213, "lyapunov": null, "grad_norm": 0.49694281512357663, "grad_max_sv": 0.2285677995532751, "grad_min_sv": 9.117687981181898e-09, "grad_condition": 153385408.53154242, "lr": 0.0002499999999999997, "time_sec": 32.60006618499756 }, { "epoch": 101, "train_loss": 0.24837311635971068, "train_acc": 0.92042, "test_loss": 2.9769588521957395, "test_acc": 0.527, "lyapunov": null, "grad_norm": 0.49156384156747235, "grad_max_sv": 0.23404922261834143, "grad_min_sv": 9.245040229915492e-09, "grad_condition": 730777146.0902932, "lr": 0.00024098649531343477, "time_sec": 32.58926057815552 }, { "epoch": 102, "train_loss": 0.24679850215435029, "train_acc": 0.91974, "test_loss": 2.983294668197632, "test_acc": 0.5239, "lyapunov": null, "grad_norm": 0.4891194067973055, "grad_max_sv": 0.22282884679734707, "grad_min_sv": 8.780173748647313e-09, "grad_condition": 157121553.36478597, "lr": 0.0002320866025105016, "time_sec": 32.61522173881531 }, { "epoch": 103, "train_loss": 0.235624645652771, "train_acc": 0.9236, "test_loss": 2.97529112701416, "test_acc": 0.5278, "lyapunov": null, "grad_norm": 0.47526538494931814, "grad_max_sv": 0.2206702034920454, "grad_min_sv": 8.61680920262453e-09, "grad_condition": 145823760.67239988, "lr": 0.0002233042253783278, "time_sec": 32.67024850845337 }, { "epoch": 104, "train_loss": 0.23265846648216248, "train_acc": 0.92502, "test_loss": 2.9763864707946777, "test_acc": 0.5263, "lyapunov": null, "grad_norm": 0.47725567627138915, "grad_max_sv": 0.22133470103144645, "grad_min_sv": 8.68051782312168e-09, "grad_condition": 267574471.67175755, "lr": 0.000214643216157784, "time_sec": 32.611361265182495 }, { "epoch": 105, "train_loss": 0.22897292974472047, "train_acc": 0.92568, "test_loss": 3.0474896495819093, "test_acc": 0.5212, "lyapunov": null, "grad_norm": 0.4764754544051647, "grad_max_sv": 0.22653804197907448, "grad_min_sv": 8.760947359104918e-09, "grad_condition": 3219418687.447474, "lr": 0.00020610737385376332, "time_sec": 32.5970995426178 }, { "epoch": 106, "train_loss": 0.22509269979476929, "train_acc": 0.9271, "test_loss": 2.9895481927871703, "test_acc": 0.5276, "lyapunov": null, "grad_norm": 0.47179914735427825, "grad_max_sv": 0.22902226410806178, "grad_min_sv": 8.651995134743851e-09, "grad_condition": 188321170.63109916, "lr": 0.00019770044256881242, "time_sec": 32.61952805519104 }, { "epoch": 107, "train_loss": 0.22124877912521362, "train_acc": 0.92918, "test_loss": 2.9869052186965943, "test_acc": 0.5261, "lyapunov": null, "grad_norm": 0.4676814721095271, "grad_max_sv": 0.23612426966428757, "grad_min_sv": 8.830977354858538e-09, "grad_condition": 1324097462.1438193, "lr": 0.0001894261098608447, "time_sec": 32.63655757904053 }, { "epoch": 108, "train_loss": 0.2119530977487564, "train_acc": 0.93214, "test_loss": 2.957085295295715, "test_acc": 0.5283, "lyapunov": null, "grad_norm": 0.4597233192330978, "grad_max_sv": 0.21893165111541749, "grad_min_sv": 8.44588889763187e-09, "grad_condition": 325299909.8181821, "lr": 0.000181288005125655, "time_sec": 32.6324462890625 }, { "epoch": 109, "train_loss": 0.2096145883345604, "train_acc": 0.93168, "test_loss": 3.0633232662200927, "test_acc": 0.5232, "lyapunov": null, "grad_norm": 0.46012619309211217, "grad_max_sv": 0.21432300768792628, "grad_min_sv": 8.437937682305527e-09, "grad_condition": 912797689.183795, "lr": 0.0001732896980049473, "time_sec": 32.59154772758484 }, { "epoch": 110, "train_loss": 0.20650233900070192, "train_acc": 0.9334, "test_loss": 3.0124371912002563, "test_acc": 0.5288, "lyapunov": null, "grad_norm": 0.45267852009677, "grad_max_sv": 0.2197608083486557, "grad_min_sv": 8.136439059915762e-09, "grad_condition": 214553728.36221018, "lr": 0.00016543469682057076, "time_sec": 32.58715891838074 }, { "epoch": 111, "train_loss": 0.202456818523407, "train_acc": 0.93476, "test_loss": 2.953989649581909, "test_acc": 0.5364, "lyapunov": null, "grad_norm": 0.44877046173685803, "grad_max_sv": 0.2101663440465927, "grad_min_sv": 8.111785431298008e-09, "grad_condition": 181357744.46055207, "lr": 0.00015772644703565552, "time_sec": 32.61166739463806 }, { "epoch": 112, "train_loss": 0.19417572572231293, "train_acc": 0.93836, "test_loss": 3.0636728370666506, "test_acc": 0.5294, "lyapunov": null, "grad_norm": 0.44228389201963325, "grad_max_sv": 0.2184779081493616, "grad_min_sv": 8.052494614532204e-09, "grad_condition": 701685099.8537222, "lr": 0.00015016832974331713, "time_sec": 32.61799240112305 }, { "epoch": 113, "train_loss": 0.1894145729970932, "train_acc": 0.93984, "test_loss": 2.981136636924744, "test_acc": 0.5323, "lyapunov": null, "grad_norm": 0.4358812319975278, "grad_max_sv": 0.20872662551701068, "grad_min_sv": 7.95152020114211e-09, "grad_condition": 1423865321.2329361, "lr": 0.00014276366018359834, "time_sec": 32.6167311668396 }, { "epoch": 114, "train_loss": 0.18947952261924744, "train_acc": 0.9398, "test_loss": 3.0828820104598997, "test_acc": 0.5292, "lyapunov": null, "grad_norm": 0.43739466792043646, "grad_max_sv": 0.2058663982897997, "grad_min_sv": 7.741768523156016e-09, "grad_condition": 7243536793.4379, "lr": 0.00013551568628929425, "time_sec": 32.59801626205444 }, { "epoch": 115, "train_loss": 0.1862397237443924, "train_acc": 0.94078, "test_loss": 2.9763780981063843, "test_acc": 0.538, "lyapunov": null, "grad_norm": 0.43528746000323826, "grad_max_sv": 0.20504732690751554, "grad_min_sv": 8.141562394137907e-09, "grad_condition": 139509610.14712492, "lr": 0.00012842758726130276, "time_sec": 32.612173080444336 }, { "epoch": 116, "train_loss": 0.17998726233482362, "train_acc": 0.9426, "test_loss": 3.0221671098709106, "test_acc": 0.5357, "lyapunov": null, "grad_norm": 0.4288718122641706, "grad_max_sv": 0.2140086382627487, "grad_min_sv": 7.976556949608644e-09, "grad_condition": 784872577.917934, "lr": 0.0001215024721741218, "time_sec": 32.63769769668579 }, { "epoch": 117, "train_loss": 0.17653137303352356, "train_acc": 0.94314, "test_loss": 3.0061340055465697, "test_acc": 0.5323, "lyapunov": null, "grad_norm": 0.4236151447378006, "grad_max_sv": 0.20592431761324406, "grad_min_sv": 7.804582891849515e-09, "grad_condition": 232091482.5503703, "lr": 0.00011474337861210538, "time_sec": 32.63769888877869 }, { "epoch": 118, "train_loss": 0.18115964114189148, "train_acc": 0.94264, "test_loss": 2.9955945150375367, "test_acc": 0.5394, "lyapunov": null, "grad_norm": 0.43031955217275497, "grad_max_sv": 0.21836008243262767, "grad_min_sv": 7.966632081498128e-09, "grad_condition": 338791411.5737727, "lr": 0.00010815327133708009, "time_sec": 32.59054613113403 }, { "epoch": 119, "train_loss": 0.1751684021663666, "train_acc": 0.94342, "test_loss": 3.0028031162261963, "test_acc": 0.5344, "lyapunov": null, "grad_norm": 0.4234025902326238, "grad_max_sv": 0.2052937986329198, "grad_min_sv": 7.743973756604156e-09, "grad_condition": 205737178.47096592, "lr": 0.00010173504098790182, "time_sec": 32.63575482368469 }, { "epoch": 120, "train_loss": 0.17288655778884887, "train_acc": 0.9449, "test_loss": 3.026424203681946, "test_acc": 0.5381, "lyapunov": null, "grad_norm": 0.41773026543709724, "grad_max_sv": 0.2095510721206665, "grad_min_sv": 7.937595827254033e-09, "grad_condition": 6330317379.225478, "lr": 9.549150281252629e-05, "time_sec": 32.587223052978516 }, { "epoch": 121, "train_loss": 0.17101951307296753, "train_acc": 0.94462, "test_loss": 3.165215256309509, "test_acc": 0.5219, "lyapunov": null, "grad_norm": 0.42195608937670603, "grad_max_sv": 0.20825999304652215, "grad_min_sv": 7.99512678009099e-09, "grad_condition": 653203712.6193202, "lr": 8.942539543314794e-05, "time_sec": 32.596564531326294 }, { "epoch": 122, "train_loss": 0.1693978008031845, "train_acc": 0.94588, "test_loss": 3.0062981233596804, "test_acc": 0.5348, "lyapunov": null, "grad_norm": 0.41591242620468016, "grad_max_sv": 0.2059656113386154, "grad_min_sv": 7.704039686772836e-09, "grad_condition": 1004445609.8434451, "lr": 8.353937964495024e-05, "time_sec": 32.61800956726074 }, { "epoch": 123, "train_loss": 0.16728713005065918, "train_acc": 0.94756, "test_loss": 3.1665957611083986, "test_acc": 0.5246, "lyapunov": null, "grad_norm": 0.41526238625867323, "grad_max_sv": 0.20129744820296763, "grad_min_sv": 7.569636380905243e-09, "grad_condition": 407190475.77847266, "lr": 7.783603724899243e-05, "time_sec": 32.61078882217407 }, { "epoch": 124, "train_loss": 0.1635257438659668, "train_acc": 0.94798, "test_loss": 3.1016404109954836, "test_acc": 0.5367, "lyapunov": null, "grad_norm": 0.4079868295136817, "grad_max_sv": 0.20866212155669928, "grad_min_sv": 7.864988894011604e-09, "grad_condition": 294549971.18264663, "lr": 7.231786991974666e-05, "time_sec": 32.627676486968994 }, { "epoch": 125, "train_loss": 0.1641435864830017, "train_acc": 0.94756, "test_loss": 3.0870759466171265, "test_acc": 0.5259, "lyapunov": null, "grad_norm": 0.4108898930410538, "grad_max_sv": 0.21254582721740006, "grad_min_sv": 7.773244741892532e-09, "grad_condition": 192549384.92611116, "lr": 6.698729810778072e-05, "time_sec": 32.60348701477051 }, { "epoch": 126, "train_loss": 0.15524960072517396, "train_acc": 0.95126, "test_loss": 3.106667465209961, "test_acc": 0.5253, "lyapunov": null, "grad_norm": 0.39708975035952015, "grad_max_sv": 0.20546648390591143, "grad_min_sv": 7.524984951411303e-09, "grad_condition": 594241717.5398318, "lr": 6.184665997806817e-05, "time_sec": 32.62395262718201 }, { "epoch": 127, "train_loss": 0.16405641248226166, "train_acc": 0.94786, "test_loss": 3.0382690155029297, "test_acc": 0.5344, "lyapunov": null, "grad_norm": 0.41136197829373494, "grad_max_sv": 0.20878486707806587, "grad_min_sv": 7.634084871223142e-09, "grad_condition": 4480646318.175786, "lr": 5.6898210384392595e-05, "time_sec": 32.58641195297241 }, { "epoch": 128, "train_loss": 0.15556303625106813, "train_acc": 0.95, "test_loss": 3.0696772289276124, "test_acc": 0.5291, "lyapunov": null, "grad_norm": 0.399629179039621, "grad_max_sv": 0.19112058784812688, "grad_min_sv": 7.558967303998576e-09, "grad_condition": 130958494.19530413, "lr": 5.214411988029363e-05, "time_sec": 32.6273717880249 }, { "epoch": 129, "train_loss": 0.15622675662994384, "train_acc": 0.94962, "test_loss": 3.0737016366958616, "test_acc": 0.53, "lyapunov": null, "grad_norm": 0.4021852855426899, "grad_max_sv": 0.20368068106472492, "grad_min_sv": 7.91968607510862e-09, "grad_condition": 4092034646.124222, "lr": 4.7586473766990294e-05, "time_sec": 32.61072516441345 }, { "epoch": 130, "train_loss": 0.15069342103004454, "train_acc": 0.95206, "test_loss": 3.138083388710022, "test_acc": 0.5303, "lyapunov": null, "grad_norm": 0.3967446109539621, "grad_max_sv": 0.20565238259732724, "grad_min_sv": 7.903937278850096e-09, "grad_condition": 403356372.5201774, "lr": 4.32272711786996e-05, "time_sec": 32.60817766189575 }, { "epoch": 131, "train_loss": 0.1475225008201599, "train_acc": 0.95388, "test_loss": 3.097823154640198, "test_acc": 0.5262, "lyapunov": null, "grad_norm": 0.3911645556854745, "grad_max_sv": 0.2029418082907796, "grad_min_sv": 7.451206509700297e-09, "grad_condition": 184512637.53159684, "lr": 3.906842420574966e-05, "time_sec": 32.620972633361816 }, { "epoch": 132, "train_loss": 0.14910545247793197, "train_acc": 0.95376, "test_loss": 3.1958837438583374, "test_acc": 0.5255, "lyapunov": null, "grad_norm": 0.39312251468793336, "grad_max_sv": 0.19356854669749737, "grad_min_sv": 7.3685526407948895e-09, "grad_condition": 474360013.88184536, "lr": 3.5111757055874305e-05, "time_sec": 32.62202000617981 }, { "epoch": 133, "train_loss": 0.14772581936836243, "train_acc": 0.95306, "test_loss": 3.1449778295516966, "test_acc": 0.528, "lyapunov": null, "grad_norm": 0.39083628600782144, "grad_max_sv": 0.18662805538624525, "grad_min_sv": 7.411569982176611e-09, "grad_condition": 590179948.2869803, "lr": 3.1359005254054254e-05, "time_sec": 32.62527775764465 }, { "epoch": 134, "train_loss": 0.1473908689570427, "train_acc": 0.95432, "test_loss": 3.060500933647156, "test_acc": 0.532, "lyapunov": null, "grad_norm": 0.39321527574531456, "grad_max_sv": 0.1960258588194847, "grad_min_sv": 7.530598097665528e-09, "grad_condition": 690149093.5169044, "lr": 2.7811814881259484e-05, "time_sec": 32.611403942108154 }, { "epoch": 135, "train_loss": 0.1489419222688675, "train_acc": 0.95216, "test_loss": 3.0586274435043337, "test_acc": 0.5333, "lyapunov": null, "grad_norm": 0.3951339678077363, "grad_max_sv": 0.19855166971683502, "grad_min_sv": 7.4231230849652885e-09, "grad_condition": 338026036.5432772, "lr": 2.4471741852423218e-05, "time_sec": 32.57758116722107 }, { "epoch": 136, "train_loss": 0.1439458827161789, "train_acc": 0.9552, "test_loss": 3.1572901706695555, "test_acc": 0.5268, "lyapunov": null, "grad_norm": 0.38505775133385556, "grad_max_sv": 0.20576392244547606, "grad_min_sv": 7.578524123253968e-09, "grad_condition": 2346058745.0245013, "lr": 2.1340251233966362e-05, "time_sec": 32.60840678215027 }, { "epoch": 137, "train_loss": 0.14263056889772416, "train_acc": 0.95558, "test_loss": 3.0500190071105955, "test_acc": 0.5343, "lyapunov": null, "grad_norm": 0.38315618240250937, "grad_max_sv": 0.19492608066648245, "grad_min_sv": 7.437362629664907e-09, "grad_condition": 445968074.97881687, "lr": 1.8418716601170932e-05, "time_sec": 32.5784227848053 }, { "epoch": 138, "train_loss": 0.14197950773239135, "train_acc": 0.95516, "test_loss": 3.054612173843384, "test_acc": 0.5379, "lyapunov": null, "grad_norm": 0.3842449580292686, "grad_max_sv": 0.20386305153369905, "grad_min_sv": 7.256548800879062e-09, "grad_condition": 4009126006.180674, "lr": 1.570841943568445e-05, "time_sec": 32.58382248878479 }, { "epoch": 139, "train_loss": 0.14526520327091216, "train_acc": 0.95412, "test_loss": 3.0950862688064573, "test_acc": 0.5323, "lyapunov": null, "grad_norm": 0.38739146310202444, "grad_max_sv": 0.19300882443785666, "grad_min_sv": 7.3080626628160495e-09, "grad_condition": 1317753085.472504, "lr": 1.3210548563419845e-05, "time_sec": 32.599539041519165 }, { "epoch": 140, "train_loss": 0.14277389855384826, "train_acc": 0.9551, "test_loss": 3.0536239072799685, "test_acc": 0.5334, "lyapunov": null, "grad_norm": 0.3812502385842012, "grad_max_sv": 0.2037056451663375, "grad_min_sv": 7.302020117101499e-09, "grad_condition": 4685216825.833342, "lr": 1.0926199633097203e-05, "time_sec": 32.60143446922302 }, { "epoch": 141, "train_loss": 0.14106001211643218, "train_acc": 0.95592, "test_loss": 3.0723882249832153, "test_acc": 0.5322, "lyapunov": null, "grad_norm": 0.38539484766071236, "grad_max_sv": 0.19134777113795282, "grad_min_sv": 7.162904132459666e-09, "grad_condition": 370718600.83184236, "lr": 8.856374635655688e-06, "time_sec": 32.604408740997314 }, { "epoch": 142, "train_loss": 0.1438280531835556, "train_acc": 0.95406, "test_loss": 3.1630526540756225, "test_acc": 0.526, "lyapunov": null, "grad_norm": 0.3885005879930968, "grad_max_sv": 0.19621171467006207, "grad_min_sv": 7.508452308209804e-09, "grad_condition": 440340049.22603464, "lr": 7.001981464747503e-06, "time_sec": 32.600708961486816 }, { "epoch": 143, "train_loss": 0.1418447697210312, "train_acc": 0.95556, "test_loss": 3.0879846578598023, "test_acc": 0.5291, "lyapunov": null, "grad_norm": 0.3836324164118778, "grad_max_sv": 0.188724672421813, "grad_min_sv": 7.507878820815078e-09, "grad_condition": 1051208641.6769501, "lr": 5.3638335185058295e-06, "time_sec": 32.61192798614502 }, { "epoch": 144, "train_loss": 0.14410037503242493, "train_acc": 0.95534, "test_loss": 3.1234459602355957, "test_acc": 0.5318, "lyapunov": null, "grad_norm": 0.38512540576239257, "grad_max_sv": 0.20008118823170662, "grad_min_sv": 7.477710552595152e-09, "grad_condition": 1216378712.8275027, "lr": 3.942649342761114e-06, "time_sec": 32.67555069923401 }, { "epoch": 145, "train_loss": 0.14076073776245118, "train_acc": 0.95618, "test_loss": 3.0669401094436646, "test_acc": 0.5376, "lyapunov": null, "grad_norm": 0.38185175053609804, "grad_max_sv": 0.19599322322756052, "grad_min_sv": 7.380410241113189e-09, "grad_condition": 248121028.65324074, "lr": 2.7390523158633524e-06, "time_sec": 32.595621824264526 }, { "epoch": 146, "train_loss": 0.14235492443561554, "train_acc": 0.95542, "test_loss": 3.1099600078582763, "test_acc": 0.5303, "lyapunov": null, "grad_norm": 0.3833756904141184, "grad_max_sv": 0.19929019846022128, "grad_min_sv": 7.511771148854818e-09, "grad_condition": 234726041.20136175, "lr": 1.7535703752478133e-06, "time_sec": 32.61228895187378 }, { "epoch": 147, "train_loss": 0.1437687619996071, "train_acc": 0.95498, "test_loss": 3.1555084846496584, "test_acc": 0.5253, "lyapunov": null, "grad_norm": 0.38692842594278615, "grad_max_sv": 0.19934902153909206, "grad_min_sv": 7.2967766568429565e-09, "grad_condition": 2247202882.6063395, "lr": 9.866357858642196e-07, "time_sec": 32.581571102142334 }, { "epoch": 148, "train_loss": 0.13997777037143708, "train_acc": 0.95636, "test_loss": 3.126287574195862, "test_acc": 0.5349, "lyapunov": null, "grad_norm": 0.37982964494822274, "grad_max_sv": 0.19688362777233123, "grad_min_sv": 7.199474146620671e-09, "grad_condition": 410986683.7547163, "lr": 4.38584950570808e-07, "time_sec": 32.614789724349976 }, { "epoch": 149, "train_loss": 0.13758307416915894, "train_acc": 0.9559, "test_loss": 3.0673478214263916, "test_acc": 0.5359, "lyapunov": null, "grad_norm": 0.37705013515223074, "grad_max_sv": 0.20387833528220653, "grad_min_sv": 7.47520324575064e-09, "grad_condition": 2818005270.75425, "lr": 1.096582625772501e-07, "time_sec": 32.597362995147705 }, { "epoch": 150, "train_loss": 0.13772287871360778, "train_acc": 0.95614, "test_loss": 3.273663801765442, "test_acc": 0.5186, "lyapunov": null, "grad_norm": 0.3790080333138129, "grad_max_sv": 0.2025493886321783, "grad_min_sv": 7.3542313326689475e-09, "grad_condition": 1465090879.8372142, "lr": 0.0, "time_sec": 32.61164855957031 } ], "12": [ { "epoch": 1, "train_loss": 4.866019581298828, "train_acc": 0.03074, "test_loss": 4.872710034179687, "test_acc": 0.0143, "lyapunov": null, "grad_norm": 5.904015758743758, "grad_max_sv": 5.3000179648399355, "grad_min_sv": 9.986983708909492e-08, "grad_condition": 75746426.03647776, "lr": 0.0009998903417374227, "time_sec": 49.65879511833191 }, { "epoch": 2, "train_loss": 4.336319505615235, "train_acc": 0.05884, "test_loss": 5.078699280548095, "test_acc": 0.0179, "lyapunov": null, "grad_norm": 4.512132309010241, "grad_max_sv": 3.9969229817390444, "grad_min_sv": 7.723465306475052e-08, "grad_condition": 99844248.01218227, "lr": 0.0009995614150494292, "time_sec": 49.67804217338562 }, { "epoch": 3, "train_loss": 4.054194154663086, "train_acc": 0.08442, "test_loss": 4.735939234924317, "test_acc": 0.0289, "lyapunov": null, "grad_norm": 3.6216238346079055, "grad_max_sv": 3.0721623718738558, "grad_min_sv": 6.332745707271492e-08, "grad_condition": 68533376.3072471, "lr": 0.0009990133642141358, "time_sec": 49.650996685028076 }, { "epoch": 4, "train_loss": 3.8553889916229247, "train_acc": 0.11068, "test_loss": 4.7776531311035155, "test_acc": 0.04, "lyapunov": null, "grad_norm": 3.0027283473808, "grad_max_sv": 2.4722895294427873, "grad_min_sv": 5.260577265187028e-08, "grad_condition": 133218192.19257763, "lr": 0.0009982464296247522, "time_sec": 49.62583518028259 }, { "epoch": 5, "train_loss": 3.6851790403747557, "train_acc": 0.13608, "test_loss": 4.847144582366943, "test_acc": 0.0436, "lyapunov": null, "grad_norm": 2.4406262601219466, "grad_max_sv": 1.8893477827310563, "grad_min_sv": 4.253873583381917e-08, "grad_condition": 53203728.717256345, "lr": 0.0009972609476841367, "time_sec": 49.64903235435486 }, { "epoch": 6, "train_loss": 3.557223811721802, "train_acc": 0.1541, "test_loss": 4.846635614776611, "test_acc": 0.0504, "lyapunov": null, "grad_norm": 1.9869329520709325, "grad_max_sv": 1.4254269927740097, "grad_min_sv": 3.4773817814137684e-08, "grad_condition": 109287419.58926606, "lr": 0.000996057350657239, "time_sec": 49.632389545440674 }, { "epoch": 7, "train_loss": 3.448442996292114, "train_acc": 0.17344, "test_loss": 5.146338744354248, "test_acc": 0.0432, "lyapunov": null, "grad_norm": 1.6934869679578504, "grad_max_sv": 1.111972664296627, "grad_min_sv": 3.0129338379758507e-08, "grad_condition": 49145502.73266151, "lr": 0.000994636166481494, "time_sec": 49.63013672828674 }, { "epoch": 8, "train_loss": 3.3602959382629396, "train_acc": 0.18858, "test_loss": 4.997173266601562, "test_acc": 0.0549, "lyapunov": null, "grad_norm": 1.4715658174689026, "grad_max_sv": 0.8646033376455307, "grad_min_sv": 2.5999903535689484e-08, "grad_condition": 38484605.38778691, "lr": 0.0009929980185352525, "time_sec": 49.63576054573059 }, { "epoch": 9, "train_loss": 3.2854549378204347, "train_acc": 0.20336, "test_loss": 5.892930588531494, "test_acc": 0.0446, "lyapunov": null, "grad_norm": 1.3451340821865851, "grad_max_sv": 0.7257503181695938, "grad_min_sv": 2.3997866654967837e-08, "grad_condition": 36951868.39671626, "lr": 0.0009911436253643444, "time_sec": 49.629499197006226 }, { "epoch": 10, "train_loss": 3.2246680919647215, "train_acc": 0.21242, "test_loss": 5.3121603576660155, "test_acc": 0.0492, "lyapunov": null, "grad_norm": 1.2440111786697226, "grad_max_sv": 0.6271802522242069, "grad_min_sv": 2.25186588764803e-08, "grad_condition": 32332715.425953984, "lr": 0.0009890738003669028, "time_sec": 49.677348613739014 }, { "epoch": 11, "train_loss": 3.1626394175720214, "train_acc": 0.22606, "test_loss": 6.13012219543457, "test_acc": 0.0509, "lyapunov": null, "grad_norm": 1.1630276076372463, "grad_max_sv": 0.5456254407763481, "grad_min_sv": 2.0650329043969684e-08, "grad_condition": 43285920.578072175, "lr": 0.00098678945143658, "time_sec": 49.63444662094116 }, { "epoch": 12, "train_loss": 3.105594987640381, "train_acc": 0.2381, "test_loss": 6.692684747314453, "test_acc": 0.0337, "lyapunov": null, "grad_norm": 1.0991523249692334, "grad_max_sv": 0.5055619306862355, "grad_min_sv": 2.044758472541375e-08, "grad_condition": 38174879.70426883, "lr": 0.0009842915805643154, "time_sec": 49.667534828186035 }, { "epoch": 13, "train_loss": 3.071034761581421, "train_acc": 0.24202, "test_loss": 6.808190565490722, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 1.0461733390262893, "grad_max_sv": 0.45393969416618346, "grad_min_sv": 1.9080661878279058e-08, "grad_condition": 26144165.717305023, "lr": 0.000981581283398829, "time_sec": 49.651849031448364 }, { "epoch": 14, "train_loss": 3.031006901779175, "train_acc": 0.25136, "test_loss": 6.8066056442260745, "test_acc": 0.0421, "lyapunov": null, "grad_norm": 1.0001345448432042, "grad_max_sv": 0.4178654387593269, "grad_min_sv": 1.817219532629366e-08, "grad_condition": 26243292.8670463, "lr": 0.0009786597487660333, "time_sec": 49.67574381828308 }, { "epoch": 15, "train_loss": 2.992844039916992, "train_acc": 0.25788, "test_loss": 6.2335087615966795, "test_acc": 0.0415, "lyapunov": null, "grad_norm": 0.9709343078677097, "grad_max_sv": 0.40159890055656433, "grad_min_sv": 1.7637466787068233e-08, "grad_condition": 31130355.004485857, "lr": 0.0009755282581475766, "time_sec": 49.648940324783325 }, { "epoch": 16, "train_loss": 2.9533546379089355, "train_acc": 0.2654, "test_loss": 6.982061653900146, "test_acc": 0.0331, "lyapunov": null, "grad_norm": 0.9294555695312433, "grad_max_sv": 0.38935905918478964, "grad_min_sv": 1.7345642956689833e-08, "grad_condition": 34633361.17032104, "lr": 0.0009721881851187403, "time_sec": 49.62569880485535 }, { "epoch": 17, "train_loss": 2.9248884143066407, "train_acc": 0.27134, "test_loss": 5.847897528839112, "test_acc": 0.0375, "lyapunov": null, "grad_norm": 0.8931744987288306, "grad_max_sv": 0.3547165349125862, "grad_min_sv": 1.6551659471827906e-08, "grad_condition": 78906912.01626787, "lr": 0.0009686409947459456, "time_sec": 49.628357887268066 }, { "epoch": 18, "train_loss": 2.896197442779541, "train_acc": 0.27548, "test_loss": 6.654647819519043, "test_acc": 0.0387, "lyapunov": null, "grad_norm": 0.8750290297759321, "grad_max_sv": 0.3526077255606651, "grad_min_sv": 1.6023472331015005e-08, "grad_condition": 266939500.3731903, "lr": 0.0009648882429441254, "time_sec": 49.64867830276489 }, { "epoch": 19, "train_loss": 2.8669221867370607, "train_acc": 0.28036, "test_loss": 5.810343419647217, "test_acc": 0.0502, "lyapunov": null, "grad_norm": 0.8587949296642396, "grad_max_sv": 0.34078171029686927, "grad_min_sv": 1.6171859118507826e-08, "grad_condition": 22947806.160383917, "lr": 0.00096093157579425, "time_sec": 49.63094878196716 }, { "epoch": 20, "train_loss": 2.82938760848999, "train_acc": 0.289, "test_loss": 5.896671797180176, "test_acc": 0.0461, "lyapunov": null, "grad_norm": 0.839027246743402, "grad_max_sv": 0.3308767855167389, "grad_min_sv": 1.570504673531481e-08, "grad_condition": 24206043.26616613, "lr": 0.0009567727288213001, "time_sec": 49.6539568901062 }, { "epoch": 21, "train_loss": 2.8006727541351317, "train_acc": 0.2938, "test_loss": 6.180831294250488, "test_acc": 0.0398, "lyapunov": null, "grad_norm": 0.8110141308366953, "grad_max_sv": 0.3095390945672989, "grad_min_sv": 1.4921404802026306e-08, "grad_condition": 34079256.769043334, "lr": 0.0009524135262330095, "time_sec": 49.64039897918701 }, { "epoch": 22, "train_loss": 2.7774745903778078, "train_acc": 0.29804, "test_loss": 6.308743616485596, "test_acc": 0.045, "lyapunov": null, "grad_norm": 0.8004103125902539, "grad_max_sv": 0.31844869926571845, "grad_min_sv": 1.5020042806734857e-08, "grad_condition": 27917630.374082875, "lr": 0.0009478558801197061, "time_sec": 49.63332271575928 }, { "epoch": 23, "train_loss": 2.7524796044921875, "train_acc": 0.30316, "test_loss": 5.521375189208984, "test_acc": 0.0535, "lyapunov": null, "grad_norm": 0.7869460876794067, "grad_max_sv": 0.292531880363822, "grad_min_sv": 1.448369401080285e-08, "grad_condition": 35029756.554903194, "lr": 0.000943101789615607, "time_sec": 49.63528370857239 }, { "epoch": 24, "train_loss": 2.7253317372131347, "train_acc": 0.3104, "test_loss": 6.1194743759155275, "test_acc": 0.0494, "lyapunov": null, "grad_norm": 0.7678368002286986, "grad_max_sv": 0.29576918072998526, "grad_min_sv": 1.4323617783529307e-08, "grad_condition": 28702466.777186085, "lr": 0.0009381533400219313, "time_sec": 49.64074897766113 }, { "epoch": 25, "train_loss": 2.7074700713348387, "train_acc": 0.31266, "test_loss": 6.289851884460449, "test_acc": 0.0462, "lyapunov": null, "grad_norm": 0.7683642905855677, "grad_max_sv": 0.2851465784013271, "grad_min_sv": 1.4292519384673242e-08, "grad_condition": 22761462.806346737, "lr": 0.0009330127018922189, "time_sec": 49.631171464920044 }, { "epoch": 26, "train_loss": 2.686272830505371, "train_acc": 0.3169, "test_loss": 6.941660729980469, "test_acc": 0.0479, "lyapunov": null, "grad_norm": 0.755488240958268, "grad_max_sv": 0.28228237964212893, "grad_min_sv": 1.4025971441233854e-08, "grad_condition": 35803882.89457456, "lr": 0.000927682130080253, "time_sec": 49.64768934249878 }, { "epoch": 27, "train_loss": 2.6507435781860353, "train_acc": 0.32476, "test_loss": 5.651136081695556, "test_acc": 0.0552, "lyapunov": null, "grad_norm": 0.7510174800021984, "grad_max_sv": 0.2705878522247076, "grad_min_sv": 1.3801869563900837e-08, "grad_condition": 24650339.234644465, "lr": 0.0009221639627510072, "time_sec": 49.63985729217529 }, { "epoch": 28, "train_loss": 2.6402551649475097, "train_acc": 0.32708, "test_loss": 6.290144860839844, "test_acc": 0.042, "lyapunov": null, "grad_norm": 0.7327305496870947, "grad_max_sv": 0.26595143899321555, "grad_min_sv": 1.3485531080714708e-08, "grad_condition": 24838092.070290618, "lr": 0.0009164606203550494, "time_sec": 49.668391704559326 }, { "epoch": 29, "train_loss": 2.6250381271362304, "train_acc": 0.32904, "test_loss": 5.969137829589844, "test_acc": 0.0584, "lyapunov": null, "grad_norm": 0.7326068006390382, "grad_max_sv": 0.27750224173069, "grad_min_sv": 1.3820259439634164e-08, "grad_condition": 23369103.19183632, "lr": 0.0009105746045668516, "time_sec": 49.66312098503113 }, { "epoch": 30, "train_loss": 2.5943477003479005, "train_acc": 0.3349, "test_loss": 5.8657053939819335, "test_acc": 0.0662, "lyapunov": null, "grad_norm": 0.7282576381570287, "grad_max_sv": 0.267722587287426, "grad_min_sv": 1.3611432567173232e-08, "grad_condition": 33832306.890324585, "lr": 0.0009045084971874733, "time_sec": 49.635533809661865 }, { "epoch": 31, "train_loss": 2.5734296069335936, "train_acc": 0.3377, "test_loss": 5.947202941894531, "test_acc": 0.0536, "lyapunov": null, "grad_norm": 0.72371197105418, "grad_max_sv": 0.2766475807875395, "grad_min_sv": 1.3626912859915353e-08, "grad_condition": 57961221.39827029, "lr": 0.0008982649590120977, "time_sec": 49.64917349815369 }, { "epoch": 32, "train_loss": 2.564406160736084, "train_acc": 0.34312, "test_loss": 5.720430706787109, "test_acc": 0.0515, "lyapunov": null, "grad_norm": 0.7163915374705971, "grad_max_sv": 0.25801267102360725, "grad_min_sv": 1.3336803814101295e-08, "grad_condition": 26182544.879379902, "lr": 0.0008918467286629196, "time_sec": 49.67513680458069 }, { "epoch": 33, "train_loss": 2.5487507371520994, "train_acc": 0.3468, "test_loss": 6.23959475479126, "test_acc": 0.0534, "lyapunov": null, "grad_norm": 0.7054942364907418, "grad_max_sv": 0.24919774606823922, "grad_min_sv": 1.306408175666407e-08, "grad_condition": 26801620.75531055, "lr": 0.0008852566213878943, "time_sec": 49.64692521095276 }, { "epoch": 34, "train_loss": 2.5242181804656982, "train_acc": 0.34942, "test_loss": 6.2963892974853515, "test_acc": 0.0553, "lyapunov": null, "grad_norm": 0.7016169815154498, "grad_max_sv": 0.25484145022928717, "grad_min_sv": 1.3042181151723397e-08, "grad_condition": 22430709.73115928, "lr": 0.000878497527825878, "time_sec": 49.654839754104614 }, { "epoch": 35, "train_loss": 2.5094819609832766, "train_acc": 0.35066, "test_loss": 6.719456141662597, "test_acc": 0.0546, "lyapunov": null, "grad_norm": 0.6984323559876441, "grad_max_sv": 0.25291088260710237, "grad_min_sv": 1.3091225495309722e-08, "grad_condition": 24055952.13732664, "lr": 0.000871572412738697, "time_sec": 49.63660550117493 }, { "epoch": 36, "train_loss": 2.482266076126099, "train_acc": 0.35974, "test_loss": 6.552088442993164, "test_acc": 0.0652, "lyapunov": null, "grad_norm": 0.6961085506168149, "grad_max_sv": 0.25587535500526426, "grad_min_sv": 1.3084706912414034e-08, "grad_condition": 29953242.59302296, "lr": 0.0008644843137107055, "time_sec": 49.636728286743164 }, { "epoch": 37, "train_loss": 2.4597298861694337, "train_acc": 0.36194, "test_loss": 7.314365348815918, "test_acc": 0.0495, "lyapunov": null, "grad_norm": 0.6914952761349973, "grad_max_sv": 0.24747973680496216, "grad_min_sv": 1.3026676748406629e-08, "grad_condition": 27342755.995011915, "lr": 0.0008572363398164014, "time_sec": 49.638224363327026 }, { "epoch": 38, "train_loss": 2.4654034370422364, "train_acc": 0.36094, "test_loss": 6.702982992553711, "test_acc": 0.0509, "lyapunov": null, "grad_norm": 0.6892432022946228, "grad_max_sv": 0.2394346885383129, "grad_min_sv": 1.273180681438113e-08, "grad_condition": 22022203.054304175, "lr": 0.0008498316702566826, "time_sec": 49.639644145965576 }, { "epoch": 39, "train_loss": 2.42667671333313, "train_acc": 0.36782, "test_loss": 6.179627616882324, "test_acc": 0.0407, "lyapunov": null, "grad_norm": 0.6855295822993354, "grad_max_sv": 0.24026529379189016, "grad_min_sv": 1.2694210569513809e-08, "grad_condition": 40057775.67721417, "lr": 0.0008422735529643442, "time_sec": 49.63581466674805 }, { "epoch": 40, "train_loss": 2.4109215718841552, "train_acc": 0.37052, "test_loss": 6.805292085266113, "test_acc": 0.0527, "lyapunov": null, "grad_norm": 0.6807278981220505, "grad_max_sv": 0.23731110394001007, "grad_min_sv": 1.2639894338140056e-08, "grad_condition": 27610612.2175704, "lr": 0.0008345653031794289, "time_sec": 49.64470100402832 }, { "epoch": 41, "train_loss": 2.394052338409424, "train_acc": 0.37456, "test_loss": 6.000495677947998, "test_acc": 0.0498, "lyapunov": null, "grad_norm": 0.684187370269629, "grad_max_sv": 0.24500937685370444, "grad_min_sv": 1.290876201071045e-08, "grad_condition": 57507496.68239377, "lr": 0.0008267103019950526, "time_sec": 49.64144778251648 }, { "epoch": 42, "train_loss": 2.369488366241455, "train_acc": 0.37932, "test_loss": 5.813188542175293, "test_acc": 0.0442, "lyapunov": null, "grad_norm": 0.6660607900191566, "grad_max_sv": 0.23581123538315296, "grad_min_sv": 1.243826876218268e-08, "grad_condition": 43225809.82445784, "lr": 0.0008187119948743447, "time_sec": 49.65106153488159 }, { "epoch": 43, "train_loss": 2.349871713409424, "train_acc": 0.38354, "test_loss": 6.650400701904297, "test_acc": 0.054, "lyapunov": null, "grad_norm": 0.6728559080292662, "grad_max_sv": 0.23216901496052741, "grad_min_sv": 1.2423243067605228e-08, "grad_condition": 97229672.46407479, "lr": 0.000810573890139155, "time_sec": 49.6483952999115 }, { "epoch": 44, "train_loss": 2.3327147588348387, "train_acc": 0.38762, "test_loss": 7.37770638885498, "test_acc": 0.0556, "lyapunov": null, "grad_norm": 0.6708437479650249, "grad_max_sv": 0.2353798534721136, "grad_min_sv": 1.2329054610571433e-08, "grad_condition": 24315327.09270349, "lr": 0.0008022995574311873, "time_sec": 49.649359464645386 }, { "epoch": 45, "train_loss": 2.3379388195037842, "train_acc": 0.38554, "test_loss": 7.32100400390625, "test_acc": 0.0447, "lyapunov": null, "grad_norm": 0.6690933212170967, "grad_max_sv": 0.23992121778428555, "grad_min_sv": 1.2581548722301328e-08, "grad_condition": 23582198.377444454, "lr": 0.0007938926261462363, "time_sec": 49.65408158302307 }, { "epoch": 46, "train_loss": 2.3259339227294924, "train_acc": 0.3881, "test_loss": 5.903630683898926, "test_acc": 0.0532, "lyapunov": null, "grad_norm": 0.6696674111669629, "grad_max_sv": 0.24237493835389615, "grad_min_sv": 1.264802341723395e-08, "grad_condition": 189995164.68487653, "lr": 0.0007853567838422158, "time_sec": 49.62894296646118 }, { "epoch": 47, "train_loss": 2.3060372606658937, "train_acc": 0.39222, "test_loss": 6.722331466674805, "test_acc": 0.052, "lyapunov": null, "grad_norm": 0.6608950831630619, "grad_max_sv": 0.2247944913804531, "grad_min_sv": 1.2062996512373236e-08, "grad_condition": 1083025267.50655, "lr": 0.0007766957746216719, "time_sec": 49.62338829040527 }, { "epoch": 48, "train_loss": 2.283214527587891, "train_acc": 0.39554, "test_loss": 6.30029787979126, "test_acc": 0.058, "lyapunov": null, "grad_norm": 0.6607285996206229, "grad_max_sv": 0.23341836147010325, "grad_min_sv": 1.2354938326575304e-08, "grad_condition": 30471435.85248127, "lr": 0.0007679133974894982, "time_sec": 49.62940454483032 }, { "epoch": 49, "train_loss": 2.2607837000274658, "train_acc": 0.39988, "test_loss": 5.6582544311523435, "test_acc": 0.0597, "lyapunov": null, "grad_norm": 0.6558663174998175, "grad_max_sv": 0.22986114919185638, "grad_min_sv": 1.2380245191512263e-08, "grad_condition": 37434404.18782197, "lr": 0.000759013504686565, "time_sec": 49.63751459121704 }, { "epoch": 50, "train_loss": 2.245105714797974, "train_acc": 0.40408, "test_loss": 6.382824391937256, "test_acc": 0.0387, "lyapunov": null, "grad_norm": 0.6549241097715082, "grad_max_sv": 0.2248407918959856, "grad_min_sv": 1.2180415326357163e-08, "grad_condition": 21126842.856077008, "lr": 0.0007499999999999998, "time_sec": 49.62160301208496 }, { "epoch": 51, "train_loss": 2.235931240615845, "train_acc": 0.40734, "test_loss": 5.594304537963867, "test_acc": 0.0703, "lyapunov": null, "grad_norm": 0.6606674978525966, "grad_max_sv": 0.23265439458191395, "grad_min_sv": 1.2417693201483005e-08, "grad_condition": 38123270.60577395, "lr": 0.0007408768370508575, "time_sec": 49.63914489746094 }, { "epoch": 52, "train_loss": 2.220252141571045, "train_acc": 0.40908, "test_loss": 5.49668860168457, "test_acc": 0.0417, "lyapunov": null, "grad_norm": 0.6502905279074903, "grad_max_sv": 0.23435013145208358, "grad_min_sv": 1.2266832496304891e-08, "grad_condition": 38310230.157323316, "lr": 0.0007316480175599307, "time_sec": 49.623440980911255 }, { "epoch": 53, "train_loss": 2.20186401260376, "train_acc": 0.41488, "test_loss": 6.196598785400391, "test_acc": 0.052, "lyapunov": null, "grad_norm": 0.6529977877477179, "grad_max_sv": 0.23160336054861547, "grad_min_sv": 1.213869888216923e-08, "grad_condition": 32786030.078148127, "lr": 0.0007223175895924635, "time_sec": 49.645137548446655 }, { "epoch": 54, "train_loss": 2.192180712852478, "train_acc": 0.41462, "test_loss": 6.966438492584229, "test_acc": 0.0515, "lyapunov": null, "grad_norm": 0.6546718868496101, "grad_max_sv": 0.23001223765313625, "grad_min_sv": 1.2304833968412864e-08, "grad_condition": 26553928.3741663, "lr": 0.0007128896457825361, "time_sec": 49.642454862594604 }, { "epoch": 55, "train_loss": 2.1692851805114746, "train_acc": 0.42174, "test_loss": 6.76854267578125, "test_acc": 0.0514, "lyapunov": null, "grad_norm": 0.6573722021244011, "grad_max_sv": 0.22808259911835194, "grad_min_sv": 1.2273855956590473e-08, "grad_condition": 23253160.925169718, "lr": 0.0007033683215378998, "time_sec": 49.62129521369934 }, { "epoch": 56, "train_loss": 2.1607114459228516, "train_acc": 0.42392, "test_loss": 6.366939366912842, "test_acc": 0.0595, "lyapunov": null, "grad_norm": 0.6541197760013122, "grad_max_sv": 0.2261738982051611, "grad_min_sv": 1.2211666097772245e-08, "grad_condition": 40339824.5426622, "lr": 0.0006937577932260512, "time_sec": 49.614548444747925 }, { "epoch": 57, "train_loss": 2.1550695499420165, "train_acc": 0.42292, "test_loss": 6.088698851013183, "test_acc": 0.0407, "lyapunov": null, "grad_norm": 0.6495499294349419, "grad_max_sv": 0.22787895202636718, "grad_min_sv": 1.2191535223027294e-08, "grad_condition": 46151755.99995027, "lr": 0.0006840622763423388, "time_sec": 49.86520218849182 }, { "epoch": 58, "train_loss": 2.1309228759002687, "train_acc": 0.4298, "test_loss": 6.714969717407227, "test_acc": 0.0476, "lyapunov": null, "grad_norm": 0.6501923826294874, "grad_max_sv": 0.2294207103550434, "grad_min_sv": 1.2324306024324993e-08, "grad_condition": 27012371.00660652, "lr": 0.0006742860236609073, "time_sec": 49.61659789085388 }, { "epoch": 59, "train_loss": 2.1276511294555664, "train_acc": 0.43052, "test_loss": 7.850105988311768, "test_acc": 0.0531, "lyapunov": null, "grad_norm": 0.6522053097296127, "grad_max_sv": 0.23177195861935615, "grad_min_sv": 1.2570549945412068e-08, "grad_condition": 21066069.902124517, "lr": 0.0006644333233692913, "time_sec": 49.61627125740051 }, { "epoch": 60, "train_loss": 2.108223154907227, "train_acc": 0.43206, "test_loss": 6.194909986877441, "test_acc": 0.0601, "lyapunov": null, "grad_norm": 0.6509457366232547, "grad_max_sv": 0.2232413150370121, "grad_min_sv": 1.2092985912648402e-08, "grad_condition": 20482533.369790833, "lr": 0.0006545084971874734, "time_sec": 49.638840198516846 }, { "epoch": 61, "train_loss": 2.0873364936828613, "train_acc": 0.43732, "test_loss": 7.149879702758789, "test_acc": 0.0579, "lyapunov": null, "grad_norm": 0.6448496636259025, "grad_max_sv": 0.2204914376139641, "grad_min_sv": 1.2118930678428619e-08, "grad_condition": 22158498.545212857, "lr": 0.0006445158984722354, "time_sec": 49.64352631568909 }, { "epoch": 62, "train_loss": 2.0711798847961425, "train_acc": 0.4403, "test_loss": 6.873784851074219, "test_acc": 0.0519, "lyapunov": null, "grad_norm": 0.650740813617645, "grad_max_sv": 0.23042820766568184, "grad_min_sv": 1.2226469767173676e-08, "grad_condition": 22253714.267564178, "lr": 0.0006344599103076324, "time_sec": 49.61197328567505 }, { "epoch": 63, "train_loss": 2.0670838510131837, "train_acc": 0.44428, "test_loss": 8.138898289489745, "test_acc": 0.0465, "lyapunov": null, "grad_norm": 0.6500300321497959, "grad_max_sv": 0.22807052806019784, "grad_min_sv": 1.2282747885450362e-08, "grad_condition": 25613801.10650332, "lr": 0.0006243449435824269, "time_sec": 49.64067339897156 }, { "epoch": 64, "train_loss": 2.0602053503417967, "train_acc": 0.44336, "test_loss": 6.739065780639648, "test_acc": 0.0435, "lyapunov": null, "grad_norm": 0.6438167751087027, "grad_max_sv": 0.21950027868151664, "grad_min_sv": 1.1978744509505424e-08, "grad_condition": 69086045.79764383, "lr": 0.0006141754350553275, "time_sec": 49.63843250274658 }, { "epoch": 65, "train_loss": 2.0289339319610598, "train_acc": 0.4504, "test_loss": 5.612693282318115, "test_acc": 0.0624, "lyapunov": null, "grad_norm": 0.643091891417901, "grad_max_sv": 0.2296879008412361, "grad_min_sv": 1.2095985612095573e-08, "grad_condition": 207267738.03108597, "lr": 0.0006039558454088793, "time_sec": 49.621809244155884 }, { "epoch": 66, "train_loss": 2.017880793533325, "train_acc": 0.45524, "test_loss": 5.917317507934571, "test_acc": 0.0569, "lyapunov": null, "grad_norm": 0.6458313703477052, "grad_max_sv": 0.2203237745910883, "grad_min_sv": 1.2053612886975263e-08, "grad_condition": 30573308.01952803, "lr": 0.000593690657292862, "time_sec": 49.62665867805481 }, { "epoch": 67, "train_loss": 2.00664087310791, "train_acc": 0.45516, "test_loss": 5.649988233947754, "test_acc": 0.0551, "lyapunov": null, "grad_norm": 0.6469506065081965, "grad_max_sv": 0.22469568885862828, "grad_min_sv": 1.2245062176730048e-08, "grad_condition": 29605005.92733214, "lr": 0.0005833843733580507, "time_sec": 49.66580653190613 }, { "epoch": 68, "train_loss": 1.9934558868789674, "train_acc": 0.45752, "test_loss": 6.518855290222168, "test_acc": 0.0474, "lyapunov": null, "grad_norm": 0.6449120600766396, "grad_max_sv": 0.22343773469328881, "grad_min_sv": 1.2075202887595893e-08, "grad_condition": 20470063.13805929, "lr": 0.0005730415142812054, "time_sec": 49.649908781051636 }, { "epoch": 69, "train_loss": 1.9819465933609008, "train_acc": 0.4615, "test_loss": 5.741820652770996, "test_acc": 0.0576, "lyapunov": null, "grad_norm": 0.6444073081455958, "grad_max_sv": 0.2133765324950218, "grad_min_sv": 1.1591837454538903e-08, "grad_condition": 7400690970.849569, "lr": 0.0005626666167821517, "time_sec": 49.64708852767944 }, { "epoch": 70, "train_loss": 1.9717326400756836, "train_acc": 0.4635, "test_loss": 6.180095139312744, "test_acc": 0.0538, "lyapunov": null, "grad_norm": 0.646339670655307, "grad_max_sv": 0.22971010841429235, "grad_min_sv": 1.1938921282844683e-08, "grad_condition": 42308986.45036293, "lr": 0.0005522642316338265, "time_sec": 49.65745282173157 }, { "epoch": 71, "train_loss": 1.947042868385315, "train_acc": 0.46858, "test_loss": 5.758691899871827, "test_acc": 0.0481, "lyapunov": null, "grad_norm": 0.6454285691467331, "grad_max_sv": 0.21988087929785252, "grad_min_sv": 1.2038080984128063e-08, "grad_condition": 54275907.24262571, "lr": 0.0005418389216661573, "time_sec": 49.655876874923706 }, { "epoch": 72, "train_loss": 1.9380216747283936, "train_acc": 0.47278, "test_loss": 5.360606885528564, "test_acc": 0.0499, "lyapunov": null, "grad_norm": 0.6445951712238421, "grad_max_sv": 0.22141558788716792, "grad_min_sv": 1.2052524836839163e-08, "grad_condition": 52658770.62947424, "lr": 0.0005313952597646563, "time_sec": 49.643407106399536 }, { "epoch": 73, "train_loss": 1.9315852340698243, "train_acc": 0.47042, "test_loss": 5.562986553955078, "test_acc": 0.0528, "lyapunov": null, "grad_norm": 0.6455449182300289, "grad_max_sv": 0.22759805843234063, "grad_min_sv": 1.2166670372570909e-08, "grad_condition": 25263034.87545003, "lr": 0.0005209378268645994, "time_sec": 49.65730333328247 }, { "epoch": 74, "train_loss": 1.9174984769439698, "train_acc": 0.47274, "test_loss": 5.779887171173096, "test_acc": 0.0526, "lyapunov": null, "grad_norm": 0.6408982744466406, "grad_max_sv": 0.223176771402359, "grad_min_sv": 1.1881650463507754e-08, "grad_condition": 21609418.938555025, "lr": 0.0005104712099416781, "time_sec": 49.63982319831848 }, { "epoch": 75, "train_loss": 1.9022090718841553, "train_acc": 0.47956, "test_loss": 6.74227056427002, "test_acc": 0.0396, "lyapunov": null, "grad_norm": 0.6439391169821848, "grad_max_sv": 0.22340110316872597, "grad_min_sv": 1.1930816612437667e-08, "grad_condition": 22835938.88370643, "lr": 0.0004999999999999996, "time_sec": 49.6373016834259 }, { "epoch": 76, "train_loss": 1.8833642294311523, "train_acc": 0.48212, "test_loss": 6.253941902160644, "test_acc": 0.0401, "lyapunov": null, "grad_norm": 0.6458465784916259, "grad_max_sv": 0.2219920836389065, "grad_min_sv": 1.1862058124645358e-08, "grad_condition": 24923864.351812743, "lr": 0.0004895287900583212, "time_sec": 49.63244032859802 }, { "epoch": 77, "train_loss": 1.872097596054077, "train_acc": 0.4862, "test_loss": 7.115831829833985, "test_acc": 0.0455, "lyapunov": null, "grad_norm": 0.6389496343286681, "grad_max_sv": 0.2166093897074461, "grad_min_sv": 1.1753041695428124e-08, "grad_condition": 123847363.5090142, "lr": 0.0004790621731353997, "time_sec": 49.65565347671509 }, { "epoch": 78, "train_loss": 1.8647768477630615, "train_acc": 0.48824, "test_loss": 6.585789360046387, "test_acc": 0.0461, "lyapunov": null, "grad_norm": 0.6430712356182874, "grad_max_sv": 0.2195899412035942, "grad_min_sv": 1.2243656302224696e-08, "grad_condition": 424951771.80469763, "lr": 0.000468604740235343, "time_sec": 49.62981295585632 }, { "epoch": 79, "train_loss": 1.8419312603759765, "train_acc": 0.49144, "test_loss": 6.8796092208862305, "test_acc": 0.0534, "lyapunov": null, "grad_norm": 0.6438732522551095, "grad_max_sv": 0.223552468046546, "grad_min_sv": 1.2100811991712716e-08, "grad_condition": 310767823.54431427, "lr": 0.00045816107833384175, "time_sec": 49.63279318809509 }, { "epoch": 80, "train_loss": 1.8222150116348266, "train_acc": 0.49938, "test_loss": 6.9083010223388674, "test_acc": 0.0574, "lyapunov": null, "grad_norm": 0.646876723364354, "grad_max_sv": 0.22485989183187485, "grad_min_sv": 1.2241183645900212e-08, "grad_condition": 28086849.755860113, "lr": 0.0004477357683661729, "time_sec": 49.6425895690918 }, { "epoch": 81, "train_loss": 1.813687347946167, "train_acc": 0.49976, "test_loss": 6.90407081451416, "test_acc": 0.04, "lyapunov": null, "grad_norm": 0.642733217341124, "grad_max_sv": 0.22463089227676392, "grad_min_sv": 1.2082413675118531e-08, "grad_condition": 22301589.48218178, "lr": 0.00043733338321784746, "time_sec": 49.629480838775635 }, { "epoch": 82, "train_loss": 1.7951585668945313, "train_acc": 0.5034, "test_loss": 7.836273937988281, "test_acc": 0.0512, "lyapunov": null, "grad_norm": 0.6454340294520209, "grad_max_sv": 0.22539752162992954, "grad_min_sv": 1.1886250314216417e-08, "grad_condition": 59544024.862964645, "lr": 0.0004269584857187939, "time_sec": 49.61994457244873 }, { "epoch": 83, "train_loss": 1.7966358541488647, "train_acc": 0.50272, "test_loss": 7.222357276916504, "test_acc": 0.0579, "lyapunov": null, "grad_norm": 0.6453223951998842, "grad_max_sv": 0.22831037007272242, "grad_min_sv": 1.203974950118869e-08, "grad_condition": 82894748.52704917, "lr": 0.0004166156266419484, "time_sec": 49.673835039138794 }, { "epoch": 84, "train_loss": 1.7854290616226196, "train_acc": 0.50408, "test_loss": 6.414771678161621, "test_acc": 0.0601, "lyapunov": null, "grad_norm": 0.6427673490554981, "grad_max_sv": 0.2182640478014946, "grad_min_sv": 1.202259434229802e-08, "grad_condition": 21861556.418338913, "lr": 0.0004063093427071373, "time_sec": 49.64637732505798 }, { "epoch": 85, "train_loss": 1.7772653774261475, "train_acc": 0.5111, "test_loss": 7.505108009338379, "test_acc": 0.0616, "lyapunov": null, "grad_norm": 0.6410246970315546, "grad_max_sv": 0.2277263168245554, "grad_min_sv": 1.1847804396586393e-08, "grad_condition": 36055137.59124441, "lr": 0.0003960441545911199, "time_sec": 49.642088174819946 }, { "epoch": 86, "train_loss": 1.7477331000518799, "train_acc": 0.5147, "test_loss": 7.709722770690918, "test_acc": 0.0449, "lyapunov": null, "grad_norm": 0.6439998427728569, "grad_max_sv": 0.22573819942772388, "grad_min_sv": 1.2154757376287017e-08, "grad_condition": 47618357.203088775, "lr": 0.0003858245649446718, "time_sec": 49.63089942932129 }, { "epoch": 87, "train_loss": 1.7338512952423095, "train_acc": 0.51864, "test_loss": 7.293183726501465, "test_acc": 0.0531, "lyapunov": null, "grad_norm": 0.6450352139357391, "grad_max_sv": 0.2251686044037342, "grad_min_sv": 1.2090907994255495e-08, "grad_condition": 23129638.107943743, "lr": 0.00037565505641757235, "time_sec": 49.62959694862366 }, { "epoch": 88, "train_loss": 1.7305470868301391, "train_acc": 0.51752, "test_loss": 6.886636978912353, "test_acc": 0.0621, "lyapunov": null, "grad_norm": 0.6466229739487265, "grad_max_sv": 0.2285929098725319, "grad_min_sv": 1.2207108990238031e-08, "grad_condition": 639961294.3776948, "lr": 0.00036554008969236695, "time_sec": 49.64359998703003 }, { "epoch": 89, "train_loss": 1.7247330599212647, "train_acc": 0.52118, "test_loss": 7.737054846954345, "test_acc": 0.0492, "lyapunov": null, "grad_norm": 0.6431070021674609, "grad_max_sv": 0.21853713542222977, "grad_min_sv": 1.1871128499651996e-08, "grad_condition": 34316573.10990389, "lr": 0.0003554841015277638, "time_sec": 49.6319477558136 }, { "epoch": 90, "train_loss": 1.704887728881836, "train_acc": 0.52374, "test_loss": 6.713198412322998, "test_acc": 0.0556, "lyapunov": null, "grad_norm": 0.6451375385492529, "grad_max_sv": 0.22224950045347214, "grad_min_sv": 1.2021271361684072e-08, "grad_condition": 25574543.625141606, "lr": 0.000345491502812526, "time_sec": 49.63963174819946 }, { "epoch": 91, "train_loss": 1.701412860145569, "train_acc": 0.52644, "test_loss": 7.295478704833984, "test_acc": 0.0429, "lyapunov": null, "grad_norm": 0.6447266155116032, "grad_max_sv": 0.23335366621613501, "grad_min_sv": 1.257304017843186e-08, "grad_condition": 24036732.36328527, "lr": 0.0003355666766307081, "time_sec": 49.665791511535645 }, { "epoch": 92, "train_loss": 1.6871472067642213, "train_acc": 0.53048, "test_loss": 7.389536867523193, "test_acc": 0.0375, "lyapunov": null, "grad_norm": 0.6468836541708367, "grad_max_sv": 0.2225259728729725, "grad_min_sv": 1.1890293904331939e-08, "grad_condition": 29650216.370129876, "lr": 0.00032571397633909225, "time_sec": 49.64622926712036 }, { "epoch": 93, "train_loss": 1.6749127053833008, "train_acc": 0.53202, "test_loss": 8.144829412078858, "test_acc": 0.0401, "lyapunov": null, "grad_norm": 0.6416574148081634, "grad_max_sv": 0.22841569185256957, "grad_min_sv": 1.2051048693673128e-08, "grad_condition": 29017060.070413183, "lr": 0.00031593772365766094, "time_sec": 49.649181604385376 }, { "epoch": 94, "train_loss": 1.6659465893936156, "train_acc": 0.53198, "test_loss": 7.906325871276856, "test_acc": 0.0523, "lyapunov": null, "grad_norm": 0.6442484947336338, "grad_max_sv": 0.22283854335546494, "grad_min_sv": 1.1940718097624981e-08, "grad_condition": 23900914.940908086, "lr": 0.0003062422067739483, "time_sec": 49.64401292800903 }, { "epoch": 95, "train_loss": 1.6399671975326537, "train_acc": 0.53952, "test_loss": 7.157633497619629, "test_acc": 0.0527, "lyapunov": null, "grad_norm": 0.6406645370679923, "grad_max_sv": 0.22293368987739087, "grad_min_sv": 1.2085724485771942e-08, "grad_condition": 56163384.20133088, "lr": 0.00029663167846209965, "time_sec": 49.6225950717926 }, { "epoch": 96, "train_loss": 1.6436440280532838, "train_acc": 0.5397, "test_loss": 8.535991598510742, "test_acc": 0.0515, "lyapunov": null, "grad_norm": 0.6492588500387332, "grad_max_sv": 0.22496760375797747, "grad_min_sv": 1.180983480297132e-08, "grad_condition": 106906297.43684229, "lr": 0.00028711035421746345, "time_sec": 49.64288353919983 }, { "epoch": 97, "train_loss": 1.6246039770889282, "train_acc": 0.54446, "test_loss": 8.059152350616456, "test_acc": 0.0505, "lyapunov": null, "grad_norm": 0.6473823340688163, "grad_max_sv": 0.23146028257906437, "grad_min_sv": 1.2134549565862019e-08, "grad_condition": 35822540.74264745, "lr": 0.00027768241040753615, "time_sec": 49.6298463344574 }, { "epoch": 98, "train_loss": 1.61877662109375, "train_acc": 0.54736, "test_loss": 8.167729595947266, "test_acc": 0.038, "lyapunov": null, "grad_norm": 0.6455041816035443, "grad_max_sv": 0.22865931317210197, "grad_min_sv": 1.1919900413936979e-08, "grad_condition": 28498587.531759303, "lr": 0.00026835198244006903, "time_sec": 49.63332438468933 }, { "epoch": 99, "train_loss": 3.068192625274658, "train_acc": 0.31474, "test_loss": 5.048260988616943, "test_acc": 0.1146, "lyapunov": null, "grad_norm": 0.8608040247164788, "grad_max_sv": 0.3330514427274466, "grad_min_sv": 1.6094786775555646e-08, "grad_condition": 28526093.82209841, "lr": 0.0002591231629491421, "time_sec": 49.662447690963745 }, { "epoch": 100, "train_loss": 2.316078476104736, "train_acc": 0.39026, "test_loss": 5.392445658874512, "test_acc": 0.0879, "lyapunov": null, "grad_norm": 0.658192665007455, "grad_max_sv": 0.22761380225419997, "grad_min_sv": 1.2582580913994557e-08, "grad_condition": 55399675.47104869, "lr": 0.0002499999999999997, "time_sec": 49.64076352119446 }, { "epoch": 101, "train_loss": 2.1483063832855223, "train_acc": 0.42276, "test_loss": 5.986578815460205, "test_acc": 0.0707, "lyapunov": null, "grad_norm": 0.6484922643705857, "grad_max_sv": 0.22837907671928406, "grad_min_sv": 1.2391293061075892e-08, "grad_condition": 23094080.352399424, "lr": 0.00024098649531343477, "time_sec": 49.6578733921051 }, { "epoch": 102, "train_loss": 2.05953384185791, "train_acc": 0.4427, "test_loss": 6.080546961212158, "test_acc": 0.0573, "lyapunov": null, "grad_norm": 0.6484188898656511, "grad_max_sv": 0.22914629317820073, "grad_min_sv": 1.2451091090104338e-08, "grad_condition": 62209882.03375574, "lr": 0.0002320866025105016, "time_sec": 49.63767695426941 }, { "epoch": 103, "train_loss": 2.004299710121155, "train_acc": 0.45614, "test_loss": 5.895175799560547, "test_acc": 0.0578, "lyapunov": null, "grad_norm": 0.6399422615270736, "grad_max_sv": 0.23107412382960318, "grad_min_sv": 1.2409910121746748e-08, "grad_condition": 22284137.40025208, "lr": 0.0002233042253783278, "time_sec": 49.65248942375183 }, { "epoch": 104, "train_loss": 1.9571235482788085, "train_acc": 0.46526, "test_loss": 5.738465850830078, "test_acc": 0.0523, "lyapunov": null, "grad_norm": 0.6391319009023594, "grad_max_sv": 0.2172716658562422, "grad_min_sv": 1.1984206682580378e-08, "grad_condition": 20112915.921763636, "lr": 0.000214643216157784, "time_sec": 49.633373975753784 }, { "epoch": 105, "train_loss": 1.9224023293304444, "train_acc": 0.47322, "test_loss": 6.117083155059815, "test_acc": 0.05, "lyapunov": null, "grad_norm": 0.6402482339469217, "grad_max_sv": 0.21523526906967164, "grad_min_sv": 1.1972073542948491e-08, "grad_condition": 36228791.07592559, "lr": 0.00020610737385376332, "time_sec": 49.63998031616211 }, { "epoch": 106, "train_loss": 1.8866684201812745, "train_acc": 0.4833, "test_loss": 5.936769345855713, "test_acc": 0.0439, "lyapunov": null, "grad_norm": 0.6419042012012792, "grad_max_sv": 0.22602429389953613, "grad_min_sv": 1.2054361504115762e-08, "grad_condition": 48343281.63861313, "lr": 0.00019770044256881242, "time_sec": 49.65153455734253 }, { "epoch": 107, "train_loss": 1.8594331677246094, "train_acc": 0.48626, "test_loss": 6.035185343170166, "test_acc": 0.046, "lyapunov": null, "grad_norm": 0.6436629646723144, "grad_max_sv": 0.21455634236335755, "grad_min_sv": 1.1783472720489074e-08, "grad_condition": 38784276.09698713, "lr": 0.0001894261098608447, "time_sec": 49.66721272468567 }, { "epoch": 108, "train_loss": 1.8262966638946534, "train_acc": 0.49558, "test_loss": 6.42567989654541, "test_acc": 0.0425, "lyapunov": null, "grad_norm": 0.6468304513936767, "grad_max_sv": 0.22701141163706778, "grad_min_sv": 1.216740327554533e-08, "grad_condition": 72116525.85188936, "lr": 0.000181288005125655, "time_sec": 49.65104866027832 }, { "epoch": 109, "train_loss": 1.8205863860321045, "train_acc": 0.49754, "test_loss": 5.783528507995605, "test_acc": 0.0367, "lyapunov": null, "grad_norm": 0.643976690980956, "grad_max_sv": 0.21868419870734215, "grad_min_sv": 1.2079363115313768e-08, "grad_condition": 20195547.998739578, "lr": 0.0001732896980049473, "time_sec": 49.66611671447754 }, { "epoch": 110, "train_loss": 1.793330860900879, "train_acc": 0.5022, "test_loss": 6.1977317413330075, "test_acc": 0.0425, "lyapunov": null, "grad_norm": 0.6468160086891667, "grad_max_sv": 0.2236340381205082, "grad_min_sv": 1.1926133475226308e-08, "grad_condition": 32237535.591110267, "lr": 0.00016543469682057076, "time_sec": 49.63362669944763 }, { "epoch": 111, "train_loss": 1.7825101839828492, "train_acc": 0.5064, "test_loss": 6.178716979980469, "test_acc": 0.0443, "lyapunov": null, "grad_norm": 0.6424263059147781, "grad_max_sv": 0.22070568352937697, "grad_min_sv": 1.1919835535972866e-08, "grad_condition": 37842182.06602182, "lr": 0.00015772644703565552, "time_sec": 49.65402150154114 }, { "epoch": 112, "train_loss": 1.7541921194458008, "train_acc": 0.5103, "test_loss": 6.0973250106811525, "test_acc": 0.0475, "lyapunov": null, "grad_norm": 0.6481497742539534, "grad_max_sv": 0.22489695958793163, "grad_min_sv": 1.2136619546854188e-08, "grad_condition": 29561688.482165914, "lr": 0.00015016832974331713, "time_sec": 49.65926122665405 }, { "epoch": 113, "train_loss": 1.7488899993515015, "train_acc": 0.51458, "test_loss": 5.979724680328369, "test_acc": 0.0424, "lyapunov": null, "grad_norm": 0.6406667137370472, "grad_max_sv": 0.22864535339176656, "grad_min_sv": 1.191089982824356e-08, "grad_condition": 56508420.06490357, "lr": 0.00014276366018359834, "time_sec": 49.62884473800659 }, { "epoch": 114, "train_loss": 1.7389903827667237, "train_acc": 0.51522, "test_loss": 5.958202845001221, "test_acc": 0.0517, "lyapunov": null, "grad_norm": 0.6426356824149351, "grad_max_sv": 0.22491934411227704, "grad_min_sv": 1.2247705622608906e-08, "grad_condition": 58131203.41244085, "lr": 0.00013551568628929425, "time_sec": 49.62388038635254 }, { "epoch": 115, "train_loss": 1.7231919304656982, "train_acc": 0.52138, "test_loss": 6.056362869262696, "test_acc": 0.0478, "lyapunov": null, "grad_norm": 0.6495040089755264, "grad_max_sv": 0.22354965060949325, "grad_min_sv": 1.2017865864966116e-08, "grad_condition": 28069335.9052594, "lr": 0.00012842758726130276, "time_sec": 49.6635365486145 }, { "epoch": 116, "train_loss": 1.6999663226699828, "train_acc": 0.52556, "test_loss": 6.322325106811523, "test_acc": 0.0459, "lyapunov": null, "grad_norm": 0.6439980745634726, "grad_max_sv": 0.22484406568109988, "grad_min_sv": 1.2245539982025377e-08, "grad_condition": 27693634.55346756, "lr": 0.0001215024721741218, "time_sec": 49.667264223098755 }, { "epoch": 117, "train_loss": 1.6914007580566406, "train_acc": 0.52596, "test_loss": 6.2398702270507815, "test_acc": 0.0358, "lyapunov": null, "grad_norm": 0.6406992341206976, "grad_max_sv": 0.22702743746340276, "grad_min_sv": 1.2027920018309323e-08, "grad_condition": 25480937.943885125, "lr": 0.00011474337861210538, "time_sec": 49.75715970993042 }, { "epoch": 118, "train_loss": 1.682532057723999, "train_acc": 0.5269, "test_loss": 6.022721984863281, "test_acc": 0.0502, "lyapunov": null, "grad_norm": 0.6475614121887046, "grad_max_sv": 0.22498515360057353, "grad_min_sv": 1.2050166899382763e-08, "grad_condition": 76251711.1097268, "lr": 0.00010815327133708009, "time_sec": 49.63880777359009 }, { "epoch": 119, "train_loss": 1.6772437452697755, "train_acc": 0.53014, "test_loss": 5.847724533081054, "test_acc": 0.0456, "lyapunov": null, "grad_norm": 0.645505943920055, "grad_max_sv": 0.22384067326784135, "grad_min_sv": 1.1783700598622104e-08, "grad_condition": 22583004.98493171, "lr": 0.00010173504098790182, "time_sec": 49.63686180114746 }, { "epoch": 120, "train_loss": 1.6719491082763671, "train_acc": 0.53248, "test_loss": 5.856200427246094, "test_acc": 0.0427, "lyapunov": null, "grad_norm": 0.6466969899308954, "grad_max_sv": 0.2293648473918438, "grad_min_sv": 1.2215246461555474e-08, "grad_condition": 26750165.211627714, "lr": 9.549150281252629e-05, "time_sec": 49.633697748184204 }, { "epoch": 121, "train_loss": 1.6578344228744506, "train_acc": 0.53442, "test_loss": 5.862105746459961, "test_acc": 0.0534, "lyapunov": null, "grad_norm": 0.6460809469464214, "grad_max_sv": 0.2225838266313076, "grad_min_sv": 1.212055693311509e-08, "grad_condition": 24676272.501794428, "lr": 8.942539543314794e-05, "time_sec": 49.647422790527344 }, { "epoch": 122, "train_loss": 1.6389700134658813, "train_acc": 0.54052, "test_loss": 5.913293504333496, "test_acc": 0.0439, "lyapunov": null, "grad_norm": 0.6468970710870378, "grad_max_sv": 0.22489394322037698, "grad_min_sv": 1.1876642090624667e-08, "grad_condition": 27879869.134462822, "lr": 8.353937964495024e-05, "time_sec": 49.6471688747406 }, { "epoch": 123, "train_loss": 1.6408760947418213, "train_acc": 0.539, "test_loss": 5.881608892822266, "test_acc": 0.0455, "lyapunov": null, "grad_norm": 0.6409502867501498, "grad_max_sv": 0.2229029569774866, "grad_min_sv": 1.1994366785894606e-08, "grad_condition": 23946080.329339217, "lr": 7.783603724899243e-05, "time_sec": 49.645761013031006 }, { "epoch": 124, "train_loss": 1.6327575244140624, "train_acc": 0.54088, "test_loss": 6.092592315673828, "test_acc": 0.0442, "lyapunov": null, "grad_norm": 0.6388358623443664, "grad_max_sv": 0.22407596856355666, "grad_min_sv": 1.1999070549661983e-08, "grad_condition": 29088864.422511287, "lr": 7.231786991974666e-05, "time_sec": 49.63370180130005 }, { "epoch": 125, "train_loss": 1.626538638381958, "train_acc": 0.54214, "test_loss": 6.060646697998047, "test_acc": 0.0498, "lyapunov": null, "grad_norm": 0.649112571277706, "grad_max_sv": 0.22536444179713727, "grad_min_sv": 1.2212023835916908e-08, "grad_condition": 35126636.74446645, "lr": 6.698729810778072e-05, "time_sec": 49.61126947402954 }, { "epoch": 126, "train_loss": 1.6151732135009766, "train_acc": 0.54378, "test_loss": 6.19133405456543, "test_acc": 0.0452, "lyapunov": null, "grad_norm": 0.645551187410472, "grad_max_sv": 0.227165062725544, "grad_min_sv": 1.194181808161776e-08, "grad_condition": 24734104.665951073, "lr": 6.184665997806817e-05, "time_sec": 49.74283456802368 }, { "epoch": 127, "train_loss": 1.6116835289764404, "train_acc": 0.54702, "test_loss": 6.264876268768311, "test_acc": 0.0576, "lyapunov": null, "grad_norm": 0.6449882086043084, "grad_max_sv": 0.2281236581504345, "grad_min_sv": 1.2174795581409992e-08, "grad_condition": 33327591.078247894, "lr": 5.6898210384392595e-05, "time_sec": 49.66547632217407 }, { "epoch": 128, "train_loss": 1.6025007713317871, "train_acc": 0.55014, "test_loss": 6.29011365814209, "test_acc": 0.0469, "lyapunov": null, "grad_norm": 0.6498584112316286, "grad_max_sv": 0.22942896112799643, "grad_min_sv": 1.2217025608090431e-08, "grad_condition": 181633490.37894756, "lr": 5.214411988029363e-05, "time_sec": 49.644524574279785 }, { "epoch": 129, "train_loss": 1.6006367045974732, "train_acc": 0.55154, "test_loss": 5.960230406188965, "test_acc": 0.0484, "lyapunov": null, "grad_norm": 0.6474761633146622, "grad_max_sv": 0.22425766214728354, "grad_min_sv": 1.2069871824227363e-08, "grad_condition": 25614798.36847374, "lr": 4.7586473766990294e-05, "time_sec": 49.63229012489319 }, { "epoch": 130, "train_loss": 1.5994749016952514, "train_acc": 0.54798, "test_loss": 6.082809280395508, "test_acc": 0.0462, "lyapunov": null, "grad_norm": 0.6436297587317452, "grad_max_sv": 0.2260743647813797, "grad_min_sv": 1.197359623186789e-08, "grad_condition": 47224918.84575805, "lr": 4.32272711786996e-05, "time_sec": 49.653711795806885 }, { "epoch": 131, "train_loss": 1.5907676587677002, "train_acc": 0.55338, "test_loss": 6.253540195465088, "test_acc": 0.0493, "lyapunov": null, "grad_norm": 0.6404122118978958, "grad_max_sv": 0.2243455123156309, "grad_min_sv": 1.1890854798024541e-08, "grad_condition": 28094398.171041556, "lr": 3.906842420574966e-05, "time_sec": 49.65587568283081 }, { "epoch": 132, "train_loss": 1.591219468383789, "train_acc": 0.55168, "test_loss": 6.408939161682129, "test_acc": 0.0426, "lyapunov": null, "grad_norm": 0.6506622903315123, "grad_max_sv": 0.23343092501163482, "grad_min_sv": 1.2356089287846039e-08, "grad_condition": 31524710.75405284, "lr": 3.5111757055874305e-05, "time_sec": 49.64363932609558 }, { "epoch": 133, "train_loss": 1.5818653707885741, "train_acc": 0.55544, "test_loss": 6.288112886047363, "test_acc": 0.0416, "lyapunov": null, "grad_norm": 0.641538436455134, "grad_max_sv": 0.22353356778621675, "grad_min_sv": 1.1930217144046074e-08, "grad_condition": 35984070.824167676, "lr": 3.1359005254054254e-05, "time_sec": 49.6272132396698 }, { "epoch": 134, "train_loss": 1.5757408687973022, "train_acc": 0.5551, "test_loss": 6.169788475036621, "test_acc": 0.0436, "lyapunov": null, "grad_norm": 0.6422263506494424, "grad_max_sv": 0.22716106660664082, "grad_min_sv": 1.1833126612598166e-08, "grad_condition": 52859395.957509615, "lr": 2.7811814881259484e-05, "time_sec": 49.634817600250244 }, { "epoch": 135, "train_loss": 1.573296899986267, "train_acc": 0.5586, "test_loss": 6.409516627502441, "test_acc": 0.0398, "lyapunov": null, "grad_norm": 0.6422323193959601, "grad_max_sv": 0.21986942775547505, "grad_min_sv": 1.1918038018803035e-08, "grad_condition": 135103466.34543505, "lr": 2.4471741852423218e-05, "time_sec": 49.644601583480835 }, { "epoch": 136, "train_loss": 1.5735322719573974, "train_acc": 0.55498, "test_loss": 6.962667681884765, "test_acc": 0.0438, "lyapunov": null, "grad_norm": 0.6425705125331251, "grad_max_sv": 0.22957376427948475, "grad_min_sv": 1.2022417819265719e-08, "grad_condition": 84953424.74808493, "lr": 2.1340251233966362e-05, "time_sec": 49.65340971946716 }, { "epoch": 137, "train_loss": 1.5703629438018798, "train_acc": 0.55592, "test_loss": 6.347426979064942, "test_acc": 0.0416, "lyapunov": null, "grad_norm": 0.6470089432203813, "grad_max_sv": 0.22675703540444375, "grad_min_sv": 1.1964806787001515e-08, "grad_condition": 42242032.09383811, "lr": 1.8418716601170932e-05, "time_sec": 49.65664100646973 }, { "epoch": 138, "train_loss": 1.5664401405334472, "train_acc": 0.55756, "test_loss": 6.496471109771728, "test_acc": 0.0445, "lyapunov": null, "grad_norm": 0.6430396727274027, "grad_max_sv": 0.22493685856461526, "grad_min_sv": 1.2061497275950295e-08, "grad_condition": 23954534.1998593, "lr": 1.570841943568445e-05, "time_sec": 49.642067432403564 }, { "epoch": 139, "train_loss": 1.5627032785415649, "train_acc": 0.5605, "test_loss": 6.283855271148681, "test_acc": 0.0447, "lyapunov": null, "grad_norm": 0.6409841113210015, "grad_max_sv": 0.2232666589319706, "grad_min_sv": 1.1962911396386222e-08, "grad_condition": 259592659.58503166, "lr": 1.3210548563419845e-05, "time_sec": 49.632962465286255 }, { "epoch": 140, "train_loss": 1.5663015616226197, "train_acc": 0.55768, "test_loss": 6.220936709594727, "test_acc": 0.0479, "lyapunov": null, "grad_norm": 0.6429008373506699, "grad_max_sv": 0.22778371684253215, "grad_min_sv": 1.2041603553170077e-08, "grad_condition": 67987905.64758533, "lr": 1.0926199633097203e-05, "time_sec": 49.615734338760376 }, { "epoch": 141, "train_loss": 1.5625858126068115, "train_acc": 0.56096, "test_loss": 6.526646176147461, "test_acc": 0.0493, "lyapunov": null, "grad_norm": 0.6377897998533895, "grad_max_sv": 0.2237264908850193, "grad_min_sv": 1.2073943828072586e-08, "grad_condition": 21432345.22954327, "lr": 8.856374635655688e-06, "time_sec": 49.64499115943909 }, { "epoch": 142, "train_loss": 1.551087869529724, "train_acc": 0.56178, "test_loss": 6.401860023498535, "test_acc": 0.0441, "lyapunov": null, "grad_norm": 0.6415643857015031, "grad_max_sv": 0.2261370625346899, "grad_min_sv": 1.2029182526809845e-08, "grad_condition": 66314375.58164777, "lr": 7.001981464747503e-06, "time_sec": 49.65327548980713 }, { "epoch": 143, "train_loss": 1.5571945658111572, "train_acc": 0.55928, "test_loss": 6.133491006469726, "test_acc": 0.0486, "lyapunov": null, "grad_norm": 0.6447257277887289, "grad_max_sv": 0.22846047319471835, "grad_min_sv": 1.2135202965418701e-08, "grad_condition": 37586048.51019514, "lr": 5.3638335185058295e-06, "time_sec": 49.65649223327637 }, { "epoch": 144, "train_loss": 1.5559558386611938, "train_acc": 0.5614, "test_loss": 6.064924475097656, "test_acc": 0.052, "lyapunov": null, "grad_norm": 0.6401487690577669, "grad_max_sv": 0.2242697723209858, "grad_min_sv": 1.1992281666317605e-08, "grad_condition": 25437338.27988875, "lr": 3.942649342761114e-06, "time_sec": 49.635279178619385 }, { "epoch": 145, "train_loss": 1.553707954940796, "train_acc": 0.56286, "test_loss": 6.5988156112670895, "test_acc": 0.0458, "lyapunov": null, "grad_norm": 0.6407793832198755, "grad_max_sv": 0.23003120347857475, "grad_min_sv": 1.1913595625301366e-08, "grad_condition": 32004871.034651928, "lr": 2.7390523158633524e-06, "time_sec": 49.659799575805664 }, { "epoch": 146, "train_loss": 1.556730777015686, "train_acc": 0.56224, "test_loss": 6.555442190551758, "test_acc": 0.0442, "lyapunov": null, "grad_norm": 0.6414928448640214, "grad_max_sv": 0.22317990958690642, "grad_min_sv": 1.2069366867430501e-08, "grad_condition": 382827154.51718956, "lr": 1.7535703752478133e-06, "time_sec": 49.64200186729431 }, { "epoch": 147, "train_loss": 1.5659333599090577, "train_acc": 0.55716, "test_loss": 6.271022132873535, "test_acc": 0.0492, "lyapunov": null, "grad_norm": 0.6449744450875666, "grad_max_sv": 0.22341229021549225, "grad_min_sv": 1.2069372681833279e-08, "grad_condition": 29803939.928126138, "lr": 9.866357858642196e-07, "time_sec": 49.677895069122314 }, { "epoch": 148, "train_loss": 1.55233530418396, "train_acc": 0.5624, "test_loss": 6.24937745513916, "test_acc": 0.0474, "lyapunov": null, "grad_norm": 0.643448067037432, "grad_max_sv": 0.22757547162473202, "grad_min_sv": 1.2111119601643239e-08, "grad_condition": 33967427.03926191, "lr": 4.38584950570808e-07, "time_sec": 49.623542070388794 }, { "epoch": 149, "train_loss": 1.5480224239730835, "train_acc": 0.5639, "test_loss": 6.394064616394043, "test_acc": 0.0438, "lyapunov": null, "grad_norm": 0.642149980505916, "grad_max_sv": 0.21981638856232166, "grad_min_sv": 1.1695069362070709e-08, "grad_condition": 254731993.0398627, "lr": 1.096582625772501e-07, "time_sec": 49.63520789146423 }, { "epoch": 150, "train_loss": 1.5609092629623413, "train_acc": 0.55828, "test_loss": 6.494824208068848, "test_acc": 0.042, "lyapunov": null, "grad_norm": 0.645124236315014, "grad_max_sv": 0.2247354317456484, "grad_min_sv": 1.2051133440466044e-08, "grad_condition": 35388252.370039664, "lr": 0.0, "time_sec": 49.63965940475464 } ], "16": [ { "epoch": 1, "train_loss": 5.089254416656495, "train_acc": 0.01344, "test_loss": 4.870831555175781, "test_acc": 0.01, "lyapunov": null, "grad_norm": 5.582063459208639, "grad_max_sv": 5.0306542873382565, "grad_min_sv": 8.441757832766683e-08, "grad_condition": 74707534.78681344, "lr": 0.0009998903417374227, "time_sec": 66.78056359291077 }, { "epoch": 2, "train_loss": 4.736304296569824, "train_acc": 0.02172, "test_loss": 4.92340059890747, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.087296772772229, "grad_max_sv": 3.672157108783722, "grad_min_sv": 6.109624839933935e-08, "grad_condition": 230714811.36310124, "lr": 0.0009995614150494292, "time_sec": 66.77934241294861 }, { "epoch": 3, "train_loss": 4.52685978515625, "train_acc": 0.03204, "test_loss": 5.045831031799317, "test_acc": 0.0094, "lyapunov": null, "grad_norm": 3.1470044543912175, "grad_max_sv": 2.6447540044784548, "grad_min_sv": 4.639755384339139e-08, "grad_condition": 65625701.84585605, "lr": 0.0009990133642141358, "time_sec": 66.76001167297363 }, { "epoch": 4, "train_loss": 4.371717319641113, "train_acc": 0.04112, "test_loss": 4.993129699707032, "test_acc": 0.0115, "lyapunov": null, "grad_norm": 2.5123688948843395, "grad_max_sv": 2.1027904629707335, "grad_min_sv": 3.615837387664633e-08, "grad_condition": 418817692.03399765, "lr": 0.0009982464296247522, "time_sec": 66.79424738883972 }, { "epoch": 5, "train_loss": 4.27407361251831, "train_acc": 0.0488, "test_loss": 5.161634465789795, "test_acc": 0.0119, "lyapunov": null, "grad_norm": 1.9573801826064445, "grad_max_sv": 1.613087645173073, "grad_min_sv": 2.8529539808364034e-08, "grad_condition": 62747668.20627429, "lr": 0.0009972609476841367, "time_sec": 66.81961727142334 }, { "epoch": 6, "train_loss": 4.183251854553222, "train_acc": 0.05812, "test_loss": 5.447854755401611, "test_acc": 0.0093, "lyapunov": null, "grad_norm": 1.436449079599314, "grad_max_sv": 1.0459295481443405, "grad_min_sv": 2.0654144772258576e-08, "grad_condition": 94732574.16372415, "lr": 0.000996057350657239, "time_sec": 66.73661756515503 }, { "epoch": 7, "train_loss": 4.103355536193848, "train_acc": 0.06872, "test_loss": 5.544150679016114, "test_acc": 0.0124, "lyapunov": null, "grad_norm": 1.082624040556548, "grad_max_sv": 0.678101472556591, "grad_min_sv": 1.6660088839048904e-08, "grad_condition": 49338508.46283151, "lr": 0.000994636166481494, "time_sec": 66.81501913070679 }, { "epoch": 8, "train_loss": 4.040529095458984, "train_acc": 0.07876, "test_loss": 5.577163777160645, "test_acc": 0.0172, "lyapunov": null, "grad_norm": 0.963869121683512, "grad_max_sv": 0.5578698106110096, "grad_min_sv": 1.4817374840991882e-08, "grad_condition": 46172185.25999212, "lr": 0.0009929980185352525, "time_sec": 66.78599071502686 }, { "epoch": 9, "train_loss": 3.999490645446777, "train_acc": 0.0856, "test_loss": 5.472281336975097, "test_acc": 0.0116, "lyapunov": null, "grad_norm": 0.9198022107734598, "grad_max_sv": 0.5003849364817142, "grad_min_sv": 1.3862486752946878e-08, "grad_condition": 137028895.09887612, "lr": 0.0009911436253643444, "time_sec": 66.77566862106323 }, { "epoch": 10, "train_loss": 3.9641557629394533, "train_acc": 0.09124, "test_loss": 5.43024553604126, "test_acc": 0.0112, "lyapunov": null, "grad_norm": 0.8539816540258655, "grad_max_sv": 0.4397390566766262, "grad_min_sv": 1.3177782898221579e-08, "grad_condition": 50953468.3517745, "lr": 0.0009890738003669028, "time_sec": 66.84108996391296 }, { "epoch": 11, "train_loss": 3.9142907052612306, "train_acc": 0.09788, "test_loss": 5.24972756652832, "test_acc": 0.0174, "lyapunov": null, "grad_norm": 0.8303589651826888, "grad_max_sv": 0.4246540553867817, "grad_min_sv": 1.288730961390705e-08, "grad_condition": 88294678.08247125, "lr": 0.00098678945143658, "time_sec": 66.87874603271484 }, { "epoch": 12, "train_loss": 3.881778168411255, "train_acc": 0.1037, "test_loss": 5.765969756317139, "test_acc": 0.0186, "lyapunov": null, "grad_norm": 0.7855031029198277, "grad_max_sv": 0.3756070680916309, "grad_min_sv": 1.2611303298881715e-08, "grad_condition": 36786532.210794725, "lr": 0.0009842915805643154, "time_sec": 66.82181406021118 }, { "epoch": 13, "train_loss": 3.8490214154815674, "train_acc": 0.1068, "test_loss": 5.832162282562256, "test_acc": 0.0138, "lyapunov": null, "grad_norm": 0.7681061932199776, "grad_max_sv": 0.3604050487279892, "grad_min_sv": 1.2243067453593382e-08, "grad_condition": 131143000.26933214, "lr": 0.000981581283398829, "time_sec": 66.72735929489136 }, { "epoch": 14, "train_loss": 3.828877674636841, "train_acc": 0.11234, "test_loss": 6.293205305480957, "test_acc": 0.0134, "lyapunov": null, "grad_norm": 0.7460407539013362, "grad_max_sv": 0.34510768875479697, "grad_min_sv": 1.1813573212726692e-08, "grad_condition": 49629148.15911349, "lr": 0.0009786597487660333, "time_sec": 66.80630326271057 }, { "epoch": 15, "train_loss": 3.803487832107544, "train_acc": 0.1159, "test_loss": 6.4087516273498535, "test_acc": 0.013, "lyapunov": null, "grad_norm": 0.716379034773642, "grad_max_sv": 0.3261814657598734, "grad_min_sv": 1.1572917107960378e-08, "grad_condition": 31644703.4401185, "lr": 0.0009755282581475766, "time_sec": 66.77157950401306 }, { "epoch": 16, "train_loss": 3.7804446031188963, "train_acc": 0.11974, "test_loss": 6.637075031280518, "test_acc": 0.0121, "lyapunov": null, "grad_norm": 0.696010315133547, "grad_max_sv": 0.3137427795678377, "grad_min_sv": 1.127850834219124e-08, "grad_condition": 69462833.27053933, "lr": 0.0009721881851187403, "time_sec": 66.79616379737854 }, { "epoch": 17, "train_loss": 3.752294116973877, "train_acc": 0.12396, "test_loss": 6.783492227935791, "test_acc": 0.0146, "lyapunov": null, "grad_norm": 0.6728326480937213, "grad_max_sv": 0.29628029987216, "grad_min_sv": 1.0862121784666057e-08, "grad_condition": 67951530.61721244, "lr": 0.0009686409947459456, "time_sec": 66.90411448478699 }, { "epoch": 18, "train_loss": 3.7320939672851563, "train_acc": 0.12876, "test_loss": 6.78950693283081, "test_acc": 0.0166, "lyapunov": null, "grad_norm": 0.6616867936990236, "grad_max_sv": 0.2953863974660635, "grad_min_sv": 1.095610695379251e-08, "grad_condition": 136390664.3535565, "lr": 0.0009648882429441254, "time_sec": 66.75479531288147 }, { "epoch": 19, "train_loss": 3.7112531086730955, "train_acc": 0.13056, "test_loss": 6.585515812683106, "test_acc": 0.0163, "lyapunov": null, "grad_norm": 0.6494124624609345, "grad_max_sv": 0.2933062981814146, "grad_min_sv": 1.0763416760650734e-08, "grad_condition": 31017442.193528943, "lr": 0.00096093157579425, "time_sec": 66.74547505378723 }, { "epoch": 20, "train_loss": 3.6964602882385256, "train_acc": 0.13444, "test_loss": 6.817514788818359, "test_acc": 0.0125, "lyapunov": null, "grad_norm": 0.6419428954986147, "grad_max_sv": 0.28524503484368324, "grad_min_sv": 1.07556832606992e-08, "grad_condition": 29053863.493932776, "lr": 0.0009567727288213001, "time_sec": 66.75940012931824 }, { "epoch": 21, "train_loss": 3.6749328507995607, "train_acc": 0.13862, "test_loss": 6.693168528747559, "test_acc": 0.0132, "lyapunov": null, "grad_norm": 0.6273897945446711, "grad_max_sv": 0.27434321865439415, "grad_min_sv": 1.0629087081326371e-08, "grad_condition": 34272866.07000697, "lr": 0.0009524135262330095, "time_sec": 66.76537322998047 }, { "epoch": 22, "train_loss": 3.6651853931427003, "train_acc": 0.13714, "test_loss": 7.5128926712036135, "test_acc": 0.0145, "lyapunov": null, "grad_norm": 0.6127571430728127, "grad_max_sv": 0.2585024815052748, "grad_min_sv": 9.990007998617045e-09, "grad_condition": 29464610.145040773, "lr": 0.0009478558801197061, "time_sec": 66.88315868377686 }, { "epoch": 23, "train_loss": 3.6479580931091307, "train_acc": 0.14048, "test_loss": 7.259157413482666, "test_acc": 0.013, "lyapunov": null, "grad_norm": 0.6101108448302026, "grad_max_sv": 0.26707915738224985, "grad_min_sv": 1.0416663243084657e-08, "grad_condition": 44782214.320293196, "lr": 0.000943101789615607, "time_sec": 66.73595952987671 }, { "epoch": 24, "train_loss": 3.630135404510498, "train_acc": 0.14444, "test_loss": 6.769294599151611, "test_acc": 0.0187, "lyapunov": null, "grad_norm": 0.5973985296812159, "grad_max_sv": 0.25335801765322685, "grad_min_sv": 9.992184554080685e-09, "grad_condition": 42939810.102056004, "lr": 0.0009381533400219313, "time_sec": 66.83198976516724 }, { "epoch": 25, "train_loss": 3.6139439612579345, "train_acc": 0.14892, "test_loss": 6.755159613037109, "test_acc": 0.0168, "lyapunov": null, "grad_norm": 0.5830251618606708, "grad_max_sv": 0.2401360861957073, "grad_min_sv": 9.682792681542374e-09, "grad_condition": 104126991.37138663, "lr": 0.0009330127018922189, "time_sec": 66.7968385219574 }, { "epoch": 26, "train_loss": 3.5970758290100098, "train_acc": 0.14988, "test_loss": 6.900474179840088, "test_acc": 0.0154, "lyapunov": null, "grad_norm": 0.5787074408614666, "grad_max_sv": 0.23566974550485612, "grad_min_sv": 9.719574232958105e-09, "grad_condition": 38538660.37346102, "lr": 0.000927682130080253, "time_sec": 66.79184246063232 }, { "epoch": 27, "train_loss": 3.5895483708190916, "train_acc": 0.1518, "test_loss": 6.669962855529785, "test_acc": 0.0167, "lyapunov": null, "grad_norm": 0.5803094423675084, "grad_max_sv": 0.2358210153877735, "grad_min_sv": 9.626696496206621e-09, "grad_condition": 193890246.2613204, "lr": 0.0009221639627510072, "time_sec": 66.7768383026123 }, { "epoch": 28, "train_loss": 3.5726418092346193, "train_acc": 0.15258, "test_loss": 7.085537405395508, "test_acc": 0.0168, "lyapunov": null, "grad_norm": 0.570193330921248, "grad_max_sv": 0.23036426715552807, "grad_min_sv": 9.589828041736691e-09, "grad_condition": 89352936.15952519, "lr": 0.0009164606203550494, "time_sec": 66.79721999168396 }, { "epoch": 29, "train_loss": 3.5572311797332765, "train_acc": 0.15608, "test_loss": 6.67531994934082, "test_acc": 0.0189, "lyapunov": null, "grad_norm": 0.5675152442756493, "grad_max_sv": 0.22562474496662616, "grad_min_sv": 9.685276963766754e-09, "grad_condition": 25178417.23491483, "lr": 0.0009105746045668516, "time_sec": 66.85751271247864 }, { "epoch": 30, "train_loss": 3.548038801879883, "train_acc": 0.15748, "test_loss": 6.45415048828125, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.5621117218085827, "grad_max_sv": 0.222617195174098, "grad_min_sv": 9.435066891660959e-09, "grad_condition": 26340041.97866543, "lr": 0.0009045084971874733, "time_sec": 66.79050874710083 }, { "epoch": 31, "train_loss": 3.5402868547058106, "train_acc": 0.16092, "test_loss": 6.451704531860352, "test_acc": 0.0227, "lyapunov": null, "grad_norm": 0.5521957030096883, "grad_max_sv": 0.22002805732190608, "grad_min_sv": 9.47574586573907e-09, "grad_condition": 26149277.514949474, "lr": 0.0008982649590120977, "time_sec": 66.78902292251587 }, { "epoch": 32, "train_loss": 3.5309471380615234, "train_acc": 0.16198, "test_loss": 6.8702184638977055, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.5464579230817538, "grad_max_sv": 0.21435559950768948, "grad_min_sv": 9.215979125329344e-09, "grad_condition": 59638036.88956574, "lr": 0.0008918467286629196, "time_sec": 66.78767824172974 }, { "epoch": 33, "train_loss": 3.5130342961120604, "train_acc": 0.16284, "test_loss": 7.181190188598633, "test_acc": 0.0173, "lyapunov": null, "grad_norm": 0.5437244358450883, "grad_max_sv": 0.22251709625124932, "grad_min_sv": 9.34404511543363e-09, "grad_condition": 28699663.06993841, "lr": 0.0008852566213878943, "time_sec": 66.71953392028809 }, { "epoch": 34, "train_loss": 3.51255979675293, "train_acc": 0.16636, "test_loss": 7.333110241699218, "test_acc": 0.0181, "lyapunov": null, "grad_norm": 0.5393640775064226, "grad_max_sv": 0.20921555384993554, "grad_min_sv": 9.167450806812916e-09, "grad_condition": 25706901.28825941, "lr": 0.000878497527825878, "time_sec": 66.7765941619873 }, { "epoch": 35, "train_loss": 3.4977930699157715, "train_acc": 0.16716, "test_loss": 7.278058241271973, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 0.5438001473750539, "grad_max_sv": 0.20897603183984756, "grad_min_sv": 9.184564683795137e-09, "grad_condition": 34997969.65153339, "lr": 0.000871572412738697, "time_sec": 66.78994917869568 }, { "epoch": 36, "train_loss": 3.4839546405029296, "train_acc": 0.17056, "test_loss": 6.461000657653808, "test_acc": 0.0224, "lyapunov": null, "grad_norm": 0.5343462863238121, "grad_max_sv": 0.20449809469282626, "grad_min_sv": 9.16483587076744e-09, "grad_condition": 24381579.447592642, "lr": 0.0008644843137107055, "time_sec": 66.78629851341248 }, { "epoch": 37, "train_loss": 3.473933819503784, "train_acc": 0.16984, "test_loss": 6.470654428100586, "test_acc": 0.0179, "lyapunov": null, "grad_norm": 0.5324136173248342, "grad_max_sv": 0.20008243359625338, "grad_min_sv": 9.049705299718491e-09, "grad_condition": 34636922.167240486, "lr": 0.0008572363398164014, "time_sec": 66.79992747306824 }, { "epoch": 38, "train_loss": 3.4661802910614012, "train_acc": 0.17092, "test_loss": 6.690065528869629, "test_acc": 0.0169, "lyapunov": null, "grad_norm": 0.5281123151657661, "grad_max_sv": 0.20084053687751294, "grad_min_sv": 8.970145487507963e-09, "grad_condition": 26480283.34014668, "lr": 0.0008498316702566826, "time_sec": 66.92348313331604 }, { "epoch": 39, "train_loss": 3.4540661865997313, "train_acc": 0.17118, "test_loss": 6.078438919830322, "test_acc": 0.0211, "lyapunov": null, "grad_norm": 0.5227451103728683, "grad_max_sv": 0.1980721667408943, "grad_min_sv": 8.970438091903537e-09, "grad_condition": 149441951.98208869, "lr": 0.0008422735529643442, "time_sec": 66.80566644668579 }, { "epoch": 40, "train_loss": 3.439123515701294, "train_acc": 0.17768, "test_loss": 6.255719974517822, "test_acc": 0.0246, "lyapunov": null, "grad_norm": 0.5238902894663456, "grad_max_sv": 0.2012732930481434, "grad_min_sv": 8.989019251171015e-09, "grad_condition": 26996532.399999082, "lr": 0.0008345653031794289, "time_sec": 66.78863906860352 }, { "epoch": 41, "train_loss": 3.4350976667022706, "train_acc": 0.17682, "test_loss": 5.942692041015625, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.5230791130306572, "grad_max_sv": 0.19939371161162853, "grad_min_sv": 9.040618726557925e-09, "grad_condition": 35747119.67190552, "lr": 0.0008267103019950526, "time_sec": 66.78709435462952 }, { "epoch": 42, "train_loss": 3.4243579791259764, "train_acc": 0.17844, "test_loss": 6.007703511047363, "test_acc": 0.0262, "lyapunov": null, "grad_norm": 0.517545208070228, "grad_max_sv": 0.1922302544116974, "grad_min_sv": 8.860449580982976e-09, "grad_condition": 30602577.279376544, "lr": 0.0008187119948743447, "time_sec": 66.81675243377686 }, { "epoch": 43, "train_loss": 3.41020792137146, "train_acc": 0.1805, "test_loss": 6.532727696228028, "test_acc": 0.0201, "lyapunov": null, "grad_norm": 0.5184771014750174, "grad_max_sv": 0.1960398443043232, "grad_min_sv": 9.042896009781032e-09, "grad_condition": 109678067.45442054, "lr": 0.000810573890139155, "time_sec": 66.88858389854431 }, { "epoch": 44, "train_loss": 3.407023912811279, "train_acc": 0.18096, "test_loss": 6.134778085327149, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 0.5141850532973719, "grad_max_sv": 0.18923728726804256, "grad_min_sv": 9.02819977631475e-09, "grad_condition": 100774753.52111238, "lr": 0.0008022995574311873, "time_sec": 66.80017518997192 }, { "epoch": 45, "train_loss": 3.395647827911377, "train_acc": 0.1839, "test_loss": 6.376823687744141, "test_acc": 0.0222, "lyapunov": null, "grad_norm": 0.5126811791455754, "grad_max_sv": 0.18771996162831783, "grad_min_sv": 9.025198291837122e-09, "grad_condition": 44468339.93349115, "lr": 0.0007938926261462363, "time_sec": 66.7608630657196 }, { "epoch": 46, "train_loss": 3.3928714478302, "train_acc": 0.18238, "test_loss": 6.053843517303466, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5084041434605487, "grad_max_sv": 0.1855287253856659, "grad_min_sv": 8.774856632975947e-09, "grad_condition": 31787391.609472472, "lr": 0.0007853567838422158, "time_sec": 66.74166297912598 }, { "epoch": 47, "train_loss": 3.379834383621216, "train_acc": 0.18724, "test_loss": 6.8861193962097165, "test_acc": 0.0191, "lyapunov": null, "grad_norm": 0.5060633641106507, "grad_max_sv": 0.1826419185847044, "grad_min_sv": 8.790497434824073e-09, "grad_condition": 34120677.482305124, "lr": 0.0007766957746216719, "time_sec": 66.7685010433197 }, { "epoch": 48, "train_loss": 3.374839401092529, "train_acc": 0.1861, "test_loss": 5.864614242553711, "test_acc": 0.0184, "lyapunov": null, "grad_norm": 0.5042105096702133, "grad_max_sv": 0.18606598749756814, "grad_min_sv": 8.831608784565237e-09, "grad_condition": 28878813.551795878, "lr": 0.0007679133974894982, "time_sec": 66.80099678039551 }, { "epoch": 49, "train_loss": 3.3662559477996825, "train_acc": 0.1887, "test_loss": 6.230384608459473, "test_acc": 0.0213, "lyapunov": null, "grad_norm": 0.5036215455963197, "grad_max_sv": 0.19020347222685813, "grad_min_sv": 8.961205007554373e-09, "grad_condition": 47201312.24723457, "lr": 0.000759013504686565, "time_sec": 66.75482654571533 }, { "epoch": 50, "train_loss": 3.360496557159424, "train_acc": 0.18832, "test_loss": 6.6197496559143065, "test_acc": 0.0224, "lyapunov": null, "grad_norm": 0.5042398036515723, "grad_max_sv": 0.1836124774068594, "grad_min_sv": 8.934804758553572e-09, "grad_condition": 69600275.62778898, "lr": 0.0007499999999999998, "time_sec": 66.77506113052368 }, { "epoch": 51, "train_loss": 3.350079543914795, "train_acc": 0.1919, "test_loss": 6.343868575286865, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5043278001350275, "grad_max_sv": 0.1825037430971861, "grad_min_sv": 8.887193922446634e-09, "grad_condition": 30024861.754817694, "lr": 0.0007408768370508575, "time_sec": 66.72825312614441 }, { "epoch": 52, "train_loss": 3.3426339905548095, "train_acc": 0.1928, "test_loss": 7.225718658447265, "test_acc": 0.0199, "lyapunov": null, "grad_norm": 0.50252992009141, "grad_max_sv": 0.17567641101777554, "grad_min_sv": 8.804220427770064e-09, "grad_condition": 740966766.3274126, "lr": 0.0007316480175599307, "time_sec": 66.72319173812866 }, { "epoch": 53, "train_loss": 3.3341299864959715, "train_acc": 0.1933, "test_loss": 6.803897232055664, "test_acc": 0.0206, "lyapunov": null, "grad_norm": 0.5011496244728447, "grad_max_sv": 0.17870272882282734, "grad_min_sv": 8.831609968340536e-09, "grad_condition": 22412356.279497318, "lr": 0.0007223175895924635, "time_sec": 66.7704975605011 }, { "epoch": 54, "train_loss": 3.3261182179260254, "train_acc": 0.19572, "test_loss": 6.764497369384766, "test_acc": 0.028, "lyapunov": null, "grad_norm": 0.4979381618436104, "grad_max_sv": 0.1770651936531067, "grad_min_sv": 8.860568483093357e-09, "grad_condition": 25306461.91969143, "lr": 0.0007128896457825361, "time_sec": 66.77421927452087 }, { "epoch": 55, "train_loss": 3.316899408569336, "train_acc": 0.196, "test_loss": 6.540015605163574, "test_acc": 0.024, "lyapunov": null, "grad_norm": 0.4977367964912547, "grad_max_sv": 0.17745399177074433, "grad_min_sv": 8.913811780364434e-09, "grad_condition": 22903051.94229058, "lr": 0.0007033683215378998, "time_sec": 66.79190754890442 }, { "epoch": 56, "train_loss": 3.310275382003784, "train_acc": 0.19632, "test_loss": 6.745750244140625, "test_acc": 0.0197, "lyapunov": null, "grad_norm": 0.4988650354422387, "grad_max_sv": 0.17153157331049443, "grad_min_sv": 8.749649851869101e-09, "grad_condition": 22030625.492303018, "lr": 0.0006937577932260512, "time_sec": 66.7638955116272 }, { "epoch": 57, "train_loss": 3.290559967803955, "train_acc": 0.20002, "test_loss": 6.366741171264648, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.4982910029946987, "grad_max_sv": 0.17201930955052375, "grad_min_sv": 8.79568313487053e-09, "grad_condition": 151885613.93341595, "lr": 0.0006840622763423388, "time_sec": 66.78560328483582 }, { "epoch": 58, "train_loss": 3.2923309088134767, "train_acc": 0.20166, "test_loss": 6.417476829528809, "test_acc": 0.0246, "lyapunov": null, "grad_norm": 0.49889716140548146, "grad_max_sv": 0.17567893117666245, "grad_min_sv": 8.913143439981397e-09, "grad_condition": 24256220.95115678, "lr": 0.0006742860236609073, "time_sec": 66.843590259552 }, { "epoch": 59, "train_loss": 3.2908721295928953, "train_acc": 0.19948, "test_loss": 6.640488920593262, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.49266049285108265, "grad_max_sv": 0.17507032714784146, "grad_min_sv": 8.739878155916703e-09, "grad_condition": 26595294.449066617, "lr": 0.0006644333233692913, "time_sec": 66.74992251396179 }, { "epoch": 60, "train_loss": 3.284796617889404, "train_acc": 0.2013, "test_loss": 6.291868576049804, "test_acc": 0.0273, "lyapunov": null, "grad_norm": 0.49223922966029576, "grad_max_sv": 0.17198019847273827, "grad_min_sv": 8.672205609183693e-09, "grad_condition": 22947196.39326378, "lr": 0.0006545084971874734, "time_sec": 66.7844717502594 }, { "epoch": 61, "train_loss": 3.2731484245300293, "train_acc": 0.20498, "test_loss": 6.035749476623535, "test_acc": 0.0304, "lyapunov": null, "grad_norm": 0.49100354548098263, "grad_max_sv": 0.1670747336000204, "grad_min_sv": 8.751909007925774e-09, "grad_condition": 38402617.820078045, "lr": 0.0006445158984722354, "time_sec": 66.78787755966187 }, { "epoch": 62, "train_loss": 3.2566023439025877, "train_acc": 0.20938, "test_loss": 6.511487716674805, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.4914300539125354, "grad_max_sv": 0.16597167886793612, "grad_min_sv": 8.786484798073424e-09, "grad_condition": 21670471.110839043, "lr": 0.0006344599103076324, "time_sec": 66.70972204208374 }, { "epoch": 63, "train_loss": 3.2568167697143555, "train_acc": 0.20498, "test_loss": 6.652309313964844, "test_acc": 0.0253, "lyapunov": null, "grad_norm": 0.4918024874902063, "grad_max_sv": 0.16560027711093425, "grad_min_sv": 8.785258739235635e-09, "grad_condition": 71694500.46039832, "lr": 0.0006243449435824269, "time_sec": 66.82298398017883 }, { "epoch": 64, "train_loss": 3.2456203374481203, "train_acc": 0.20808, "test_loss": 6.344074755859375, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.49095369226258845, "grad_max_sv": 0.1667012270539999, "grad_min_sv": 8.78574491491868e-09, "grad_condition": 23075446.134346228, "lr": 0.0006141754350553275, "time_sec": 66.78016519546509 }, { "epoch": 65, "train_loss": 3.236674240646362, "train_acc": 0.21152, "test_loss": 6.2899073806762695, "test_acc": 0.0224, "lyapunov": null, "grad_norm": 0.4921779891011333, "grad_max_sv": 0.1677238956093788, "grad_min_sv": 8.828472619626382e-09, "grad_condition": 22441240.736154817, "lr": 0.0006039558454088793, "time_sec": 66.85806608200073 }, { "epoch": 66, "train_loss": 3.22965085647583, "train_acc": 0.2126, "test_loss": 6.429703979492188, "test_acc": 0.0282, "lyapunov": null, "grad_norm": 0.4881811720746172, "grad_max_sv": 0.164219119399786, "grad_min_sv": 8.673666965219873e-09, "grad_condition": 21892913.98496552, "lr": 0.000593690657292862, "time_sec": 66.78576803207397 }, { "epoch": 67, "train_loss": 3.224384484176636, "train_acc": 0.21134, "test_loss": 6.922704602050781, "test_acc": 0.0234, "lyapunov": null, "grad_norm": 0.48741557028554877, "grad_max_sv": 0.16480680033564568, "grad_min_sv": 8.729063946666394e-09, "grad_condition": 23200356.121009313, "lr": 0.0005833843733580507, "time_sec": 66.77217102050781 }, { "epoch": 68, "train_loss": 3.2157058325195313, "train_acc": 0.21262, "test_loss": 6.7681282539367675, "test_acc": 0.0231, "lyapunov": null, "grad_norm": 0.493681050551615, "grad_max_sv": 0.16986403651535512, "grad_min_sv": 8.815265072070754e-09, "grad_condition": 29441294.083651233, "lr": 0.0005730415142812054, "time_sec": 66.77236366271973 }, { "epoch": 69, "train_loss": 3.210006919326782, "train_acc": 0.21728, "test_loss": 6.470967771148682, "test_acc": 0.0254, "lyapunov": null, "grad_norm": 0.4878926422472019, "grad_max_sv": 0.1638301569968462, "grad_min_sv": 8.75584678441954e-09, "grad_condition": 52016652.85495178, "lr": 0.0005626666167821517, "time_sec": 66.80931973457336 }, { "epoch": 70, "train_loss": 3.196190078125, "train_acc": 0.21792, "test_loss": 5.951667370605469, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.48950735034118803, "grad_max_sv": 0.16142398156225682, "grad_min_sv": 8.815271614059927e-09, "grad_condition": 24483281.259911567, "lr": 0.0005522642316338265, "time_sec": 66.77829360961914 }, { "epoch": 71, "train_loss": 3.2064027897644043, "train_acc": 0.21506, "test_loss": 6.750360327148438, "test_acc": 0.0227, "lyapunov": null, "grad_norm": 0.4871695073962276, "grad_max_sv": 0.16285001635551452, "grad_min_sv": 8.758729140578848e-09, "grad_condition": 23565681.777415752, "lr": 0.0005418389216661573, "time_sec": 66.78215885162354 }, { "epoch": 72, "train_loss": 3.1924329637908935, "train_acc": 0.21822, "test_loss": 6.714482778167724, "test_acc": 0.025, "lyapunov": null, "grad_norm": 0.48778155896125935, "grad_max_sv": 0.1631274577230215, "grad_min_sv": 8.720527765009033e-09, "grad_condition": 63496326.10433636, "lr": 0.0005313952597646563, "time_sec": 66.8333637714386 }, { "epoch": 73, "train_loss": 3.188364574279785, "train_acc": 0.2196, "test_loss": 7.193912121582032, "test_acc": 0.0213, "lyapunov": null, "grad_norm": 0.4880279755205525, "grad_max_sv": 0.1620686575770378, "grad_min_sv": 8.740592850886574e-09, "grad_condition": 27935085.988161374, "lr": 0.0005209378268645994, "time_sec": 66.71236157417297 }, { "epoch": 74, "train_loss": 3.1774999662780763, "train_acc": 0.22036, "test_loss": 6.498540209960938, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.48663554748850196, "grad_max_sv": 0.16149300280958415, "grad_min_sv": 8.688670802628472e-09, "grad_condition": 102102915.61516626, "lr": 0.0005104712099416781, "time_sec": 66.7784776687622 }, { "epoch": 75, "train_loss": 3.1686367027282714, "train_acc": 0.22206, "test_loss": 7.174583370971679, "test_acc": 0.0209, "lyapunov": null, "grad_norm": 0.48682394841302745, "grad_max_sv": 0.16311258710920812, "grad_min_sv": 8.786071105382209e-09, "grad_condition": 24724999.404770423, "lr": 0.0004999999999999996, "time_sec": 66.76251482963562 }, { "epoch": 76, "train_loss": 3.1639041161346437, "train_acc": 0.225, "test_loss": 7.478772677612305, "test_acc": 0.0197, "lyapunov": null, "grad_norm": 0.49049069180345295, "grad_max_sv": 0.16360066644847393, "grad_min_sv": 8.74060119004927e-09, "grad_condition": 24496844.849027783, "lr": 0.0004895287900583212, "time_sec": 66.72801065444946 }, { "epoch": 77, "train_loss": 3.154632388381958, "train_acc": 0.22396, "test_loss": 6.57794190826416, "test_acc": 0.0277, "lyapunov": null, "grad_norm": 0.4868448729214284, "grad_max_sv": 0.1649958923459053, "grad_min_sv": 8.840505302809554e-09, "grad_condition": 21095789.830121905, "lr": 0.0004790621731353997, "time_sec": 66.73516988754272 }, { "epoch": 78, "train_loss": 3.1528517010498045, "train_acc": 0.22312, "test_loss": 7.1080197311401365, "test_acc": 0.0217, "lyapunov": null, "grad_norm": 0.4887319331046421, "grad_max_sv": 0.1634005270898342, "grad_min_sv": 8.874131324221323e-09, "grad_condition": 20245229.779506456, "lr": 0.000468604740235343, "time_sec": 66.71177268028259 }, { "epoch": 79, "train_loss": 3.1432092308807373, "train_acc": 0.229, "test_loss": 7.214095246887207, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.48838038818221724, "grad_max_sv": 0.16252909004688262, "grad_min_sv": 8.819199073806239e-09, "grad_condition": 26520623.470668785, "lr": 0.00045816107833384175, "time_sec": 66.7255470752716 }, { "epoch": 80, "train_loss": 3.1343304455566408, "train_acc": 0.22744, "test_loss": 6.940009968566894, "test_acc": 0.0255, "lyapunov": null, "grad_norm": 0.48846815734372934, "grad_max_sv": 0.1635790452361107, "grad_min_sv": 8.798821884981045e-09, "grad_condition": 21131375.648625843, "lr": 0.0004477357683661729, "time_sec": 66.72595143318176 }, { "epoch": 81, "train_loss": 3.1298222771453856, "train_acc": 0.22642, "test_loss": 7.29024638671875, "test_acc": 0.0259, "lyapunov": null, "grad_norm": 0.49086957943567056, "grad_max_sv": 0.15947132408618928, "grad_min_sv": 8.788132586923236e-09, "grad_condition": 28060653.55060955, "lr": 0.00043733338321784746, "time_sec": 66.77222657203674 }, { "epoch": 82, "train_loss": 3.117735626373291, "train_acc": 0.23038, "test_loss": 6.9144718528747555, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.49138593312101014, "grad_max_sv": 0.159454994648695, "grad_min_sv": 8.759537291390742e-09, "grad_condition": 308046195.23178655, "lr": 0.0004269584857187939, "time_sec": 66.75987410545349 }, { "epoch": 83, "train_loss": 3.1175857275390624, "train_acc": 0.23194, "test_loss": 6.706077085876465, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.4924089866784705, "grad_max_sv": 0.16311928667128087, "grad_min_sv": 8.90124301697326e-09, "grad_condition": 32153498.186816484, "lr": 0.0004166156266419484, "time_sec": 66.74847078323364 }, { "epoch": 84, "train_loss": 3.1045476649475097, "train_acc": 0.23228, "test_loss": 6.154573769378662, "test_acc": 0.0282, "lyapunov": null, "grad_norm": 0.49118329484452294, "grad_max_sv": 0.16205354779958725, "grad_min_sv": 8.760578144861864e-09, "grad_condition": 52646848.44888155, "lr": 0.0004063093427071373, "time_sec": 66.74011945724487 }, { "epoch": 85, "train_loss": 3.1078517518615723, "train_acc": 0.2344, "test_loss": 6.530753035736084, "test_acc": 0.0282, "lyapunov": null, "grad_norm": 0.4904367995984335, "grad_max_sv": 0.161368178576231, "grad_min_sv": 8.888137861817746e-09, "grad_condition": 21303276.13293609, "lr": 0.0003960441545911199, "time_sec": 66.72609543800354 }, { "epoch": 86, "train_loss": 3.0952324195861816, "train_acc": 0.23368, "test_loss": 6.240639804077149, "test_acc": 0.0308, "lyapunov": null, "grad_norm": 0.49428635963779644, "grad_max_sv": 0.15839767456054688, "grad_min_sv": 8.964046511322766e-09, "grad_condition": 28785588.134401, "lr": 0.0003858245649446718, "time_sec": 66.74975419044495 }, { "epoch": 87, "train_loss": 3.0952587001037597, "train_acc": 0.23356, "test_loss": 6.628809076690674, "test_acc": 0.0322, "lyapunov": null, "grad_norm": 0.49144116518393927, "grad_max_sv": 0.16221071667969228, "grad_min_sv": 8.962699898917847e-09, "grad_condition": 20571826.020635325, "lr": 0.00037565505641757235, "time_sec": 66.7199854850769 }, { "epoch": 88, "train_loss": 3.0922299211120605, "train_acc": 0.2344, "test_loss": 6.5014627777099605, "test_acc": 0.0295, "lyapunov": null, "grad_norm": 0.49360674992051745, "grad_max_sv": 0.1644837912172079, "grad_min_sv": 8.975622673573769e-09, "grad_condition": 28771115.174499214, "lr": 0.00036554008969236695, "time_sec": 66.74195861816406 }, { "epoch": 89, "train_loss": 3.0761431072235106, "train_acc": 0.23966, "test_loss": 7.287914637756348, "test_acc": 0.0263, "lyapunov": null, "grad_norm": 0.4909525286245839, "grad_max_sv": 0.16159643046557903, "grad_min_sv": 8.858207814488317e-09, "grad_condition": 22425426.033500116, "lr": 0.0003554841015277638, "time_sec": 66.68954610824585 }, { "epoch": 90, "train_loss": 3.0747881409454347, "train_acc": 0.2377, "test_loss": 7.193168222808838, "test_acc": 0.0262, "lyapunov": null, "grad_norm": 0.4911854264861308, "grad_max_sv": 0.1574687145650387, "grad_min_sv": 8.917724771215912e-09, "grad_condition": 118300212.93482408, "lr": 0.000345491502812526, "time_sec": 66.77580857276917 }, { "epoch": 91, "train_loss": 3.070805363311768, "train_acc": 0.23994, "test_loss": 6.052177616882324, "test_acc": 0.0304, "lyapunov": null, "grad_norm": 0.49339922868661756, "grad_max_sv": 0.1602653257548809, "grad_min_sv": 8.95202442799392e-09, "grad_condition": 44017380.37680817, "lr": 0.0003355666766307081, "time_sec": 66.69368362426758 }, { "epoch": 92, "train_loss": 3.0647792414855957, "train_acc": 0.23982, "test_loss": 6.179595366668702, "test_acc": 0.0301, "lyapunov": null, "grad_norm": 0.4931917462731246, "grad_max_sv": 0.1606559857726097, "grad_min_sv": 9.0662935353647e-09, "grad_condition": 19908430.164367903, "lr": 0.00032571397633909225, "time_sec": 66.70123243331909 }, { "epoch": 93, "train_loss": 3.0550636367034913, "train_acc": 0.2422, "test_loss": 6.34838355255127, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.49186583360988956, "grad_max_sv": 0.1579043295234442, "grad_min_sv": 8.987567995388801e-09, "grad_condition": 22006714.29709431, "lr": 0.00031593772365766094, "time_sec": 66.71771335601807 }, { "epoch": 94, "train_loss": 3.043202466583252, "train_acc": 0.24232, "test_loss": 6.682511094665528, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.4962595942491337, "grad_max_sv": 0.1622728668153286, "grad_min_sv": 9.030461697867587e-09, "grad_condition": 30360701.35233465, "lr": 0.0003062422067739483, "time_sec": 66.82941317558289 }, { "epoch": 95, "train_loss": 3.0412676640319822, "train_acc": 0.2447, "test_loss": 6.22475659866333, "test_acc": 0.0318, "lyapunov": null, "grad_norm": 0.4915093368948821, "grad_max_sv": 0.15892955474555492, "grad_min_sv": 8.946618996336086e-09, "grad_condition": 69026491.3661272, "lr": 0.00029663167846209965, "time_sec": 66.73191213607788 }, { "epoch": 96, "train_loss": 3.0352964888000487, "train_acc": 0.2471, "test_loss": 6.5577602828979495, "test_acc": 0.0293, "lyapunov": null, "grad_norm": 0.49248702226826524, "grad_max_sv": 0.1611651573330164, "grad_min_sv": 8.952907482040472e-09, "grad_condition": 31830348.776786767, "lr": 0.00028711035421746345, "time_sec": 66.75891017913818 }, { "epoch": 97, "train_loss": 3.029721915130615, "train_acc": 0.24842, "test_loss": 6.651570160675049, "test_acc": 0.0289, "lyapunov": null, "grad_norm": 0.4943874310747337, "grad_max_sv": 0.1606567233800888, "grad_min_sv": 9.076670715035818e-09, "grad_condition": 36874515.58106691, "lr": 0.00027768241040753615, "time_sec": 66.74775719642639 }, { "epoch": 98, "train_loss": 3.0293620677948, "train_acc": 0.24548, "test_loss": 6.7938948928833005, "test_acc": 0.0291, "lyapunov": null, "grad_norm": 0.4970218817533374, "grad_max_sv": 0.15979058742523194, "grad_min_sv": 9.025258917993995e-09, "grad_condition": 21461503.719760668, "lr": 0.00026835198244006903, "time_sec": 66.71226525306702 }, { "epoch": 99, "train_loss": 3.0232276085662844, "train_acc": 0.24992, "test_loss": 6.842255628967285, "test_acc": 0.0287, "lyapunov": null, "grad_norm": 0.4964386837271484, "grad_max_sv": 0.16297372654080391, "grad_min_sv": 9.074463314107107e-09, "grad_condition": 38263953.83433555, "lr": 0.0002591231629491421, "time_sec": 66.73949241638184 }, { "epoch": 100, "train_loss": 3.0220013402557373, "train_acc": 0.24942, "test_loss": 7.044534214782715, "test_acc": 0.0264, "lyapunov": null, "grad_norm": 0.4963097153496672, "grad_max_sv": 0.1608368031680584, "grad_min_sv": 8.999894975450506e-09, "grad_condition": 41372527.951466024, "lr": 0.0002499999999999997, "time_sec": 66.77927494049072 }, { "epoch": 101, "train_loss": 3.0203451880645753, "train_acc": 0.2487, "test_loss": 6.837228249359131, "test_acc": 0.0287, "lyapunov": null, "grad_norm": 0.49771273059241083, "grad_max_sv": 0.16355772241950034, "grad_min_sv": 9.09030489493201e-09, "grad_condition": 21122520.470805176, "lr": 0.00024098649531343477, "time_sec": 66.73630166053772 }, { "epoch": 102, "train_loss": 3.0023662061309815, "train_acc": 0.2517, "test_loss": 7.122745419311523, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.4990559135673985, "grad_max_sv": 0.16072520166635512, "grad_min_sv": 9.129048311740107e-09, "grad_condition": 20645009.356589716, "lr": 0.0002320866025105016, "time_sec": 66.75698280334473 }, { "epoch": 103, "train_loss": 2.998011736526489, "train_acc": 0.25374, "test_loss": 7.035623414611816, "test_acc": 0.0277, "lyapunov": null, "grad_norm": 0.49574085619625, "grad_max_sv": 0.15668718423694372, "grad_min_sv": 9.148743505132951e-09, "grad_condition": 33626359.10658366, "lr": 0.0002233042253783278, "time_sec": 66.75562310218811 }, { "epoch": 104, "train_loss": 2.997530387496948, "train_acc": 0.25132, "test_loss": 6.999302207946777, "test_acc": 0.0292, "lyapunov": null, "grad_norm": 0.5002716771455139, "grad_max_sv": 0.16238998733460902, "grad_min_sv": 9.078950441443468e-09, "grad_condition": 20349177.478017032, "lr": 0.000214643216157784, "time_sec": 66.79467344284058 }, { "epoch": 105, "train_loss": 2.9906964135742187, "train_acc": 0.25506, "test_loss": 7.1786759597778325, "test_acc": 0.0273, "lyapunov": null, "grad_norm": 0.4946350333441307, "grad_max_sv": 0.1600412342697382, "grad_min_sv": 9.088851333008408e-09, "grad_condition": 57224884.57519225, "lr": 0.00020610737385376332, "time_sec": 66.74862432479858 }, { "epoch": 106, "train_loss": 2.984202498321533, "train_acc": 0.25656, "test_loss": 7.172381106567383, "test_acc": 0.0269, "lyapunov": null, "grad_norm": 0.4982362018645274, "grad_max_sv": 0.1571014266461134, "grad_min_sv": 9.054493026183775e-09, "grad_condition": 22960817.2493112, "lr": 0.00019770044256881242, "time_sec": 66.77469301223755 }, { "epoch": 107, "train_loss": 2.975272487335205, "train_acc": 0.25552, "test_loss": 7.0334813690185545, "test_acc": 0.0316, "lyapunov": null, "grad_norm": 0.49588396234922755, "grad_max_sv": 0.16075790040194987, "grad_min_sv": 9.117187717289087e-09, "grad_condition": 22400105.746660806, "lr": 0.0001894261098608447, "time_sec": 66.76792025566101 }, { "epoch": 108, "train_loss": 2.9756462240600587, "train_acc": 0.25536, "test_loss": 7.59121438293457, "test_acc": 0.0288, "lyapunov": null, "grad_norm": 0.4971626921836716, "grad_max_sv": 0.15787492766976358, "grad_min_sv": 9.170698456424448e-09, "grad_condition": 2842260093.4746685, "lr": 0.000181288005125655, "time_sec": 66.72157907485962 }, { "epoch": 109, "train_loss": 2.9735143406677245, "train_acc": 0.25872, "test_loss": 6.839995979309082, "test_acc": 0.0305, "lyapunov": null, "grad_norm": 0.49760629850795685, "grad_max_sv": 0.16163251921534538, "grad_min_sv": 9.179918801505149e-09, "grad_condition": 26931510.48697853, "lr": 0.0001732896980049473, "time_sec": 66.76784825325012 }, { "epoch": 110, "train_loss": 2.971026375198364, "train_acc": 0.25932, "test_loss": 6.99457964477539, "test_acc": 0.0301, "lyapunov": null, "grad_norm": 0.4972222462184193, "grad_max_sv": 0.1576628390699625, "grad_min_sv": 9.118256634466082e-09, "grad_condition": 25805428.695002638, "lr": 0.00016543469682057076, "time_sec": 66.7546181678772 }, { "epoch": 111, "train_loss": 2.961785153198242, "train_acc": 0.25938, "test_loss": 7.5968095703125, "test_acc": 0.0278, "lyapunov": null, "grad_norm": 0.499682712724269, "grad_max_sv": 0.16410896554589272, "grad_min_sv": 9.131004422013866e-09, "grad_condition": 21672900.170981936, "lr": 0.00015772644703565552, "time_sec": 66.74458265304565 }, { "epoch": 112, "train_loss": 2.9625577368927, "train_acc": 0.25878, "test_loss": 7.764190951538086, "test_acc": 0.026, "lyapunov": null, "grad_norm": 0.498213643225678, "grad_max_sv": 0.15600935891270637, "grad_min_sv": 9.151295493614598e-09, "grad_condition": 20410187.211308915, "lr": 0.00015016832974331713, "time_sec": 66.75516033172607 }, { "epoch": 113, "train_loss": 2.95476414642334, "train_acc": 0.25912, "test_loss": 7.14678690032959, "test_acc": 0.0306, "lyapunov": null, "grad_norm": 0.4989192084378189, "grad_max_sv": 0.16326018050312996, "grad_min_sv": 9.208972755539447e-09, "grad_condition": 51946084.62151481, "lr": 0.00014276366018359834, "time_sec": 66.8117504119873 }, { "epoch": 114, "train_loss": 2.959580585861206, "train_acc": 0.26152, "test_loss": 7.228822399902343, "test_acc": 0.0306, "lyapunov": null, "grad_norm": 0.4993052937105196, "grad_max_sv": 0.1597112886607647, "grad_min_sv": 9.184225070735242e-09, "grad_condition": 24287456.61544974, "lr": 0.00013551568628929425, "time_sec": 66.71526288986206 }, { "epoch": 115, "train_loss": 2.951429924316406, "train_acc": 0.2597, "test_loss": 6.857805014038086, "test_acc": 0.0311, "lyapunov": null, "grad_norm": 0.5001172379881009, "grad_max_sv": 0.16317447423934936, "grad_min_sv": 9.167603101656319e-09, "grad_condition": 19878785.72490542, "lr": 0.00012842758726130276, "time_sec": 66.7846131324768 }, { "epoch": 116, "train_loss": 2.9463225456237794, "train_acc": 0.26044, "test_loss": 7.2446568466186525, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.4998364506796334, "grad_max_sv": 0.16249994188547134, "grad_min_sv": 9.130782213651045e-09, "grad_condition": 19998723.305069156, "lr": 0.0001215024721741218, "time_sec": 66.7700080871582 }, { "epoch": 117, "train_loss": 2.937184557876587, "train_acc": 0.26268, "test_loss": 7.438090939331055, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.5024891978806302, "grad_max_sv": 0.16552512347698212, "grad_min_sv": 9.170617681214522e-09, "grad_condition": 40015057.54321941, "lr": 0.00011474337861210538, "time_sec": 66.80615854263306 }, { "epoch": 118, "train_loss": 2.942110910797119, "train_acc": 0.2621, "test_loss": 7.324624530029297, "test_acc": 0.0273, "lyapunov": null, "grad_norm": 0.5000364684279365, "grad_max_sv": 0.16344034522771836, "grad_min_sv": 9.328158331878279e-09, "grad_condition": 21122225.248831175, "lr": 0.00010815327133708009, "time_sec": 66.78372955322266 }, { "epoch": 119, "train_loss": 2.93369575592041, "train_acc": 0.26596, "test_loss": 8.056785229492187, "test_acc": 0.0234, "lyapunov": null, "grad_norm": 0.5006441450285836, "grad_max_sv": 0.1595278237015009, "grad_min_sv": 9.219788181871746e-09, "grad_condition": 69721984.41132018, "lr": 0.00010173504098790182, "time_sec": 66.76624512672424 }, { "epoch": 120, "train_loss": 2.932797766189575, "train_acc": 0.26344, "test_loss": 7.282906192016601, "test_acc": 0.0275, "lyapunov": null, "grad_norm": 0.5037900163559795, "grad_max_sv": 0.16313258111476897, "grad_min_sv": 9.198472578075822e-09, "grad_condition": 21164339.052237906, "lr": 9.549150281252629e-05, "time_sec": 66.71441149711609 }, { "epoch": 121, "train_loss": 2.9284527645874023, "train_acc": 0.26852, "test_loss": 7.262115740966797, "test_acc": 0.0293, "lyapunov": null, "grad_norm": 0.5036251360683918, "grad_max_sv": 0.1591605730354786, "grad_min_sv": 9.272000557614124e-09, "grad_condition": 40898149.281216756, "lr": 8.942539543314794e-05, "time_sec": 66.74046039581299 }, { "epoch": 122, "train_loss": 2.936891605682373, "train_acc": 0.2668, "test_loss": 7.490768426513672, "test_acc": 0.0269, "lyapunov": null, "grad_norm": 0.5021434540478252, "grad_max_sv": 0.16143947280943394, "grad_min_sv": 9.394398098327983e-09, "grad_condition": 19799976.943244066, "lr": 8.353937964495024e-05, "time_sec": 66.81744265556335 }, { "epoch": 123, "train_loss": 2.9236154601287843, "train_acc": 0.26716, "test_loss": 7.120488947296143, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.5028382354847799, "grad_max_sv": 0.15968299470841885, "grad_min_sv": 9.204075489266384e-09, "grad_condition": 47939633.576168984, "lr": 7.783603724899243e-05, "time_sec": 66.76852679252625 }, { "epoch": 124, "train_loss": 2.92061264755249, "train_acc": 0.2666, "test_loss": 7.461192834472656, "test_acc": 0.0278, "lyapunov": null, "grad_norm": 0.5005688158224261, "grad_max_sv": 0.1629866801202297, "grad_min_sv": 9.212228484906105e-09, "grad_condition": 33814966.96761195, "lr": 7.231786991974666e-05, "time_sec": 66.7814073562622 }, { "epoch": 125, "train_loss": 2.9229219720458985, "train_acc": 0.26648, "test_loss": 7.498983331298828, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.5030160580327866, "grad_max_sv": 0.16155149266123772, "grad_min_sv": 9.212426940741203e-09, "grad_condition": 19527956.667884845, "lr": 6.698729810778072e-05, "time_sec": 66.79239439964294 }, { "epoch": 126, "train_loss": 2.9202857413482666, "train_acc": 0.26618, "test_loss": 7.286036429595947, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.5046458563501821, "grad_max_sv": 0.16270169503986837, "grad_min_sv": 9.235521156170102e-09, "grad_condition": 21514883.897712767, "lr": 6.184665997806817e-05, "time_sec": 66.79009366035461 }, { "epoch": 127, "train_loss": 2.9112009690093994, "train_acc": 0.27148, "test_loss": 6.8060284591674804, "test_acc": 0.0299, "lyapunov": null, "grad_norm": 0.5048043752309758, "grad_max_sv": 0.1627126146107912, "grad_min_sv": 9.337147274801615e-09, "grad_condition": 20067936.42847693, "lr": 5.6898210384392595e-05, "time_sec": 66.7122654914856 }, { "epoch": 128, "train_loss": 2.915534998703003, "train_acc": 0.26936, "test_loss": 7.528692306518555, "test_acc": 0.027, "lyapunov": null, "grad_norm": 0.505141680481134, "grad_max_sv": 0.15927630066871643, "grad_min_sv": 9.138972020816815e-09, "grad_condition": 283653990.6139595, "lr": 5.214411988029363e-05, "time_sec": 66.76755571365356 }, { "epoch": 129, "train_loss": 2.911044763031006, "train_acc": 0.26856, "test_loss": 7.442652993774414, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 0.5029480129383956, "grad_max_sv": 0.16405761763453483, "grad_min_sv": 9.220356501568604e-09, "grad_condition": 46047919.55891801, "lr": 4.7586473766990294e-05, "time_sec": 66.69603776931763 }, { "epoch": 130, "train_loss": 2.907666951751709, "train_acc": 0.26828, "test_loss": 7.026823535919189, "test_acc": 0.0288, "lyapunov": null, "grad_norm": 0.5025376312973467, "grad_max_sv": 0.15946717746555805, "grad_min_sv": 9.221378457352492e-09, "grad_condition": 33199750.366487652, "lr": 4.32272711786996e-05, "time_sec": 66.69535183906555 }, { "epoch": 131, "train_loss": 2.902869781417847, "train_acc": 0.26958, "test_loss": 7.536094513702393, "test_acc": 0.0292, "lyapunov": null, "grad_norm": 0.5050312390729839, "grad_max_sv": 0.16128032505512238, "grad_min_sv": 9.28452798905008e-09, "grad_condition": 135705763.13078815, "lr": 3.906842420574966e-05, "time_sec": 66.77000784873962 }, { "epoch": 132, "train_loss": 2.9037561528778078, "train_acc": 0.27136, "test_loss": 7.281431489562988, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.5052870516198174, "grad_max_sv": 0.1615588180720806, "grad_min_sv": 9.289024057758388e-09, "grad_condition": 128507811.16031823, "lr": 3.5111757055874305e-05, "time_sec": 66.75163435935974 }, { "epoch": 133, "train_loss": 2.8991165522766114, "train_acc": 0.27156, "test_loss": 7.282987453460693, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.5034061589294716, "grad_max_sv": 0.1581054452806711, "grad_min_sv": 9.274782794554958e-09, "grad_condition": 19574470.928057812, "lr": 3.1359005254054254e-05, "time_sec": 66.75138425827026 }, { "epoch": 134, "train_loss": 2.9077910748291016, "train_acc": 0.2711, "test_loss": 7.448024377441406, "test_acc": 0.0294, "lyapunov": null, "grad_norm": 0.5046423793403062, "grad_max_sv": 0.1635249551385641, "grad_min_sv": 9.433638015199363e-09, "grad_condition": 28668380.335333012, "lr": 2.7811814881259484e-05, "time_sec": 66.7329490184784 }, { "epoch": 135, "train_loss": 2.896955527267456, "train_acc": 0.27268, "test_loss": 7.478409793090821, "test_acc": 0.028, "lyapunov": null, "grad_norm": 0.5037173672388571, "grad_max_sv": 0.1622908242046833, "grad_min_sv": 9.298784615918709e-09, "grad_condition": 61773843.27193861, "lr": 2.4471741852423218e-05, "time_sec": 66.7459568977356 }, { "epoch": 136, "train_loss": 2.8964898432922364, "train_acc": 0.27182, "test_loss": 7.354159661865235, "test_acc": 0.028, "lyapunov": null, "grad_norm": 0.5028619652958791, "grad_max_sv": 0.1600797414779663, "grad_min_sv": 9.074624002236575e-09, "grad_condition": 22249764.299153708, "lr": 2.1340251233966362e-05, "time_sec": 66.75164866447449 }, { "epoch": 137, "train_loss": 2.895348368530273, "train_acc": 0.27172, "test_loss": 7.632054917144775, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.5031853951467254, "grad_max_sv": 0.16463851928710938, "grad_min_sv": 9.441171729823727e-09, "grad_condition": 30855600.541313868, "lr": 1.8418716601170932e-05, "time_sec": 66.75186562538147 }, { "epoch": 138, "train_loss": 2.900583278427124, "train_acc": 0.2717, "test_loss": 7.199238876342774, "test_acc": 0.0295, "lyapunov": null, "grad_norm": 0.5034869997386973, "grad_max_sv": 0.16063327342271805, "grad_min_sv": 9.296063535613186e-09, "grad_condition": 25145907.489137426, "lr": 1.570841943568445e-05, "time_sec": 66.75230479240417 }, { "epoch": 139, "train_loss": 2.8933637355804445, "train_acc": 0.27194, "test_loss": 7.248442086029053, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.504304603082473, "grad_max_sv": 0.162884946167469, "grad_min_sv": 9.367608214128075e-09, "grad_condition": 19993036.722377926, "lr": 1.3210548563419845e-05, "time_sec": 66.7671320438385 }, { "epoch": 140, "train_loss": 2.894832459564209, "train_acc": 0.27222, "test_loss": 7.71000400390625, "test_acc": 0.0294, "lyapunov": null, "grad_norm": 0.5047832470696201, "grad_max_sv": 0.16155096814036368, "grad_min_sv": 9.160464450874706e-09, "grad_condition": 20567241.25641649, "lr": 1.0926199633097203e-05, "time_sec": 66.73179697990417 }, { "epoch": 141, "train_loss": 2.897352989578247, "train_acc": 0.27064, "test_loss": 7.4464299194335934, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 0.5061737427703262, "grad_max_sv": 0.16413113810122013, "grad_min_sv": 9.289870605763695e-09, "grad_condition": 51343563.84333199, "lr": 8.856374635655688e-06, "time_sec": 66.75452041625977 }, { "epoch": 142, "train_loss": 2.8876253887939454, "train_acc": 0.2751, "test_loss": 7.67550869064331, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.50486204633145, "grad_max_sv": 0.16515321880578995, "grad_min_sv": 9.218709545733006e-09, "grad_condition": 25662988.761511788, "lr": 7.001981464747503e-06, "time_sec": 66.76586389541626 }, { "epoch": 143, "train_loss": 2.8951072731781005, "train_acc": 0.2711, "test_loss": 7.276433151245117, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.5066003424324655, "grad_max_sv": 0.16512982696294784, "grad_min_sv": 9.368238332307932e-09, "grad_condition": 20872282.150921334, "lr": 5.3638335185058295e-06, "time_sec": 66.77883982658386 }, { "epoch": 144, "train_loss": 2.896107662887573, "train_acc": 0.27174, "test_loss": 7.442941972351075, "test_acc": 0.0282, "lyapunov": null, "grad_norm": 0.5058752626030726, "grad_max_sv": 0.1646978858858347, "grad_min_sv": 9.187450514258621e-09, "grad_condition": 21323054.46289139, "lr": 3.942649342761114e-06, "time_sec": 66.74654960632324 }, { "epoch": 145, "train_loss": 2.8981069023132324, "train_acc": 0.27052, "test_loss": 7.511137809753418, "test_acc": 0.0286, "lyapunov": null, "grad_norm": 0.5043941197302124, "grad_max_sv": 0.16361674722284078, "grad_min_sv": 9.248454605793876e-09, "grad_condition": 124843071.51810357, "lr": 2.7390523158633524e-06, "time_sec": 66.71942782402039 }, { "epoch": 146, "train_loss": 2.897443035583496, "train_acc": 0.27094, "test_loss": 7.219273558044433, "test_acc": 0.0301, "lyapunov": null, "grad_norm": 0.5044889597609223, "grad_max_sv": 0.1617003157734871, "grad_min_sv": 9.33726697904813e-09, "grad_condition": 20578970.810026187, "lr": 1.7535703752478133e-06, "time_sec": 66.74967193603516 }, { "epoch": 147, "train_loss": 2.8972148944854736, "train_acc": 0.27036, "test_loss": 7.628332612609864, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.5052009377242357, "grad_max_sv": 0.15890285596251488, "grad_min_sv": 9.382556353555727e-09, "grad_condition": 91821063.92388035, "lr": 9.866357858642196e-07, "time_sec": 66.73621463775635 }, { "epoch": 148, "train_loss": 2.8898702787017823, "train_acc": 0.27194, "test_loss": 7.505082284545899, "test_acc": 0.0258, "lyapunov": null, "grad_norm": 0.5047197831030149, "grad_max_sv": 0.16516413502395152, "grad_min_sv": 9.324620061507139e-09, "grad_condition": 43789169.5949554, "lr": 4.38584950570808e-07, "time_sec": 66.76141929626465 }, { "epoch": 149, "train_loss": 2.9011361352539065, "train_acc": 0.26824, "test_loss": 7.6542517242431645, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.5054339021083573, "grad_max_sv": 0.16298294067382812, "grad_min_sv": 9.178197371562114e-09, "grad_condition": 21653740.393576562, "lr": 1.096582625772501e-07, "time_sec": 66.75421690940857 }, { "epoch": 150, "train_loss": 2.9011223357391356, "train_acc": 0.27114, "test_loss": 7.460437265014648, "test_acc": 0.029, "lyapunov": null, "grad_norm": 0.5059469716903541, "grad_max_sv": 0.16557817347347736, "grad_min_sv": 9.153120701372967e-09, "grad_condition": 361494763.7112081, "lr": 0.0, "time_sec": 66.78962397575378 } ] }, "lyapunov": { "4": [ { "epoch": 1, "train_loss": 4.580237577819824, "train_acc": 0.07172, "test_loss": 4.204835011291504, "test_acc": 0.0865, "lyapunov": 2.1020694111314273, "grad_norm": 5.891421444416132, "grad_max_sv": 4.6086235523223875, "grad_min_sv": 1.0778671248878879e-07, "grad_condition": 54871165.85509853, "lr": 0.0009998903417374227, "time_sec": 41.860575914382935 }, { "epoch": 2, "train_loss": 4.172055626296997, "train_acc": 0.0921, "test_loss": 4.402019414520264, "test_acc": 0.0558, "lyapunov": 1.6787975471647805, "grad_norm": 3.9258769364442525, "grad_max_sv": 2.9158192813396453, "grad_min_sv": 7.291154454081017e-08, "grad_condition": 84308361.49485277, "lr": 0.0009995614150494292, "time_sec": 41.754839181900024 }, { "epoch": 3, "train_loss": 4.050799645080566, "train_acc": 0.10584, "test_loss": 5.545398815917968, "test_acc": 0.041, "lyapunov": 1.5661922080437545, "grad_norm": 3.128537052862856, "grad_max_sv": 2.1766103327274324, "grad_min_sv": 5.8618463349979774e-08, "grad_condition": 41372858.502355784, "lr": 0.0009990133642141358, "time_sec": 41.694422006607056 }, { "epoch": 4, "train_loss": 3.9627039431762694, "train_acc": 0.11682, "test_loss": 6.328290705871582, "test_acc": 0.0228, "lyapunov": 1.5445425864070883, "grad_norm": 2.5082278391489035, "grad_max_sv": 1.6217471033334732, "grad_min_sv": 4.5938650922172644e-08, "grad_condition": 63153156.340209946, "lr": 0.0009982464296247522, "time_sec": 41.7418487071991 }, { "epoch": 5, "train_loss": 3.9077672985839844, "train_acc": 0.1305, "test_loss": 6.821084007263184, "test_acc": 0.0156, "lyapunov": 1.530182860086641, "grad_norm": 2.041783975921356, "grad_max_sv": 1.2541583150625228, "grad_min_sv": 3.773506419557649e-08, "grad_condition": 36438804.96965951, "lr": 0.0009972609476841367, "time_sec": 41.74874401092529 }, { "epoch": 6, "train_loss": 3.978193638305664, "train_acc": 0.1273, "test_loss": 10.715914828491211, "test_acc": 0.015, "lyapunov": 1.5294916736500344, "grad_norm": 1.884529182522603, "grad_max_sv": 1.174074074625969, "grad_min_sv": 3.492432684992774e-08, "grad_condition": 56687028.60603394, "lr": 0.000996057350657239, "time_sec": 41.79358172416687 }, { "epoch": 7, "train_loss": 4.028493068466187, "train_acc": 0.12364, "test_loss": 8.849580982971192, "test_acc": 0.0108, "lyapunov": 1.5220741317095354, "grad_norm": 1.6311583818363289, "grad_max_sv": 0.9764176219701767, "grad_min_sv": 2.9745892293764343e-08, "grad_condition": 38380014.867613696, "lr": 0.000994636166481494, "time_sec": 41.74577260017395 }, { "epoch": 8, "train_loss": 4.104167304382324, "train_acc": 0.11452, "test_loss": 9.404642602539063, "test_acc": 0.0179, "lyapunov": 1.5335235891439725, "grad_norm": 1.4435862607793115, "grad_max_sv": 0.8796723946928978, "grad_min_sv": 2.6115679115784607e-08, "grad_condition": 100856221.49209695, "lr": 0.0009929980185352525, "time_sec": 41.813751220703125 }, { "epoch": 9, "train_loss": 4.36510063079834, "train_acc": 0.08636, "test_loss": 7.074767668151855, "test_acc": 0.0144, "lyapunov": 1.5799841203957872, "grad_norm": 1.3148798714645298, "grad_max_sv": 0.7969768509268761, "grad_min_sv": 2.3226430623246585e-08, "grad_condition": 42533078.34572536, "lr": 0.0009911436253643444, "time_sec": 41.729400634765625 }, { "epoch": 10, "train_loss": 4.559664976348877, "train_acc": 0.06118, "test_loss": 6.018364582824707, "test_acc": 0.01, "lyapunov": 1.5615371959593596, "grad_norm": 1.0712815395536825, "grad_max_sv": 0.5929864205420017, "grad_min_sv": 1.803380545450928e-08, "grad_condition": 45789422.46232475, "lr": 0.0009890738003669028, "time_sec": 41.75548052787781 }, { "epoch": 11, "train_loss": 4.644180833282471, "train_acc": 0.05202, "test_loss": 6.277861665344238, "test_acc": 0.01, "lyapunov": 1.5085474514900266, "grad_norm": 0.9280338123504958, "grad_max_sv": 0.5784458503127098, "grad_min_sv": 1.5023789502743857e-08, "grad_condition": 63657686.089994095, "lr": 0.00098678945143658, "time_sec": 41.724050760269165 }, { "epoch": 12, "train_loss": 4.769687054901123, "train_acc": 0.03436, "test_loss": 7.280889709472656, "test_acc": 0.01, "lyapunov": 1.4389935622129904, "grad_norm": 0.7003645750231552, "grad_max_sv": 0.4854817561805248, "grad_min_sv": 1.030722744932433e-08, "grad_condition": 53249509.08795764, "lr": 0.0009842915805643154, "time_sec": 41.72962784767151 }, { "epoch": 13, "train_loss": 4.684542055053711, "train_acc": 0.047, "test_loss": 6.991418453979493, "test_acc": 0.0112, "lyapunov": 1.4236155184333588, "grad_norm": 0.5991208192017541, "grad_max_sv": 0.38398267030715943, "grad_min_sv": 9.323978394926158e-09, "grad_condition": 49967645.39513852, "lr": 0.000981581283398829, "time_sec": 41.743834018707275 }, { "epoch": 14, "train_loss": 4.875620534667969, "train_acc": 0.02944, "test_loss": 7.128801351165771, "test_acc": 0.01, "lyapunov": 1.427685697060412, "grad_norm": 0.5025111739329319, "grad_max_sv": 0.35512366965413095, "grad_min_sv": 6.843199759284935e-09, "grad_condition": 179836296.82542375, "lr": 0.0009786597487660333, "time_sec": 41.73904871940613 }, { "epoch": 15, "train_loss": 4.896511934967041, "train_acc": 0.0335, "test_loss": 17.298480625915527, "test_acc": 0.01, "lyapunov": 1.4632702230492516, "grad_norm": 0.6331107294627782, "grad_max_sv": 0.40708996057510377, "grad_min_sv": 8.00606376749613e-09, "grad_condition": 61874764.454221845, "lr": 0.0009755282581475766, "time_sec": 41.74419069290161 }, { "epoch": 16, "train_loss": 4.912100847015381, "train_acc": 0.03632, "test_loss": 8.131814362335206, "test_acc": 0.0173, "lyapunov": 1.4873096464235154, "grad_norm": 0.826404597993897, "grad_max_sv": 0.5076741345226765, "grad_min_sv": 9.837833857273547e-09, "grad_condition": 88718975.42972028, "lr": 0.0009721881851187403, "time_sec": 41.72049045562744 }, { "epoch": 17, "train_loss": 5.142030757446289, "train_acc": 0.01672, "test_loss": 6.458518544006347, "test_acc": 0.01, "lyapunov": 1.4868055615583649, "grad_norm": 0.685951759542417, "grad_max_sv": 0.5134769573807716, "grad_min_sv": 7.799288968823869e-09, "grad_condition": 85468742.13553956, "lr": 0.0009686409947459456, "time_sec": 41.73842525482178 }, { "epoch": 18, "train_loss": 5.188919100646973, "train_acc": 0.00968, "test_loss": 10.075014764404298, "test_acc": 0.01, "lyapunov": 1.4449111775059225, "grad_norm": 0.4332247860431087, "grad_max_sv": 0.3550705298781395, "grad_min_sv": 4.337704034504397e-09, "grad_condition": 117230068.9379596, "lr": 0.0009648882429441254, "time_sec": 41.763601779937744 }, { "epoch": 19, "train_loss": 5.226645467529297, "train_acc": 0.01012, "test_loss": 10.154055513000488, "test_acc": 0.01, "lyapunov": 1.4546792269362818, "grad_norm": 0.3237987289049562, "grad_max_sv": 0.2639503736048937, "grad_min_sv": 2.060994466181133e-09, "grad_condition": 14048870017.770252, "lr": 0.00096093157579425, "time_sec": 41.76903176307678 }, { "epoch": 20, "train_loss": 5.22861256149292, "train_acc": 0.00962, "test_loss": 9.159314030456542, "test_acc": 0.01, "lyapunov": 1.4311617704303674, "grad_norm": 0.2580272391441697, "grad_max_sv": 0.2014818772673607, "grad_min_sv": 4.775887305801581e-11, "grad_condition": 131599872645.97823, "lr": 0.0009567727288213001, "time_sec": 41.77689838409424 }, { "epoch": 21, "train_loss": 5.2369175091552735, "train_acc": 0.0091, "test_loss": 9.329907885742188, "test_acc": 0.01, "lyapunov": 1.4427513545736328, "grad_norm": 0.20829668219493744, "grad_max_sv": 0.15635721795260907, "grad_min_sv": 7.96448125755094e-11, "grad_condition": 123768275801.26958, "lr": 0.0009524135262330095, "time_sec": 41.749500036239624 }, { "epoch": 22, "train_loss": 5.232069122619629, "train_acc": 0.00928, "test_loss": 8.256287899780274, "test_acc": 0.01, "lyapunov": 1.43826272115683, "grad_norm": 0.18574459317073533, "grad_max_sv": 0.13343477975577117, "grad_min_sv": 3.891468616243542e-11, "grad_condition": 128132122536.13669, "lr": 0.0009478558801197061, "time_sec": 41.73808455467224 }, { "epoch": 23, "train_loss": 5.223144430541992, "train_acc": 0.00912, "test_loss": 8.333074249267579, "test_acc": 0.01, "lyapunov": 1.431471188659863, "grad_norm": 0.15147554959008916, "grad_max_sv": 0.10204733423888683, "grad_min_sv": 2.03341283080962e-15, "grad_condition": 101827814032.01648, "lr": 0.000943101789615607, "time_sec": 41.746745347976685 }, { "epoch": 24, "train_loss": 5.233420145263672, "train_acc": 0.00942, "test_loss": 7.730482585906983, "test_acc": 0.01, "lyapunov": 1.443052962917806, "grad_norm": 0.1288834602441298, "grad_max_sv": 0.07254640674218535, "grad_min_sv": 1.1788800604957402e-13, "grad_condition": 69609233199.00801, "lr": 0.0009381533400219313, "time_sec": 41.73458123207092 }, { "epoch": 25, "train_loss": 5.248794226074219, "train_acc": 0.01224, "test_loss": 6.550568232727051, "test_acc": 0.01, "lyapunov": 1.4743182287191796, "grad_norm": 0.19543413013737237, "grad_max_sv": 0.08613794101402164, "grad_min_sv": 6.309014754681635e-11, "grad_condition": 60792110328.20559, "lr": 0.0009330127018922189, "time_sec": 41.73256278038025 }, { "epoch": 26, "train_loss": 5.226683191070556, "train_acc": 0.00892, "test_loss": 5.647989534759522, "test_acc": 0.01, "lyapunov": 1.434842828289627, "grad_norm": 0.14721341402984697, "grad_max_sv": 0.09509434262290598, "grad_min_sv": 1.0618768151186443e-15, "grad_condition": 94978842737.15823, "lr": 0.000927682130080253, "time_sec": 41.72614550590515 }, { "epoch": 27, "train_loss": 5.229176857604981, "train_acc": 0.00972, "test_loss": 5.612284447479248, "test_acc": 0.01, "lyapunov": 1.4389631537830128, "grad_norm": 0.1286875557895635, "grad_max_sv": 0.07554986858740449, "grad_min_sv": 1.9029346441684858e-16, "grad_condition": 75528406184.49973, "lr": 0.0009221639627510072, "time_sec": 41.73252606391907 }, { "epoch": 28, "train_loss": 5.226171473999023, "train_acc": 0.00934, "test_loss": 5.924600332641601, "test_acc": 0.01, "lyapunov": 1.4371787568797236, "grad_norm": 0.10743150341998972, "grad_max_sv": 0.048194893449544904, "grad_min_sv": 0.0, "grad_condition": 48194893449.54491, "lr": 0.0009164606203550494, "time_sec": 41.72467064857483 }, { "epoch": 29, "train_loss": 5.230549348297119, "train_acc": 0.00932, "test_loss": 5.312363116455078, "test_acc": 0.01, "lyapunov": 1.4417800442946842, "grad_norm": 0.10913623720356962, "grad_max_sv": 0.050634372420608996, "grad_min_sv": 0.0, "grad_condition": 50634372420.60899, "lr": 0.0009105746045668516, "time_sec": 41.754605531692505 }, { "epoch": 30, "train_loss": 5.229708560028076, "train_acc": 0.0092, "test_loss": 5.395946918487549, "test_acc": 0.01, "lyapunov": 1.441019511588699, "grad_norm": 0.10497591874908667, "grad_max_sv": 0.04387410613708198, "grad_min_sv": 0.0, "grad_condition": 43874106137.081985, "lr": 0.0009045084971874733, "time_sec": 41.71743130683899 }, { "epoch": 31, "train_loss": 5.2316739025878904, "train_acc": 0.00982, "test_loss": 6.248269965362549, "test_acc": 0.01, "lyapunov": 1.443965878023211, "grad_norm": 0.10154022323683165, "grad_max_sv": 0.03353279777802527, "grad_min_sv": 0.0, "grad_condition": 33532797778.02527, "lr": 0.0008982649590120977, "time_sec": 41.701202392578125 }, { "epoch": 32, "train_loss": 5.23400792678833, "train_acc": 0.00938, "test_loss": 5.782683653259277, "test_acc": 0.01, "lyapunov": 1.446322088046452, "grad_norm": 0.10537953489915908, "grad_max_sv": 0.04410789059475064, "grad_min_sv": 0.0, "grad_condition": 44107890594.75064, "lr": 0.0008918467286629196, "time_sec": 41.70464754104614 }, { "epoch": 33, "train_loss": 5.232683167877197, "train_acc": 0.00858, "test_loss": 5.318116857910156, "test_acc": 0.01, "lyapunov": 1.4452067232497818, "grad_norm": 0.1008655295742077, "grad_max_sv": 0.03291638647206128, "grad_min_sv": 0.0, "grad_condition": 32916386472.06128, "lr": 0.0008852566213878943, "time_sec": 41.68885540962219 }, { "epoch": 34, "train_loss": 5.237297785339355, "train_acc": 0.00966, "test_loss": 5.309081327819825, "test_acc": 0.01, "lyapunov": 1.450283215783746, "grad_norm": 0.10345313863412257, "grad_max_sv": 0.04121980397030711, "grad_min_sv": 0.0, "grad_condition": 41219803970.30711, "lr": 0.000878497527825878, "time_sec": 41.72196674346924 }, { "epoch": 35, "train_loss": 5.240170780029297, "train_acc": 0.00886, "test_loss": 5.1140812942504885, "test_acc": 0.01, "lyapunov": 1.4520895359156383, "grad_norm": 0.10252991679320593, "grad_max_sv": 0.038473002053797244, "grad_min_sv": 0.0, "grad_condition": 38473002053.79725, "lr": 0.000871572412738697, "time_sec": 41.704707622528076 }, { "epoch": 36, "train_loss": 5.237992069244385, "train_acc": 0.0091, "test_loss": 5.254914206695557, "test_acc": 0.01, "lyapunov": 1.4511004372326004, "grad_norm": 0.1034357825731679, "grad_max_sv": 0.03689436963759363, "grad_min_sv": 0.0, "grad_condition": 36894369637.59363, "lr": 0.0008644843137107055, "time_sec": 41.68847870826721 }, { "epoch": 37, "train_loss": 5.24728928100586, "train_acc": 0.00948, "test_loss": 5.015587938690185, "test_acc": 0.01, "lyapunov": 1.4593792114111468, "grad_norm": 0.10030700112378006, "grad_max_sv": 0.027813022676855325, "grad_min_sv": 0.0, "grad_condition": 27813022676.855324, "lr": 0.0008572363398164014, "time_sec": 41.67623424530029 }, { "epoch": 38, "train_loss": 5.240536932220459, "train_acc": 0.0092, "test_loss": 4.961225141906739, "test_acc": 0.01, "lyapunov": 1.454334620319669, "grad_norm": 0.09505358413147648, "grad_max_sv": 0.022648979304358365, "grad_min_sv": 0.0, "grad_condition": 22648979304.35836, "lr": 0.0008498316702566826, "time_sec": 41.65856647491455 }, { "epoch": 39, "train_loss": 5.24094622467041, "train_acc": 0.00906, "test_loss": 4.902838454437256, "test_acc": 0.01, "lyapunov": 1.4547367199607517, "grad_norm": 0.09365021131775912, "grad_max_sv": 0.02316552624106407, "grad_min_sv": 0.0, "grad_condition": 23165526241.06407, "lr": 0.0008422735529643442, "time_sec": 41.66074347496033 }, { "epoch": 40, "train_loss": 5.245578489685059, "train_acc": 0.00954, "test_loss": 4.859429032897949, "test_acc": 0.01, "lyapunov": 1.4598181689791667, "grad_norm": 0.10147367716516044, "grad_max_sv": 0.023039095243439077, "grad_min_sv": 0.0, "grad_condition": 23039095243.43908, "lr": 0.0008345653031794289, "time_sec": 41.646554708480835 }, { "epoch": 41, "train_loss": 5.245340968780518, "train_acc": 0.00972, "test_loss": 5.133834055328369, "test_acc": 0.01, "lyapunov": 1.4597191298404313, "grad_norm": 0.09983575491941106, "grad_max_sv": 0.023509565647691487, "grad_min_sv": 0.0, "grad_condition": 23509565647.69149, "lr": 0.0008267103019950526, "time_sec": 41.67466497421265 }, { "epoch": 42, "train_loss": 5.243727160949707, "train_acc": 0.0094, "test_loss": 5.177202513122559, "test_acc": 0.01, "lyapunov": 1.457551447936641, "grad_norm": 0.10012844556744109, "grad_max_sv": 0.04022635291330516, "grad_min_sv": 0.0, "grad_condition": 40226352913.30516, "lr": 0.0008187119948743447, "time_sec": 41.69778633117676 }, { "epoch": 43, "train_loss": 5.245192972717285, "train_acc": 0.00916, "test_loss": 4.837023108673096, "test_acc": 0.01, "lyapunov": 1.4592695629505246, "grad_norm": 0.0977089071025598, "grad_max_sv": 0.02978864456526935, "grad_min_sv": 0.0, "grad_condition": 29788644565.269356, "lr": 0.000810573890139155, "time_sec": 41.68951177597046 }, { "epoch": 44, "train_loss": 5.2786666191101075, "train_acc": 0.01064, "test_loss": 5.4122274887084965, "test_acc": 0.01, "lyapunov": 1.5007501855835585, "grad_norm": 0.12265113875538343, "grad_max_sv": 0.033590356819331646, "grad_min_sv": 5.169785690831125e-14, "grad_condition": 31777859057.197426, "lr": 0.0008022995574311873, "time_sec": 41.67222714424133 }, { "epoch": 45, "train_loss": 5.251278916320801, "train_acc": 0.00912, "test_loss": 5.717527485656738, "test_acc": 0.01, "lyapunov": 1.4666499061047877, "grad_norm": 0.09464479083441923, "grad_max_sv": 0.015212097018957139, "grad_min_sv": 0.0, "grad_condition": 15212097018.957138, "lr": 0.0007938926261462363, "time_sec": 41.66761112213135 }, { "epoch": 46, "train_loss": 5.248660043487549, "train_acc": 0.00922, "test_loss": 5.687412886047364, "test_acc": 0.01, "lyapunov": 1.4640466523597309, "grad_norm": 0.09250900682814509, "grad_max_sv": 0.00974161345511675, "grad_min_sv": 0.0, "grad_condition": 9741613455.116749, "lr": 0.0007853567838422158, "time_sec": 41.62896704673767 }, { "epoch": 47, "train_loss": 5.249529778289795, "train_acc": 0.00976, "test_loss": 5.35712462310791, "test_acc": 0.01, "lyapunov": 1.4639555450595554, "grad_norm": 0.09683136939926335, "grad_max_sv": 0.02266658809967339, "grad_min_sv": 0.0, "grad_condition": 22666588099.67339, "lr": 0.0007766957746216719, "time_sec": 41.632965326309204 }, { "epoch": 48, "train_loss": 5.2507288345336915, "train_acc": 0.00952, "test_loss": 5.053029971313476, "test_acc": 0.01, "lyapunov": 1.46576005692982, "grad_norm": 0.09407593048273037, "grad_max_sv": 0.027120837941765785, "grad_min_sv": 0.0, "grad_condition": 27120837941.765785, "lr": 0.0007679133974894982, "time_sec": 41.65870714187622 }, { "epoch": 49, "train_loss": 5.249875890960693, "train_acc": 0.00884, "test_loss": 5.38174955444336, "test_acc": 0.01, "lyapunov": 1.465318091690083, "grad_norm": 0.09064589183935413, "grad_max_sv": 0.008867102395743131, "grad_min_sv": 0.0, "grad_condition": 8867102395.743132, "lr": 0.000759013504686565, "time_sec": 41.735912561416626 }, { "epoch": 50, "train_loss": 5.250207867889404, "train_acc": 0.00898, "test_loss": 5.739707115173339, "test_acc": 0.01, "lyapunov": 1.4655792646091004, "grad_norm": 0.09717189190349201, "grad_max_sv": 0.021169214555993677, "grad_min_sv": 0.0, "grad_condition": 21169214555.993675, "lr": 0.0007499999999999998, "time_sec": 41.72933316230774 }, { "epoch": 51, "train_loss": 5.250648717803955, "train_acc": 0.00912, "test_loss": 6.128197521972656, "test_acc": 0.01, "lyapunov": 1.4661765546749925, "grad_norm": 0.09095698035941559, "grad_max_sv": 0.01055141636170447, "grad_min_sv": 0.0, "grad_condition": 10551416361.704468, "lr": 0.0007408768370508575, "time_sec": 41.69919180870056 }, { "epoch": 52, "train_loss": 5.251839170684814, "train_acc": 0.00908, "test_loss": 6.067484506225586, "test_acc": 0.01, "lyapunov": 1.4675627587091586, "grad_norm": 0.09067609636620885, "grad_max_sv": 0.004669012082740664, "grad_min_sv": 0.0, "grad_condition": 4669012082.7406645, "lr": 0.0007316480175599307, "time_sec": 41.654059171676636 }, { "epoch": 53, "train_loss": 5.253518835144043, "train_acc": 0.00896, "test_loss": 5.7827218193054195, "test_acc": 0.01, "lyapunov": 1.4693938874832504, "grad_norm": 0.09137616955031719, "grad_max_sv": 0.010091183660551905, "grad_min_sv": 0.0, "grad_condition": 10091183660.551905, "lr": 0.0007223175895924635, "time_sec": 41.642850160598755 }, { "epoch": 54, "train_loss": 5.254051934051514, "train_acc": 0.00872, "test_loss": 5.591477861022949, "test_acc": 0.01, "lyapunov": 1.4702323230026324, "grad_norm": 0.08996816491022355, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 41.657779932022095 }, { "epoch": 55, "train_loss": 5.255190885314941, "train_acc": 0.00916, "test_loss": 5.435504406738281, "test_acc": 0.01, "lyapunov": 1.4712699441348804, "grad_norm": 0.09391959822012276, "grad_max_sv": 0.005470911040902138, "grad_min_sv": 0.0, "grad_condition": 5470911040.902138, "lr": 0.0007033683215378998, "time_sec": 41.70645236968994 }, { "epoch": 56, "train_loss": 5.254567480010986, "train_acc": 0.0092, "test_loss": 5.745911796569824, "test_acc": 0.01, "lyapunov": 1.470891768670143, "grad_norm": 0.08856701808364516, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 41.71012330055237 }, { "epoch": 57, "train_loss": 5.255953155822754, "train_acc": 0.00902, "test_loss": 5.410791555023193, "test_acc": 0.01, "lyapunov": 1.4723095774955457, "grad_norm": 0.0914524874609732, "grad_max_sv": 0.005876953201368451, "grad_min_sv": 0.0, "grad_condition": 5876953201.368451, "lr": 0.0006840622763423388, "time_sec": 41.65397572517395 }, { "epoch": 58, "train_loss": 5.255620794372558, "train_acc": 0.00814, "test_loss": 5.248719776153565, "test_acc": 0.01, "lyapunov": 1.4720726202211112, "grad_norm": 0.08957407910190007, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006742860236609073, "time_sec": 41.596808195114136 }, { "epoch": 59, "train_loss": 5.256758173370361, "train_acc": 0.00904, "test_loss": 5.839924575805664, "test_acc": 0.01, "lyapunov": 1.4729903738212098, "grad_norm": 0.09261814392317223, "grad_max_sv": 0.016021678689867258, "grad_min_sv": 0.0, "grad_condition": 16021678689.867258, "lr": 0.0006644333233692913, "time_sec": 41.65124177932739 }, { "epoch": 60, "train_loss": 5.256810084991455, "train_acc": 0.00942, "test_loss": 5.447851982879639, "test_acc": 0.01, "lyapunov": 1.4729429684636537, "grad_norm": 0.09328751710854948, "grad_max_sv": 0.018184319231659175, "grad_min_sv": 0.0, "grad_condition": 18184319231.659172, "lr": 0.0006545084971874734, "time_sec": 41.677849769592285 }, { "epoch": 61, "train_loss": 5.257736980895996, "train_acc": 0.00956, "test_loss": 5.214775198364258, "test_acc": 0.01, "lyapunov": 1.4742664586552574, "grad_norm": 0.09141104511491621, "grad_max_sv": 0.014100066805258393, "grad_min_sv": 0.0, "grad_condition": 14100066805.258392, "lr": 0.0006445158984722354, "time_sec": 41.65701365470886 }, { "epoch": 62, "train_loss": 5.257541732788086, "train_acc": 0.00888, "test_loss": 5.395826309204102, "test_acc": 0.01, "lyapunov": 1.4742513254780294, "grad_norm": 0.08871521712913655, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 41.64438438415527 }, { "epoch": 63, "train_loss": 5.258026624908447, "train_acc": 0.00826, "test_loss": 5.438673513793946, "test_acc": 0.01, "lyapunov": 1.474777021066612, "grad_norm": 0.08974006980177573, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 41.659621477127075 }, { "epoch": 64, "train_loss": 5.256656706237793, "train_acc": 0.00858, "test_loss": 5.30103558959961, "test_acc": 0.01, "lyapunov": 1.4732483726023409, "grad_norm": 0.08966165557801938, "grad_max_sv": 0.002812969218939543, "grad_min_sv": 0.0, "grad_condition": 2812969218.939543, "lr": 0.0006141754350553275, "time_sec": 41.680859327316284 }, { "epoch": 65, "train_loss": 5.25918576675415, "train_acc": 0.00894, "test_loss": 5.125008965301514, "test_acc": 0.01, "lyapunov": 1.4760865912108165, "grad_norm": 0.0887662183827418, "grad_max_sv": 0.0005635306239128113, "grad_min_sv": 0.0, "grad_condition": 563530623.9128113, "lr": 0.0006039558454088793, "time_sec": 41.60912251472473 }, { "epoch": 66, "train_loss": 5.260574841461182, "train_acc": 0.00874, "test_loss": 5.454896185302735, "test_acc": 0.01, "lyapunov": 1.4776358738579713, "grad_norm": 0.11531617666338094, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 41.6300413608551 }, { "epoch": 67, "train_loss": 5.259261641082763, "train_acc": 0.00928, "test_loss": 5.808028590393066, "test_acc": 0.01, "lyapunov": 1.4762413047463692, "grad_norm": 0.08815522678931535, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 41.62497115135193 }, { "epoch": 68, "train_loss": 5.2594527183532715, "train_acc": 0.00938, "test_loss": 5.654487629699707, "test_acc": 0.01, "lyapunov": 1.4761893337644885, "grad_norm": 0.09333979255701338, "grad_max_sv": 0.014018809190019965, "grad_min_sv": 0.0, "grad_condition": 14018809190.019964, "lr": 0.0005730415142812054, "time_sec": 41.621119260787964 }, { "epoch": 69, "train_loss": 5.26328825378418, "train_acc": 0.00966, "test_loss": 5.534258514404297, "test_acc": 0.01, "lyapunov": 1.4803016765038375, "grad_norm": 0.10303270455881028, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 41.61156606674194 }, { "epoch": 70, "train_loss": 5.261220071105957, "train_acc": 0.00968, "test_loss": 5.542517721557617, "test_acc": 0.01, "lyapunov": 1.4784168117796368, "grad_norm": 0.08844874021214537, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005522642316338265, "time_sec": 41.62671518325806 }, { "epoch": 71, "train_loss": 5.260938765716553, "train_acc": 0.00862, "test_loss": 5.420013078308106, "test_acc": 0.01, "lyapunov": 1.4779477622502906, "grad_norm": 0.0889283460956175, "grad_max_sv": 0.0034733008593320846, "grad_min_sv": 0.0, "grad_condition": 3473300859.3320847, "lr": 0.0005418389216661573, "time_sec": 41.62442445755005 }, { "epoch": 72, "train_loss": 5.260601893157959, "train_acc": 0.00902, "test_loss": 5.176327791595459, "test_acc": 0.01, "lyapunov": 1.4776618431901078, "grad_norm": 0.0902718541800826, "grad_max_sv": 0.012300812685862184, "grad_min_sv": 0.0, "grad_condition": 12300812685.862183, "lr": 0.0005313952597646563, "time_sec": 41.66868996620178 }, { "epoch": 73, "train_loss": 5.264250277404785, "train_acc": 0.00884, "test_loss": 5.100635796356201, "test_acc": 0.01, "lyapunov": 1.4813997955883251, "grad_norm": 0.0903405536598621, "grad_max_sv": 0.007483795657753945, "grad_min_sv": 0.0, "grad_condition": 7483795657.7539425, "lr": 0.0005209378268645994, "time_sec": 41.626320600509644 }, { "epoch": 74, "train_loss": 5.26120802658081, "train_acc": 0.0087, "test_loss": 5.235371070861817, "test_acc": 0.01, "lyapunov": 1.4784196508510032, "grad_norm": 0.0879091159548037, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005104712099416781, "time_sec": 41.62154483795166 }, { "epoch": 75, "train_loss": 5.267138383178711, "train_acc": 0.00858, "test_loss": 4.973852683258056, "test_acc": 0.01, "lyapunov": 1.4819577859185846, "grad_norm": 0.08881358787274304, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 41.638519048690796 }, { "epoch": 76, "train_loss": 5.2642199221801755, "train_acc": 0.00822, "test_loss": 5.071284794616699, "test_acc": 0.01, "lyapunov": 1.4816657048661996, "grad_norm": 0.08882388372557563, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 41.619221925735474 }, { "epoch": 77, "train_loss": 5.273737740020752, "train_acc": 0.00884, "test_loss": 4.974697065734864, "test_acc": 0.01, "lyapunov": 1.490840724667015, "grad_norm": 0.08942192638502924, "grad_max_sv": 0.0068177991081029175, "grad_min_sv": 0.0, "grad_condition": 6817799108.102918, "lr": 0.0004790621731353997, "time_sec": 41.63776922225952 }, { "epoch": 78, "train_loss": 5.261278802490234, "train_acc": 0.00874, "test_loss": 4.976500602722168, "test_acc": 0.01, "lyapunov": 1.4785530381190501, "grad_norm": 0.0880515343100226, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 41.607832193374634 }, { "epoch": 79, "train_loss": 5.263828933258057, "train_acc": 0.00816, "test_loss": 4.9257099716186525, "test_acc": 0.01, "lyapunov": 1.4813517496713897, "grad_norm": 0.08863134124223197, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 41.631874561309814 }, { "epoch": 80, "train_loss": 5.268178493652344, "train_acc": 0.00912, "test_loss": 4.912583598327637, "test_acc": 0.01, "lyapunov": 1.4849315034154127, "grad_norm": 0.08860861584524822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 41.710554122924805 }, { "epoch": 81, "train_loss": 5.26138502532959, "train_acc": 0.00922, "test_loss": 4.878695037841797, "test_acc": 0.01, "lyapunov": 1.478672110820975, "grad_norm": 0.09157782940494599, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 41.64098763465881 }, { "epoch": 82, "train_loss": 5.268409018859863, "train_acc": 0.00922, "test_loss": 4.908391270446777, "test_acc": 0.01, "lyapunov": 1.4861254643296342, "grad_norm": 0.11020465642062108, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004269584857187939, "time_sec": 41.60934782028198 }, { "epoch": 83, "train_loss": 5.265614703063965, "train_acc": 0.00942, "test_loss": 4.864893129730224, "test_acc": 0.01, "lyapunov": 1.4825067782341061, "grad_norm": 0.09011764156233357, "grad_max_sv": 0.002433748124167323, "grad_min_sv": 0.0, "grad_condition": 2433748124.167323, "lr": 0.0004166156266419484, "time_sec": 41.60301470756531 }, { "epoch": 84, "train_loss": 5.262646561889649, "train_acc": 0.0091, "test_loss": 4.719803262329101, "test_acc": 0.01, "lyapunov": 1.4800378392114664, "grad_norm": 0.08987030714157009, "grad_max_sv": 0.005705382255837321, "grad_min_sv": 0.0, "grad_condition": 5705382255.837321, "lr": 0.0004063093427071373, "time_sec": 41.6301634311676 }, { "epoch": 85, "train_loss": 5.263007119445801, "train_acc": 0.00892, "test_loss": 4.765390521240234, "test_acc": 0.01, "lyapunov": 1.4803728941456435, "grad_norm": 0.08908420576392925, "grad_max_sv": 0.005673544481396675, "grad_min_sv": 0.0, "grad_condition": 5673544481.396675, "lr": 0.0003960441545911199, "time_sec": 41.6158664226532 }, { "epoch": 86, "train_loss": 5.261938611297607, "train_acc": 0.00896, "test_loss": 4.7486605583190915, "test_acc": 0.01, "lyapunov": 1.479363068900145, "grad_norm": 0.08783615573103698, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 41.63826298713684 }, { "epoch": 87, "train_loss": 5.263675572814941, "train_acc": 0.00854, "test_loss": 4.729234335327148, "test_acc": 0.01, "lyapunov": 1.481331856354423, "grad_norm": 0.08839938213840319, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 41.63784456253052 }, { "epoch": 88, "train_loss": 5.262854153900147, "train_acc": 0.00876, "test_loss": 4.702548780822754, "test_acc": 0.01, "lyapunov": 1.4803594689235053, "grad_norm": 0.08793981551347788, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 41.71681451797485 }, { "epoch": 89, "train_loss": 5.2630352787780765, "train_acc": 0.00878, "test_loss": 4.71384239654541, "test_acc": 0.01, "lyapunov": 1.4806065233162298, "grad_norm": 0.08814160681144886, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 41.7017023563385 }, { "epoch": 90, "train_loss": 5.262895381469726, "train_acc": 0.00916, "test_loss": 4.708866213226318, "test_acc": 0.01, "lyapunov": 1.4804326811105089, "grad_norm": 0.08915485528106772, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 41.66344165802002 }, { "epoch": 91, "train_loss": 5.2640660131835935, "train_acc": 0.00894, "test_loss": 4.7449420501708985, "test_acc": 0.01, "lyapunov": 1.481703461588496, "grad_norm": 0.09104557989631236, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 41.65228295326233 }, { "epoch": 92, "train_loss": 5.2634638612365725, "train_acc": 0.00882, "test_loss": 4.755833000946045, "test_acc": 0.01, "lyapunov": 1.4810923280008614, "grad_norm": 0.08888836178350999, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 41.6901330947876 }, { "epoch": 93, "train_loss": 5.264835737762451, "train_acc": 0.00874, "test_loss": 4.721351288604736, "test_acc": 0.01, "lyapunov": 1.4826934395543754, "grad_norm": 0.08947356736587055, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 41.6052131652832 }, { "epoch": 94, "train_loss": 5.263670272369385, "train_acc": 0.00868, "test_loss": 4.785962379455566, "test_acc": 0.01, "lyapunov": 1.4813081669380597, "grad_norm": 0.08849247443481073, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 41.60963582992554 }, { "epoch": 95, "train_loss": 5.2619873828125, "train_acc": 0.00798, "test_loss": 4.723102865600586, "test_acc": 0.01, "lyapunov": 1.479443594927678, "grad_norm": 0.08787170616898271, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 41.6090726852417 }, { "epoch": 96, "train_loss": 5.264093981323242, "train_acc": 0.00886, "test_loss": 4.719023175048828, "test_acc": 0.01, "lyapunov": 1.4818146923923736, "grad_norm": 0.08820019238952795, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 41.62479615211487 }, { "epoch": 97, "train_loss": 5.2660337771606445, "train_acc": 0.00826, "test_loss": 4.683718409729004, "test_acc": 0.01, "lyapunov": 1.4838567975232058, "grad_norm": 0.08832542758192675, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 41.61792826652527 }, { "epoch": 98, "train_loss": 5.264854827270508, "train_acc": 0.00872, "test_loss": 4.66099263305664, "test_acc": 0.01, "lyapunov": 1.4826005797861788, "grad_norm": 0.08770768444548716, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 41.65434980392456 }, { "epoch": 99, "train_loss": 5.26445282623291, "train_acc": 0.00872, "test_loss": 4.680420280456543, "test_acc": 0.01, "lyapunov": 1.482219386588582, "grad_norm": 0.08789455257207789, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 41.626431465148926 }, { "epoch": 100, "train_loss": 5.267974179992676, "train_acc": 0.00926, "test_loss": 4.719721762084961, "test_acc": 0.01, "lyapunov": 1.4858673469489798, "grad_norm": 0.08804026825834858, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 41.61785125732422 }, { "epoch": 101, "train_loss": 5.265785012969971, "train_acc": 0.00908, "test_loss": 4.677582652282715, "test_acc": 0.01, "lyapunov": 1.4835739272939579, "grad_norm": 0.08811206484625347, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 41.61317491531372 }, { "epoch": 102, "train_loss": 5.262550980682373, "train_acc": 0.00804, "test_loss": 4.721813179779053, "test_acc": 0.01, "lyapunov": 1.4801046043405752, "grad_norm": 0.08851673086495025, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 41.67564344406128 }, { "epoch": 103, "train_loss": 5.2642667413330075, "train_acc": 0.00882, "test_loss": 4.740510238647461, "test_acc": 0.01, "lyapunov": 1.4820212802618666, "grad_norm": 0.08821117687751044, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 41.63251256942749 }, { "epoch": 104, "train_loss": 5.263534827728272, "train_acc": 0.0081, "test_loss": 4.700486143493652, "test_acc": 0.01, "lyapunov": 1.4811951995200818, "grad_norm": 0.08907217589685106, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 41.62003540992737 }, { "epoch": 105, "train_loss": 5.263595247192383, "train_acc": 0.00866, "test_loss": 4.685244355773926, "test_acc": 0.01, "lyapunov": 1.4812764624500518, "grad_norm": 0.087999698905291, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 41.59307098388672 }, { "epoch": 106, "train_loss": 5.2640459841918945, "train_acc": 0.00788, "test_loss": 4.679230912780762, "test_acc": 0.01, "lyapunov": 1.481674498914148, "grad_norm": 0.08791576128060906, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 41.62804102897644 }, { "epoch": 107, "train_loss": 5.264458420715332, "train_acc": 0.00878, "test_loss": 4.693680247497559, "test_acc": 0.01, "lyapunov": 1.4822333346852257, "grad_norm": 0.0877864562223225, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 41.72821760177612 }, { "epoch": 108, "train_loss": 5.263148934020996, "train_acc": 0.0092, "test_loss": 4.703213790130615, "test_acc": 0.01, "lyapunov": 1.480785415300628, "grad_norm": 0.08786524330498742, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 41.68737983703613 }, { "epoch": 109, "train_loss": 5.264703175201416, "train_acc": 0.0078, "test_loss": 4.703215410614014, "test_acc": 0.01, "lyapunov": 1.482531173454831, "grad_norm": 0.0887187166875537, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 41.6301372051239 }, { "epoch": 110, "train_loss": 5.262354034423828, "train_acc": 0.00878, "test_loss": 4.673253472900391, "test_acc": 0.01, "lyapunov": 1.4798865848794922, "grad_norm": 0.08823123281084728, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 41.61501979827881 }, { "epoch": 111, "train_loss": 5.261907596282959, "train_acc": 0.00774, "test_loss": 4.6810761657714846, "test_acc": 0.01, "lyapunov": 1.4794099962010103, "grad_norm": 0.08847327230851044, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 41.66792058944702 }, { "epoch": 112, "train_loss": 5.263451714782715, "train_acc": 0.00876, "test_loss": 4.675498142242431, "test_acc": 0.01, "lyapunov": 1.4811130951127738, "grad_norm": 0.08821763372055312, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 41.6463463306427 }, { "epoch": 113, "train_loss": 5.271167716522217, "train_acc": 0.00842, "test_loss": 4.685236253356933, "test_acc": 0.01, "lyapunov": 1.489286311447163, "grad_norm": 0.08951867713473023, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 41.74271559715271 }, { "epoch": 114, "train_loss": 5.271448510589599, "train_acc": 0.00896, "test_loss": 4.690647507476807, "test_acc": 0.01, "lyapunov": 1.4897843382852463, "grad_norm": 0.08820177476113898, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 41.668110609054565 }, { "epoch": 115, "train_loss": 5.2816896908569335, "train_acc": 0.00868, "test_loss": 4.690107788085937, "test_acc": 0.01, "lyapunov": 1.49836193996927, "grad_norm": 0.0881224924879974, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 41.65963578224182 }, { "epoch": 116, "train_loss": 5.265034445343018, "train_acc": 0.00848, "test_loss": 4.69013021774292, "test_acc": 0.01, "lyapunov": 1.4828510912483002, "grad_norm": 0.0884889002186026, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 41.68511462211609 }, { "epoch": 117, "train_loss": 5.26604537612915, "train_acc": 0.00834, "test_loss": 4.690117681884765, "test_acc": 0.01, "lyapunov": 1.4837996590777736, "grad_norm": 0.087812082346243, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 41.62825393676758 }, { "epoch": 118, "train_loss": 5.271575555877686, "train_acc": 0.00838, "test_loss": 4.688699510192871, "test_acc": 0.01, "lyapunov": 1.4897897758752183, "grad_norm": 0.08852661249085975, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 41.813793897628784 }, { "epoch": 119, "train_loss": 5.270083126525879, "train_acc": 0.00882, "test_loss": 4.678613103485107, "test_acc": 0.01, "lyapunov": 1.4881404150477455, "grad_norm": 0.08809098199633093, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 41.60239052772522 }, { "epoch": 120, "train_loss": 5.2668604069519045, "train_acc": 0.00916, "test_loss": 4.668810566711426, "test_acc": 0.01, "lyapunov": 1.484404284630895, "grad_norm": 0.08801465824181619, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 41.67430233955383 }, { "epoch": 121, "train_loss": 5.270687980041504, "train_acc": 0.00844, "test_loss": 4.678598808288574, "test_acc": 0.01, "lyapunov": 1.4865265313316793, "grad_norm": 0.08823636157170499, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 41.651268005371094 }, { "epoch": 122, "train_loss": 5.262444466705322, "train_acc": 0.00858, "test_loss": 4.678612301635742, "test_acc": 0.01, "lyapunov": 1.48004513079553, "grad_norm": 0.09003261469940216, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 41.676185607910156 }, { "epoch": 123, "train_loss": 5.263941179351806, "train_acc": 0.0086, "test_loss": 4.671801266479492, "test_acc": 0.01, "lyapunov": 1.4817558716020316, "grad_norm": 0.09047110449687606, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 41.740845918655396 }, { "epoch": 124, "train_loss": 5.269082255859375, "train_acc": 0.00892, "test_loss": 4.671809730529785, "test_acc": 0.01, "lyapunov": 1.4871390643327131, "grad_norm": 0.08793369061349017, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 41.75574517250061 }, { "epoch": 125, "train_loss": 5.262843768310547, "train_acc": 0.00886, "test_loss": 4.662115892028808, "test_acc": 0.01, "lyapunov": 1.4804938851719927, "grad_norm": 0.08792553586108803, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 41.601502656936646 }, { "epoch": 126, "train_loss": 5.262783556365966, "train_acc": 0.0087, "test_loss": 4.671795330810546, "test_acc": 0.01, "lyapunov": 1.4804595739335356, "grad_norm": 0.08818916489651518, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 41.719630002975464 }, { "epoch": 127, "train_loss": 5.287085924682617, "train_acc": 0.00884, "test_loss": 4.670085035705567, "test_acc": 0.01, "lyapunov": 1.5052251651159028, "grad_norm": 0.09375403073023182, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 41.655165672302246 }, { "epoch": 128, "train_loss": 5.3060646118164065, "train_acc": 0.00794, "test_loss": 4.6709625457763675, "test_acc": 0.01, "lyapunov": 1.5216917436750954, "grad_norm": 0.08857015682665342, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 41.698471546173096 }, { "epoch": 129, "train_loss": 5.263810299682617, "train_acc": 0.00862, "test_loss": 4.679794757080078, "test_acc": 0.01, "lyapunov": 1.4815860233648355, "grad_norm": 0.08793008720913074, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 41.65286087989807 }, { "epoch": 130, "train_loss": 5.2642881167602535, "train_acc": 0.00886, "test_loss": 4.679787918853759, "test_acc": 0.01, "lyapunov": 1.4821607542159918, "grad_norm": 0.08826309404088324, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 41.60878133773804 }, { "epoch": 131, "train_loss": 5.264142718353272, "train_acc": 0.00912, "test_loss": 4.679794540405274, "test_acc": 0.01, "lyapunov": 1.4819643613322617, "grad_norm": 0.0879145106714535, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 41.631954193115234 }, { "epoch": 132, "train_loss": 5.264426311187744, "train_acc": 0.00912, "test_loss": 4.686964068603515, "test_acc": 0.01, "lyapunov": 1.4822249098507034, "grad_norm": 0.08772387144138033, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 41.61648106575012 }, { "epoch": 133, "train_loss": 5.263279991149902, "train_acc": 0.00928, "test_loss": 4.673583326721191, "test_acc": 0.01, "lyapunov": 1.481004032332574, "grad_norm": 0.08756701265820996, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 41.61954092979431 }, { "epoch": 134, "train_loss": 5.264391135559082, "train_acc": 0.00916, "test_loss": 4.673584260559082, "test_acc": 0.01, "lyapunov": 1.482238910387239, "grad_norm": 0.08773099630417767, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 41.636422872543335 }, { "epoch": 135, "train_loss": 5.264316839904785, "train_acc": 0.00918, "test_loss": 4.673586289215088, "test_acc": 0.01, "lyapunov": 1.4821837125226969, "grad_norm": 0.0883951408561693, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 41.637362241744995 }, { "epoch": 136, "train_loss": 5.263837189178467, "train_acc": 0.00856, "test_loss": 4.673583441162109, "test_acc": 0.01, "lyapunov": 1.4816227761071052, "grad_norm": 0.08805256597520511, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 41.648523807525635 }, { "epoch": 137, "train_loss": 5.263810054168701, "train_acc": 0.00914, "test_loss": 4.673584091186523, "test_acc": 0.01, "lyapunov": 1.4815898499525417, "grad_norm": 0.08812282585660734, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 41.73938012123108 }, { "epoch": 138, "train_loss": 5.2631301567077635, "train_acc": 0.00882, "test_loss": 4.673581381225586, "test_acc": 0.01, "lyapunov": 1.4808570945354373, "grad_norm": 0.0884075853889321, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 41.70086741447449 }, { "epoch": 139, "train_loss": 5.264147056427002, "train_acc": 0.00966, "test_loss": 4.673584265136719, "test_acc": 0.01, "lyapunov": 1.4819788155348406, "grad_norm": 0.08781225710160669, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 41.63281536102295 }, { "epoch": 140, "train_loss": 5.264177637023926, "train_acc": 0.00946, "test_loss": 4.673582272338868, "test_acc": 0.01, "lyapunov": 1.4820371799151917, "grad_norm": 0.08778605437009919, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 41.605711221694946 }, { "epoch": 141, "train_loss": 5.264175823974609, "train_acc": 0.01, "test_loss": 4.673583470153808, "test_acc": 0.01, "lyapunov": 1.482038261030641, "grad_norm": 0.08820186315365212, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 41.616660594940186 }, { "epoch": 142, "train_loss": 5.263000276947022, "train_acc": 0.01, "test_loss": 4.67358302154541, "test_acc": 0.01, "lyapunov": 1.4806900521373505, "grad_norm": 0.08785028349994792, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 41.626938819885254 }, { "epoch": 143, "train_loss": 5.264303789367676, "train_acc": 0.0093, "test_loss": 4.673582839202881, "test_acc": 0.01, "lyapunov": 1.4821641326255506, "grad_norm": 0.08832630889985595, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 41.62687826156616 }, { "epoch": 144, "train_loss": 5.266550144958496, "train_acc": 0.01, "test_loss": 4.673582318115234, "test_acc": 0.01, "lyapunov": 1.4840948478035305, "grad_norm": 0.08863982897252927, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 41.63750672340393 }, { "epoch": 145, "train_loss": 5.2637120777893065, "train_acc": 0.01, "test_loss": 4.673582674407959, "test_acc": 0.01, "lyapunov": 1.4815035524880489, "grad_norm": 0.08799138407501185, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 41.61049675941467 }, { "epoch": 146, "train_loss": 5.263380687713623, "train_acc": 0.01, "test_loss": 4.6735828002929685, "test_acc": 0.01, "lyapunov": 1.48112582825029, "grad_norm": 0.08789323778024616, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 41.664053201675415 }, { "epoch": 147, "train_loss": 5.262870178375244, "train_acc": 0.01, "test_loss": 4.67358247756958, "test_acc": 0.01, "lyapunov": 1.4805500345766698, "grad_norm": 0.08785274592155841, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 41.73871088027954 }, { "epoch": 148, "train_loss": 5.263046730651856, "train_acc": 0.01, "test_loss": 4.673582760620117, "test_acc": 0.01, "lyapunov": 1.480766166811404, "grad_norm": 0.08817919214333009, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 41.71699619293213 }, { "epoch": 149, "train_loss": 5.264003658447265, "train_acc": 0.01, "test_loss": 4.673582760620117, "test_acc": 0.01, "lyapunov": 1.4818289621406808, "grad_norm": 0.08840976368023683, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 41.63391995429993 }, { "epoch": 150, "train_loss": 5.264799559326172, "train_acc": 0.01, "test_loss": 4.673582650756836, "test_acc": 0.01, "lyapunov": 1.4827044315045448, "grad_norm": 0.08814260335342491, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 41.604254484176636 } ], "8": [ { "epoch": 1, "train_loss": 5.146115896911621, "train_acc": 0.02178, "test_loss": 4.658292015838623, "test_acc": 0.0179, "lyapunov": 2.2941700692676825, "grad_norm": 5.7514440172256105, "grad_max_sv": 4.608755576610565, "grad_min_sv": 9.931108821970013e-08, "grad_condition": 54298677.31321855, "lr": 0.0009998903417374227, "time_sec": 86.91112756729126 }, { "epoch": 2, "train_loss": 4.702691088256836, "train_acc": 0.02976, "test_loss": 4.6687107803344725, "test_acc": 0.0173, "lyapunov": 1.8152018111685049, "grad_norm": 3.1269645106600352, "grad_max_sv": 2.3287330240011217, "grad_min_sv": 5.3721432058395636e-08, "grad_condition": 52432891.31661774, "lr": 0.0009995614150494292, "time_sec": 86.96670389175415 }, { "epoch": 3, "train_loss": 4.563177616271973, "train_acc": 0.03108, "test_loss": 4.458634540557862, "test_acc": 0.0275, "lyapunov": 1.659614868481141, "grad_norm": 1.6241391637016038, "grad_max_sv": 1.0878711834549903, "grad_min_sv": 2.6067565292442475e-08, "grad_condition": 83662403.24623688, "lr": 0.0009990133642141358, "time_sec": 86.90370392799377 }, { "epoch": 4, "train_loss": 4.516682284240723, "train_acc": 0.03726, "test_loss": 4.491609892272949, "test_acc": 0.0226, "lyapunov": 1.5915839062322437, "grad_norm": 1.140832409431892, "grad_max_sv": 0.6813461020588875, "grad_min_sv": 1.4620473591086398e-08, "grad_condition": 563097834.1159084, "lr": 0.0009982464296247522, "time_sec": 86.99007058143616 }, { "epoch": 5, "train_loss": 4.5070478215026855, "train_acc": 0.04338, "test_loss": 4.482846225738525, "test_acc": 0.0231, "lyapunov": 1.5719971531797248, "grad_norm": 0.9891134281920906, "grad_max_sv": 0.576826149970293, "grad_min_sv": 1.4178649894447393e-08, "grad_condition": 58885947.278740086, "lr": 0.0009972609476841367, "time_sec": 86.98556971549988 }, { "epoch": 6, "train_loss": 4.547509643402099, "train_acc": 0.0439, "test_loss": 4.9390108833312985, "test_acc": 0.0116, "lyapunov": 1.566867695744995, "grad_norm": 0.8577969738236341, "grad_max_sv": 0.45468067899346354, "grad_min_sv": 1.1785924136642478e-08, "grad_condition": 51467445.538705364, "lr": 0.000996057350657239, "time_sec": 86.93410611152649 }, { "epoch": 7, "train_loss": 4.532205999908447, "train_acc": 0.04932, "test_loss": 4.854185777282715, "test_acc": 0.0105, "lyapunov": 1.5658333350325484, "grad_norm": 0.7813900002362055, "grad_max_sv": 0.42395056039094925, "grad_min_sv": 1.0807322919567653e-08, "grad_condition": 102461132.44291899, "lr": 0.000994636166481494, "time_sec": 86.96581149101257 }, { "epoch": 8, "train_loss": 4.556547904968261, "train_acc": 0.0504, "test_loss": 5.202551012420654, "test_acc": 0.0104, "lyapunov": 1.5580533120943152, "grad_norm": 0.7496749300980402, "grad_max_sv": 0.3704929508268833, "grad_min_sv": 9.9690008810438e-09, "grad_condition": 130808798.44108884, "lr": 0.0009929980185352525, "time_sec": 86.94089555740356 }, { "epoch": 9, "train_loss": 4.701766607666015, "train_acc": 0.03756, "test_loss": 5.755129487609863, "test_acc": 0.01, "lyapunov": 1.5552253073743543, "grad_norm": 0.6765304040507019, "grad_max_sv": 0.36201889589428904, "grad_min_sv": 8.426840739095276e-09, "grad_condition": 62920470.9578716, "lr": 0.0009911436253643444, "time_sec": 86.93878936767578 }, { "epoch": 10, "train_loss": 4.765756509094238, "train_acc": 0.03202, "test_loss": 5.775740480041504, "test_acc": 0.01, "lyapunov": 1.5391303578301159, "grad_norm": 0.7537997383732445, "grad_max_sv": 0.34123560786247253, "grad_min_sv": 8.077983985887994e-09, "grad_condition": 51423310.42648181, "lr": 0.0009890738003669028, "time_sec": 86.94973969459534 }, { "epoch": 11, "train_loss": 4.81721549484253, "train_acc": 0.0287, "test_loss": 5.310749195861816, "test_acc": 0.01, "lyapunov": 1.5252552425769894, "grad_norm": 0.6724423278308185, "grad_max_sv": 0.2991580605506897, "grad_min_sv": 5.889135633492526e-09, "grad_condition": 125659233.84784427, "lr": 0.00098678945143658, "time_sec": 86.92238068580627 }, { "epoch": 12, "train_loss": 4.815476130065918, "train_acc": 0.03228, "test_loss": 4.919392412567139, "test_acc": 0.01, "lyapunov": 1.5252421408358132, "grad_norm": 0.6745068286502589, "grad_max_sv": 0.2930708375293761, "grad_min_sv": 6.114008772872826e-09, "grad_condition": 71899366.71277946, "lr": 0.0009842915805643154, "time_sec": 86.96433067321777 }, { "epoch": 13, "train_loss": 4.802655950775146, "train_acc": 0.03752, "test_loss": 4.738039018249512, "test_acc": 0.01, "lyapunov": 1.5223182784321974, "grad_norm": 0.6997812002840638, "grad_max_sv": 0.34992206916213037, "grad_min_sv": 8.056309852566556e-09, "grad_condition": 47743142.04490039, "lr": 0.000981581283398829, "time_sec": 86.93432188034058 }, { "epoch": 14, "train_loss": 4.879040807647705, "train_acc": 0.03196, "test_loss": 4.635845722961426, "test_acc": 0.01, "lyapunov": 1.5264948713200173, "grad_norm": 0.7132128709453732, "grad_max_sv": 0.37259799614548683, "grad_min_sv": 7.726031005933498e-09, "grad_condition": 77087531.09708562, "lr": 0.0009786597487660333, "time_sec": 86.92895364761353 }, { "epoch": 15, "train_loss": 4.93996203048706, "train_acc": 0.0286, "test_loss": 4.715687692260742, "test_acc": 0.01, "lyapunov": 1.5275609859115327, "grad_norm": 0.7145493932975088, "grad_max_sv": 0.3383642140775919, "grad_min_sv": 6.660084050924553e-09, "grad_condition": 63568945.70900831, "lr": 0.0009755282581475766, "time_sec": 86.93708157539368 }, { "epoch": 16, "train_loss": 4.951732353668213, "train_acc": 0.03108, "test_loss": 4.694218672180176, "test_acc": 0.01, "lyapunov": 1.5221876610270546, "grad_norm": 0.6526072701529334, "grad_max_sv": 0.29856473468244077, "grad_min_sv": 5.5810975953029866e-09, "grad_condition": 3669494078.4381485, "lr": 0.0009721881851187403, "time_sec": 86.95431900024414 }, { "epoch": 17, "train_loss": 5.028552846374511, "train_acc": 0.02936, "test_loss": 4.582682956695557, "test_acc": 0.0148, "lyapunov": 1.5572718967257253, "grad_norm": 0.8395071465637489, "grad_max_sv": 0.2635829897597432, "grad_min_sv": 4.546329786998837e-09, "grad_condition": 9308629659.195911, "lr": 0.0009686409947459456, "time_sec": 86.94067001342773 }, { "epoch": 18, "train_loss": 5.080957429504394, "train_acc": 0.02958, "test_loss": 4.743882189178467, "test_acc": 0.01, "lyapunov": 1.573465526256415, "grad_norm": 0.7060094795148925, "grad_max_sv": 0.26090904884040356, "grad_min_sv": 4.9669986091141484e-09, "grad_condition": 158829567.68689433, "lr": 0.0009648882429441254, "time_sec": 86.93801307678223 }, { "epoch": 19, "train_loss": 5.163744027404785, "train_acc": 0.0251, "test_loss": 5.350689000701904, "test_acc": 0.01, "lyapunov": 1.5783103155662945, "grad_norm": 0.7236371812810315, "grad_max_sv": 0.32311243638396264, "grad_min_sv": 4.661415661322624e-09, "grad_condition": 362163554.1712912, "lr": 0.00096093157579425, "time_sec": 86.95386362075806 }, { "epoch": 20, "train_loss": 5.177699388122559, "train_acc": 0.02336, "test_loss": 4.728291717529297, "test_acc": 0.01, "lyapunov": 1.5543774262718533, "grad_norm": 0.6278235228394613, "grad_max_sv": 0.2316085107624531, "grad_min_sv": 2.9537814670154304e-09, "grad_condition": 3474032967.5441117, "lr": 0.0009567727288213001, "time_sec": 86.9823546409607 }, { "epoch": 21, "train_loss": 5.2000909381103515, "train_acc": 0.02436, "test_loss": 4.806672692871094, "test_acc": 0.01, "lyapunov": 1.5755902729985658, "grad_norm": 0.766013265906278, "grad_max_sv": 0.21709984578192235, "grad_min_sv": 2.2318304187728858e-09, "grad_condition": 8696284488.710842, "lr": 0.0009524135262330095, "time_sec": 86.9815993309021 }, { "epoch": 22, "train_loss": 5.172516224975586, "train_acc": 0.02578, "test_loss": 5.050736184692383, "test_acc": 0.01, "lyapunov": 1.5738651392709873, "grad_norm": 0.8548378900544575, "grad_max_sv": 0.21818067859858276, "grad_min_sv": 2.4550293141510983e-09, "grad_condition": 1446353295.730711, "lr": 0.0009478558801197061, "time_sec": 86.96929454803467 }, { "epoch": 23, "train_loss": 5.301382947845459, "train_acc": 0.01554, "test_loss": 5.921122685241699, "test_acc": 0.01, "lyapunov": 1.5795374422731912, "grad_norm": 1.072625133417376, "grad_max_sv": 0.29671905748546124, "grad_min_sv": 3.4811909517637897e-09, "grad_condition": 2268879972.814607, "lr": 0.000943101789615607, "time_sec": 87.05305171012878 }, { "epoch": 24, "train_loss": 5.308596148986816, "train_acc": 0.01028, "test_loss": 5.915314376831055, "test_acc": 0.01, "lyapunov": 1.5046202849853985, "grad_norm": 0.4300250072511413, "grad_max_sv": 0.29422527775168417, "grad_min_sv": 2.563464584050615e-09, "grad_condition": 1801474829.549522, "lr": 0.0009381533400219313, "time_sec": 86.9294683933258 }, { "epoch": 25, "train_loss": 5.30389043762207, "train_acc": 0.01028, "test_loss": 5.442194981384278, "test_acc": 0.01, "lyapunov": 1.5036146476140717, "grad_norm": 0.369004063413563, "grad_max_sv": 0.27016645595431327, "grad_min_sv": 1.563399900968634e-09, "grad_condition": 26105306242.6268, "lr": 0.0009330127018922189, "time_sec": 86.93831205368042 }, { "epoch": 26, "train_loss": 5.310046338348388, "train_acc": 0.00962, "test_loss": 6.1388027900695805, "test_acc": 0.01, "lyapunov": 1.5094104654648726, "grad_norm": 0.3921330241846595, "grad_max_sv": 0.27323133423924445, "grad_min_sv": 2.6655278586792953e-09, "grad_condition": 217735166.8546676, "lr": 0.000927682130080253, "time_sec": 87.04652237892151 }, { "epoch": 27, "train_loss": 5.301853795013428, "train_acc": 0.01042, "test_loss": 5.515717539215088, "test_acc": 0.01, "lyapunov": 1.508369487569765, "grad_norm": 0.30565280482621787, "grad_max_sv": 0.22872439920902252, "grad_min_sv": 7.688681849029263e-10, "grad_condition": 46178443525.53847, "lr": 0.0009221639627510072, "time_sec": 87.04486989974976 }, { "epoch": 28, "train_loss": 5.29817862487793, "train_acc": 0.00972, "test_loss": 5.770360753631592, "test_acc": 0.01, "lyapunov": 1.5080109913940625, "grad_norm": 0.277614712245464, "grad_max_sv": 0.196561511605978, "grad_min_sv": 1.2118332304701748e-12, "grad_condition": 124861391701.8731, "lr": 0.0009164606203550494, "time_sec": 86.97034883499146 }, { "epoch": 29, "train_loss": 5.299116547241211, "train_acc": 0.00974, "test_loss": 6.629917897796631, "test_acc": 0.01, "lyapunov": 1.5079803863144896, "grad_norm": 0.26773989693385675, "grad_max_sv": 0.19062257409095765, "grad_min_sv": 1.316391307854978e-12, "grad_condition": 118514569073.00333, "lr": 0.0009105746045668516, "time_sec": 86.9515905380249 }, { "epoch": 30, "train_loss": 5.301858203277588, "train_acc": 0.00952, "test_loss": 7.616147738647461, "test_acc": 0.01, "lyapunov": 1.5108254772927754, "grad_norm": 0.2739642757327739, "grad_max_sv": 0.2010789501480758, "grad_min_sv": 3.194205121044685e-10, "grad_condition": 84817443385.97237, "lr": 0.0009045084971874733, "time_sec": 86.96926951408386 }, { "epoch": 31, "train_loss": 5.299806740875244, "train_acc": 0.01004, "test_loss": 7.885091897583008, "test_acc": 0.01, "lyapunov": 1.5118325930422225, "grad_norm": 0.23726371187902562, "grad_max_sv": 0.1534210465848446, "grad_min_sv": 3.777587378576868e-12, "grad_condition": 117298463694.8497, "lr": 0.0008982649590120977, "time_sec": 86.93767380714417 }, { "epoch": 32, "train_loss": 5.294980096740723, "train_acc": 0.01054, "test_loss": 7.175394052124023, "test_acc": 0.01, "lyapunov": 1.5122702329055122, "grad_norm": 0.18490861832393377, "grad_max_sv": 0.09243289618752897, "grad_min_sv": 7.151144434390166e-15, "grad_condition": 91554722602.0434, "lr": 0.0008918467286629196, "time_sec": 86.92625045776367 }, { "epoch": 33, "train_loss": 5.302116135559082, "train_acc": 0.00916, "test_loss": 6.950838031005859, "test_acc": 0.01, "lyapunov": 1.514583631854533, "grad_norm": 0.22539071559889906, "grad_max_sv": 0.14949913807213305, "grad_min_sv": 3.03463898255766e-13, "grad_condition": 123295125931.77371, "lr": 0.0008852566213878943, "time_sec": 86.96885013580322 }, { "epoch": 34, "train_loss": 5.298243276367187, "train_acc": 0.00926, "test_loss": 7.482379321289063, "test_acc": 0.01, "lyapunov": 1.514684440839626, "grad_norm": 0.18381668144055355, "grad_max_sv": 0.10984101705253124, "grad_min_sv": 7.163631845931476e-15, "grad_condition": 109054948912.02344, "lr": 0.000878497527825878, "time_sec": 87.12512397766113 }, { "epoch": 35, "train_loss": 5.308689108428955, "train_acc": 0.00958, "test_loss": 7.612553489685059, "test_acc": 0.01, "lyapunov": 1.5216995715485204, "grad_norm": 0.22567054848299975, "grad_max_sv": 0.1234450839459896, "grad_min_sv": 5.377204609898583e-14, "grad_condition": 117334156157.8593, "lr": 0.000871572412738697, "time_sec": 86.95104956626892 }, { "epoch": 36, "train_loss": 5.303922519226075, "train_acc": 0.00964, "test_loss": 8.831939950561523, "test_acc": 0.01, "lyapunov": 1.5175864534914647, "grad_norm": 0.2187679660724696, "grad_max_sv": 0.13990986812859774, "grad_min_sv": 1.80366368447702e-13, "grad_condition": 123448577181.446, "lr": 0.0008644843137107055, "time_sec": 86.92687749862671 }, { "epoch": 37, "train_loss": 5.303381102600098, "train_acc": 0.00916, "test_loss": 6.551040885925293, "test_acc": 0.01, "lyapunov": 1.5200756013850727, "grad_norm": 0.1798120608859804, "grad_max_sv": 0.10729131288826466, "grad_min_sv": 1.364290789538136e-14, "grad_condition": 105529300010.77225, "lr": 0.0008572363398164014, "time_sec": 86.95336151123047 }, { "epoch": 38, "train_loss": 5.30714798034668, "train_acc": 0.0094, "test_loss": 6.027979496765137, "test_acc": 0.01, "lyapunov": 1.5257836866866596, "grad_norm": 0.1909663013844348, "grad_max_sv": 0.07728723548352719, "grad_min_sv": 4.265317043954499e-24, "grad_condition": 77287235483.15219, "lr": 0.0008498316702566826, "time_sec": 86.9212384223938 }, { "epoch": 39, "train_loss": 5.306197135772705, "train_acc": 0.00974, "test_loss": 6.997566845703125, "test_acc": 0.01, "lyapunov": 1.5238893687572626, "grad_norm": 0.18383519139729404, "grad_max_sv": 0.1007891584187746, "grad_min_sv": 5.3239199179750705e-15, "grad_condition": 100154494637.09956, "lr": 0.0008422735529643442, "time_sec": 86.89629626274109 }, { "epoch": 40, "train_loss": 5.307650102386474, "train_acc": 0.00992, "test_loss": 6.040484946441651, "test_acc": 0.01, "lyapunov": 1.5250033597507135, "grad_norm": 0.18467843309484097, "grad_max_sv": 0.1127883294597268, "grad_min_sv": 7.1038360456260524e-15, "grad_condition": 111935273841.19809, "lr": 0.0008345653031794289, "time_sec": 87.02732610702515 }, { "epoch": 41, "train_loss": 5.307996878356934, "train_acc": 0.00992, "test_loss": 5.920440175628662, "test_acc": 0.01, "lyapunov": 1.5282226456400683, "grad_norm": 0.16629297131246892, "grad_max_sv": 0.07292309552431106, "grad_min_sv": 1.583549415956451e-17, "grad_condition": 72921914356.18047, "lr": 0.0008267103019950526, "time_sec": 86.94355273246765 }, { "epoch": 42, "train_loss": 5.311696410522461, "train_acc": 0.00968, "test_loss": 6.38518196105957, "test_acc": 0.01, "lyapunov": 1.5307711250032001, "grad_norm": 0.1871179922092424, "grad_max_sv": 0.08245804710313678, "grad_min_sv": 6.943719241443141e-16, "grad_condition": 82389599949.82372, "lr": 0.0008187119948743447, "time_sec": 86.93303918838501 }, { "epoch": 43, "train_loss": 5.307222317810059, "train_acc": 0.00956, "test_loss": 6.652195385742187, "test_acc": 0.01, "lyapunov": 1.5260984678097698, "grad_norm": 0.16067559125539438, "grad_max_sv": 0.09466201290488244, "grad_min_sv": 4.4300769825600874e-16, "grad_condition": 94621173553.03905, "lr": 0.000810573890139155, "time_sec": 86.90417695045471 }, { "epoch": 44, "train_loss": 5.308213620300293, "train_acc": 0.00882, "test_loss": 6.962696185302734, "test_acc": 0.01, "lyapunov": 1.527706109044497, "grad_norm": 0.1609729738345643, "grad_max_sv": 0.07951483679935337, "grad_min_sv": 1.2691498572245332e-19, "grad_condition": 79514825996.07883, "lr": 0.0008022995574311873, "time_sec": 86.90469932556152 }, { "epoch": 45, "train_loss": 5.313642641601563, "train_acc": 0.01004, "test_loss": 6.176641661071777, "test_acc": 0.01, "lyapunov": 1.5278308333643258, "grad_norm": 0.20554701681584006, "grad_max_sv": 0.1498540248721838, "grad_min_sv": 2.7361367599211426e-14, "grad_condition": 145983867269.5576, "lr": 0.0007938926261462363, "time_sec": 86.93738555908203 }, { "epoch": 46, "train_loss": 5.3097161289978025, "train_acc": 0.00952, "test_loss": 6.005211575317383, "test_acc": 0.01, "lyapunov": 1.5284498929977417, "grad_norm": 0.17319376275900747, "grad_max_sv": 0.10527544040232897, "grad_min_sv": 1.6379736406305529e-15, "grad_condition": 105101166914.13033, "lr": 0.0007853567838422158, "time_sec": 86.95744371414185 }, { "epoch": 47, "train_loss": 5.311491881408691, "train_acc": 0.00956, "test_loss": 5.9810846961975095, "test_acc": 0.01, "lyapunov": 1.530076160760182, "grad_norm": 0.1622416677557275, "grad_max_sv": 0.09897023066878319, "grad_min_sv": 1.1070734961814082e-15, "grad_condition": 98861145932.69461, "lr": 0.0007766957746216719, "time_sec": 86.9021110534668 }, { "epoch": 48, "train_loss": 5.310971976165772, "train_acc": 0.00894, "test_loss": 5.884356218719482, "test_acc": 0.01, "lyapunov": 1.5301186023160929, "grad_norm": 0.15478972851501702, "grad_max_sv": 0.09055562000721692, "grad_min_sv": 6.095582881917491e-16, "grad_condition": 90492925874.14865, "lr": 0.0007679133974894982, "time_sec": 86.923269033432 }, { "epoch": 49, "train_loss": 5.313096929931641, "train_acc": 0.00936, "test_loss": 5.441997985839844, "test_acc": 0.01, "lyapunov": 1.5325667373359662, "grad_norm": 0.15811997882687892, "grad_max_sv": 0.09403467867523432, "grad_min_sv": 2.5362328677092476e-16, "grad_condition": 94010861805.62488, "lr": 0.000759013504686565, "time_sec": 86.9168426990509 }, { "epoch": 50, "train_loss": 5.311940245513916, "train_acc": 0.00958, "test_loss": 5.371611124420166, "test_acc": 0.01, "lyapunov": 1.5327015231027628, "grad_norm": 0.14176864627007332, "grad_max_sv": 0.07908807899802923, "grad_min_sv": 2.050192692484369e-32, "grad_condition": 79088078998.02924, "lr": 0.0007499999999999998, "time_sec": 86.92089605331421 }, { "epoch": 51, "train_loss": 5.310895777282715, "train_acc": 0.00916, "test_loss": 5.434047091674804, "test_acc": 0.01, "lyapunov": 1.53158952573986, "grad_norm": 0.1361778166532044, "grad_max_sv": 0.06832279236987233, "grad_min_sv": 6.675573383462495e-16, "grad_condition": 68265680127.16847, "lr": 0.0007408768370508575, "time_sec": 86.94595527648926 }, { "epoch": 52, "train_loss": 5.3132603437805175, "train_acc": 0.01008, "test_loss": 6.7278813507080075, "test_acc": 0.01, "lyapunov": 1.535024075252016, "grad_norm": 0.17384705948913357, "grad_max_sv": 0.04316680300980806, "grad_min_sv": 0.0, "grad_condition": 43166803009.80806, "lr": 0.0007316480175599307, "time_sec": 86.91442537307739 }, { "epoch": 53, "train_loss": 5.3123740222167966, "train_acc": 0.00936, "test_loss": 6.131865232849121, "test_acc": 0.01, "lyapunov": 1.5338834356468962, "grad_norm": 0.1343518088533916, "grad_max_sv": 0.04088693740777671, "grad_min_sv": 0.0, "grad_condition": 40886937407.77672, "lr": 0.0007223175895924635, "time_sec": 86.89388537406921 }, { "epoch": 54, "train_loss": 5.311756536712647, "train_acc": 0.00874, "test_loss": 6.26136455078125, "test_acc": 0.01, "lyapunov": 1.534105893900937, "grad_norm": 0.12044776828887008, "grad_max_sv": 0.018818416306748985, "grad_min_sv": 0.0, "grad_condition": 18818416306.748985, "lr": 0.0007128896457825361, "time_sec": 86.86209654808044 }, { "epoch": 55, "train_loss": 5.314126918182373, "train_acc": 0.00948, "test_loss": 6.455938655853272, "test_acc": 0.01, "lyapunov": 1.5355246698155123, "grad_norm": 0.16535062387735305, "grad_max_sv": 0.048017819551751016, "grad_min_sv": 0.0, "grad_condition": 48017819551.75102, "lr": 0.0007033683215378998, "time_sec": 86.91218829154968 }, { "epoch": 56, "train_loss": 5.3133398397827145, "train_acc": 0.00934, "test_loss": 6.355834351348877, "test_acc": 0.01, "lyapunov": 1.535221906574181, "grad_norm": 0.14103865757116907, "grad_max_sv": 0.040325032686814664, "grad_min_sv": 0.0, "grad_condition": 40325032686.814674, "lr": 0.0006937577932260512, "time_sec": 87.01914978027344 }, { "epoch": 57, "train_loss": 5.315177789154053, "train_acc": 0.00906, "test_loss": 5.778967167663574, "test_acc": 0.01, "lyapunov": 1.5374448241480172, "grad_norm": 0.12626262616875458, "grad_max_sv": 0.04227766813710332, "grad_min_sv": 0.0, "grad_condition": 42277668137.10332, "lr": 0.0006840622763423388, "time_sec": 86.90552043914795 }, { "epoch": 58, "train_loss": 5.314984718017578, "train_acc": 0.0096, "test_loss": 5.680106079101562, "test_acc": 0.01, "lyapunov": 1.536767850141696, "grad_norm": 0.13366926148127872, "grad_max_sv": 0.05202861637808383, "grad_min_sv": 0.0, "grad_condition": 52028616378.083824, "lr": 0.0006742860236609073, "time_sec": 86.97483849525452 }, { "epoch": 59, "train_loss": 5.314250464019775, "train_acc": 0.00922, "test_loss": 5.60796079864502, "test_acc": 0.01, "lyapunov": 1.535877099732304, "grad_norm": 0.13264295460080205, "grad_max_sv": 0.053861632384359835, "grad_min_sv": 0.0, "grad_condition": 53861632384.35984, "lr": 0.0006644333233692913, "time_sec": 86.90899348258972 }, { "epoch": 60, "train_loss": 5.315608520202637, "train_acc": 0.00862, "test_loss": 5.75697197265625, "test_acc": 0.01, "lyapunov": 1.5373123942128837, "grad_norm": 0.13451447891861437, "grad_max_sv": 0.05724321529269218, "grad_min_sv": 0.0, "grad_condition": 57243215292.692184, "lr": 0.0006545084971874734, "time_sec": 86.93145775794983 }, { "epoch": 61, "train_loss": 5.315526120605469, "train_acc": 0.00966, "test_loss": 5.641050135803223, "test_acc": 0.01, "lyapunov": 1.537875465419896, "grad_norm": 0.134018980558527, "grad_max_sv": 0.04659216776490212, "grad_min_sv": 0.0, "grad_condition": 46592167764.902115, "lr": 0.0006445158984722354, "time_sec": 86.9526846408844 }, { "epoch": 62, "train_loss": 5.3171287049865725, "train_acc": 0.0095, "test_loss": 5.52830389251709, "test_acc": 0.01, "lyapunov": 1.5390207541873082, "grad_norm": 0.13900770761864464, "grad_max_sv": 0.05631723469123244, "grad_min_sv": 0.0, "grad_condition": 56317234691.232445, "lr": 0.0006344599103076324, "time_sec": 86.95262598991394 }, { "epoch": 63, "train_loss": 5.321492596435547, "train_acc": 0.00884, "test_loss": 5.732630862426758, "test_acc": 0.01, "lyapunov": 1.5413236017422298, "grad_norm": 0.1533270491872105, "grad_max_sv": 0.04487980231642723, "grad_min_sv": 0.0, "grad_condition": 44879802316.42723, "lr": 0.0006243449435824269, "time_sec": 86.93239831924438 }, { "epoch": 64, "train_loss": 5.315124908752441, "train_acc": 0.0099, "test_loss": 5.382702461242676, "test_acc": 0.01, "lyapunov": 1.5375381320943613, "grad_norm": 0.12218366701103515, "grad_max_sv": 0.032946509402245285, "grad_min_sv": 0.0, "grad_condition": 32946509402.24528, "lr": 0.0006141754350553275, "time_sec": 86.91653037071228 }, { "epoch": 65, "train_loss": 5.317460901031494, "train_acc": 0.00952, "test_loss": 5.498714874267578, "test_acc": 0.01, "lyapunov": 1.5401654679452061, "grad_norm": 0.11182228456659622, "grad_max_sv": 0.020332988910377027, "grad_min_sv": 0.0, "grad_condition": 20332988910.377026, "lr": 0.0006039558454088793, "time_sec": 86.86022281646729 }, { "epoch": 66, "train_loss": 5.315697211608887, "train_acc": 0.00964, "test_loss": 5.722520481872559, "test_acc": 0.01, "lyapunov": 1.5384024250537842, "grad_norm": 0.11947856234602877, "grad_max_sv": 0.012709397682920098, "grad_min_sv": 0.0, "grad_condition": 12709397682.9201, "lr": 0.000593690657292862, "time_sec": 86.83588552474976 }, { "epoch": 67, "train_loss": 5.315312230377197, "train_acc": 0.00948, "test_loss": 5.6552305557250975, "test_acc": 0.01, "lyapunov": 1.5376315924822521, "grad_norm": 0.12716375762874924, "grad_max_sv": 0.026200923277065157, "grad_min_sv": 0.0, "grad_condition": 26200923277.06516, "lr": 0.0005833843733580507, "time_sec": 86.93734240531921 }, { "epoch": 68, "train_loss": 5.316413257446289, "train_acc": 0.00892, "test_loss": 5.644158979797363, "test_acc": 0.01, "lyapunov": 1.5389487700694053, "grad_norm": 0.11329541475422919, "grad_max_sv": 0.025692512933164834, "grad_min_sv": 0.0, "grad_condition": 25692512933.164837, "lr": 0.0005730415142812054, "time_sec": 86.92358016967773 }, { "epoch": 69, "train_loss": 5.317326981048584, "train_acc": 0.00962, "test_loss": 5.646556529998779, "test_acc": 0.01, "lyapunov": 1.5400864053565217, "grad_norm": 0.1245567601020978, "grad_max_sv": 0.024738446017727254, "grad_min_sv": 0.0, "grad_condition": 24738446017.727257, "lr": 0.0005626666167821517, "time_sec": 86.86787414550781 }, { "epoch": 70, "train_loss": 5.317049356994629, "train_acc": 0.00982, "test_loss": 5.6787915084838865, "test_acc": 0.01, "lyapunov": 1.5397665028072074, "grad_norm": 0.118076358762286, "grad_max_sv": 0.03472304726019502, "grad_min_sv": 0.0, "grad_condition": 34723047260.195015, "lr": 0.0005522642316338265, "time_sec": 86.88831448554993 }, { "epoch": 71, "train_loss": 5.315880928039551, "train_acc": 0.00964, "test_loss": 5.735556723022461, "test_acc": 0.01, "lyapunov": 1.5387067657602413, "grad_norm": 0.11912248112688287, "grad_max_sv": 0.025617524981498718, "grad_min_sv": 0.0, "grad_condition": 25617524981.49872, "lr": 0.0005418389216661573, "time_sec": 86.86845374107361 }, { "epoch": 72, "train_loss": 5.320206904296875, "train_acc": 0.00958, "test_loss": 5.694711586761475, "test_acc": 0.01, "lyapunov": 1.5424333557753307, "grad_norm": 0.12792597639508846, "grad_max_sv": 0.03625847464427352, "grad_min_sv": 0.0, "grad_condition": 36258474644.27352, "lr": 0.0005313952597646563, "time_sec": 86.87807965278625 }, { "epoch": 73, "train_loss": 5.318149011688233, "train_acc": 0.0099, "test_loss": 5.715859918212891, "test_acc": 0.01, "lyapunov": 1.5407461092600128, "grad_norm": 0.12131920132322771, "grad_max_sv": 0.04332554340362549, "grad_min_sv": 0.0, "grad_condition": 43325543403.62549, "lr": 0.0005209378268645994, "time_sec": 86.93414950370789 }, { "epoch": 74, "train_loss": 5.316737642364502, "train_acc": 0.0094, "test_loss": 5.432159627532959, "test_acc": 0.01, "lyapunov": 1.5394032800289066, "grad_norm": 0.11202086425017638, "grad_max_sv": 0.02820308110676706, "grad_min_sv": 0.0, "grad_condition": 28203081106.76706, "lr": 0.0005104712099416781, "time_sec": 86.86637806892395 }, { "epoch": 75, "train_loss": 5.317990305633545, "train_acc": 0.00994, "test_loss": 5.894020344543457, "test_acc": 0.01, "lyapunov": 1.5408979687849274, "grad_norm": 0.15447706508859999, "grad_max_sv": 0.01931341988965869, "grad_min_sv": 0.0, "grad_condition": 19313419889.65869, "lr": 0.0004999999999999996, "time_sec": 86.85794830322266 }, { "epoch": 76, "train_loss": 5.329913055419921, "train_acc": 0.00922, "test_loss": 5.356306673431397, "test_acc": 0.01, "lyapunov": 1.5469030404029904, "grad_norm": 0.1130858808468486, "grad_max_sv": 0.020954679837450384, "grad_min_sv": 0.0, "grad_condition": 20954679837.450386, "lr": 0.0004895287900583212, "time_sec": 86.8532190322876 }, { "epoch": 77, "train_loss": 5.317062496490479, "train_acc": 0.01014, "test_loss": 5.6768914947509765, "test_acc": 0.01, "lyapunov": 1.539591530399859, "grad_norm": 0.11763219922287847, "grad_max_sv": 0.03681175904348492, "grad_min_sv": 0.0, "grad_condition": 36811759043.484924, "lr": 0.0004790621731353997, "time_sec": 86.89854335784912 }, { "epoch": 78, "train_loss": 5.321235802612304, "train_acc": 0.00956, "test_loss": 5.498642253875732, "test_acc": 0.01, "lyapunov": 1.5433477379781815, "grad_norm": 0.12257877066992058, "grad_max_sv": 0.002356324018910527, "grad_min_sv": 0.0, "grad_condition": 2356324018.910527, "lr": 0.000468604740235343, "time_sec": 86.82986307144165 }, { "epoch": 79, "train_loss": 5.3170875860595705, "train_acc": 0.00874, "test_loss": 5.678500232696533, "test_acc": 0.01, "lyapunov": 1.5401862192031976, "grad_norm": 0.11850283030771655, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 86.84353518486023 }, { "epoch": 80, "train_loss": 5.319253426513672, "train_acc": 0.00918, "test_loss": 5.127548231506347, "test_acc": 0.01, "lyapunov": 1.5418513970606773, "grad_norm": 0.11699107355632338, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 86.8760769367218 }, { "epoch": 81, "train_loss": 5.317456825408936, "train_acc": 0.00894, "test_loss": 5.307968811035156, "test_acc": 0.01, "lyapunov": 1.5405245113860615, "grad_norm": 0.1284549935774549, "grad_max_sv": 0.0083365049213171, "grad_min_sv": 0.0, "grad_condition": 8336504921.317101, "lr": 0.00043733338321784746, "time_sec": 86.87371492385864 }, { "epoch": 82, "train_loss": 5.317734858398437, "train_acc": 0.00954, "test_loss": 5.0544998031616215, "test_acc": 0.01, "lyapunov": 1.5406023172466345, "grad_norm": 0.120735257297947, "grad_max_sv": 0.02263884055428207, "grad_min_sv": 0.0, "grad_condition": 22638840554.282066, "lr": 0.0004269584857187939, "time_sec": 86.92492771148682 }, { "epoch": 83, "train_loss": 5.32118753692627, "train_acc": 0.00954, "test_loss": 5.125200929260254, "test_acc": 0.01, "lyapunov": 1.5442977073552357, "grad_norm": 0.11585054245697951, "grad_max_sv": 0.004569409461691975, "grad_min_sv": 0.0, "grad_condition": 4569409461.691976, "lr": 0.0004166156266419484, "time_sec": 86.81740093231201 }, { "epoch": 84, "train_loss": 5.317668086853027, "train_acc": 0.00892, "test_loss": 5.523793495178222, "test_acc": 0.01, "lyapunov": 1.5407223094759694, "grad_norm": 0.10949975143698651, "grad_max_sv": 0.01457698536105454, "grad_min_sv": 0.0, "grad_condition": 14576985361.05454, "lr": 0.0004063093427071373, "time_sec": 86.87661004066467 }, { "epoch": 85, "train_loss": 5.327004724578857, "train_acc": 0.00984, "test_loss": 5.3676797477722165, "test_acc": 0.01, "lyapunov": 1.54690202819112, "grad_norm": 0.11567866960588237, "grad_max_sv": 0.00381420748308301, "grad_min_sv": 0.0, "grad_condition": 3814207483.0830092, "lr": 0.0003960441545911199, "time_sec": 86.82225131988525 }, { "epoch": 86, "train_loss": 5.3172469395446775, "train_acc": 0.00898, "test_loss": 4.901917692565918, "test_acc": 0.01, "lyapunov": 1.5404299381748794, "grad_norm": 0.11387390679382547, "grad_max_sv": 0.001853126659989357, "grad_min_sv": 0.0, "grad_condition": 1853126659.989357, "lr": 0.0003858245649446718, "time_sec": 86.82927370071411 }, { "epoch": 87, "train_loss": 5.318947126464844, "train_acc": 0.00926, "test_loss": 5.208927967834473, "test_acc": 0.01, "lyapunov": 1.5421383124788095, "grad_norm": 0.10919909006363937, "grad_max_sv": 0.0032654264010488986, "grad_min_sv": 0.0, "grad_condition": 3265426401.048898, "lr": 0.00037565505641757235, "time_sec": 86.81736421585083 }, { "epoch": 88, "train_loss": 5.318348231048584, "train_acc": 0.00918, "test_loss": 4.997183460998535, "test_acc": 0.01, "lyapunov": 1.5415247068990527, "grad_norm": 0.11341200364232766, "grad_max_sv": 0.006511487392708659, "grad_min_sv": 0.0, "grad_condition": 6511487392.708659, "lr": 0.00036554008969236695, "time_sec": 86.82162237167358 }, { "epoch": 89, "train_loss": 5.318816225433349, "train_acc": 0.00892, "test_loss": 5.18877671661377, "test_acc": 0.01, "lyapunov": 1.5420374519684736, "grad_norm": 0.12034783892609052, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 86.97105526924133 }, { "epoch": 90, "train_loss": 5.318523200531006, "train_acc": 0.00938, "test_loss": 5.115398947143555, "test_acc": 0.01, "lyapunov": 1.5415691600736146, "grad_norm": 0.14346849260322833, "grad_max_sv": 0.02495567239820957, "grad_min_sv": 0.0, "grad_condition": 24955672398.20957, "lr": 0.000345491502812526, "time_sec": 86.88058757781982 }, { "epoch": 91, "train_loss": 5.318174597930908, "train_acc": 0.00928, "test_loss": 5.025017410278321, "test_acc": 0.01, "lyapunov": 1.5413767959150817, "grad_norm": 0.12564666917462933, "grad_max_sv": 0.0075723147485405205, "grad_min_sv": 0.0, "grad_condition": 7572314748.540522, "lr": 0.0003355666766307081, "time_sec": 86.85795545578003 }, { "epoch": 92, "train_loss": 5.318962445831299, "train_acc": 0.00776, "test_loss": 4.925245237731934, "test_acc": 0.01, "lyapunov": 1.5422863734652623, "grad_norm": 0.12308146620405915, "grad_max_sv": 0.0013421432580798865, "grad_min_sv": 0.0, "grad_condition": 1342143258.0798864, "lr": 0.00032571397633909225, "time_sec": 86.79794430732727 }, { "epoch": 93, "train_loss": 5.327239834136963, "train_acc": 0.00902, "test_loss": 5.076303866577148, "test_acc": 0.01, "lyapunov": 1.5474630085098775, "grad_norm": 0.1277051442186759, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 86.82232332229614 }, { "epoch": 94, "train_loss": 5.318930770874023, "train_acc": 0.00872, "test_loss": 4.880594007110596, "test_acc": 0.01, "lyapunov": 1.5422684445100672, "grad_norm": 0.13600368147480044, "grad_max_sv": 0.002521184924989939, "grad_min_sv": 0.0, "grad_condition": 2521184924.9899387, "lr": 0.0003062422067739483, "time_sec": 86.81427669525146 }, { "epoch": 95, "train_loss": 5.319566112213135, "train_acc": 0.00978, "test_loss": 4.991552732849121, "test_acc": 0.01, "lyapunov": 1.5428647238885045, "grad_norm": 0.12437123327866709, "grad_max_sv": 0.012525724712759256, "grad_min_sv": 0.0, "grad_condition": 12525724712.759256, "lr": 0.00029663167846209965, "time_sec": 86.81576943397522 }, { "epoch": 96, "train_loss": 5.321689688720703, "train_acc": 0.00864, "test_loss": 4.8253173141479495, "test_acc": 0.01, "lyapunov": 1.5444780929619089, "grad_norm": 0.12565886868121948, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 86.88868856430054 }, { "epoch": 97, "train_loss": 5.31878070602417, "train_acc": 0.00896, "test_loss": 4.881497433471679, "test_acc": 0.01, "lyapunov": 1.5421305144839275, "grad_norm": 0.11716334018301236, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 86.82862520217896 }, { "epoch": 98, "train_loss": 5.322988173828125, "train_acc": 0.00888, "test_loss": 4.762122218322754, "test_acc": 0.01, "lyapunov": 1.545472724663327, "grad_norm": 0.14401618175686975, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 86.81479406356812 }, { "epoch": 99, "train_loss": 5.318863394622802, "train_acc": 0.00886, "test_loss": 4.714427976989746, "test_acc": 0.01, "lyapunov": 1.5421699697099378, "grad_norm": 0.13101580238155278, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 86.82360768318176 }, { "epoch": 100, "train_loss": 5.32177279083252, "train_acc": 0.00908, "test_loss": 4.741457105255127, "test_acc": 0.01, "lyapunov": 1.5448724360722106, "grad_norm": 0.12685940692823117, "grad_max_sv": 0.0014819118659943342, "grad_min_sv": 0.0, "grad_condition": 1481911865.9943342, "lr": 0.0002499999999999997, "time_sec": 86.83973097801208 }, { "epoch": 101, "train_loss": 5.321585564422607, "train_acc": 0.0095, "test_loss": 4.660526361846924, "test_acc": 0.01, "lyapunov": 1.5446103762482744, "grad_norm": 0.15017654739054603, "grad_max_sv": 0.013982362765818834, "grad_min_sv": 0.0, "grad_condition": 13982362765.818836, "lr": 0.00024098649531343477, "time_sec": 86.89186692237854 }, { "epoch": 102, "train_loss": 5.318927859802246, "train_acc": 0.00892, "test_loss": 4.667855642700196, "test_acc": 0.01, "lyapunov": 1.542065743900016, "grad_norm": 0.14354448313759138, "grad_max_sv": 0.007601975044235587, "grad_min_sv": 0.0, "grad_condition": 7601975044.235586, "lr": 0.0002320866025105016, "time_sec": 86.85510921478271 }, { "epoch": 103, "train_loss": 5.319302808380127, "train_acc": 0.00854, "test_loss": 4.7306030563354495, "test_acc": 0.01, "lyapunov": 1.5426954067576573, "grad_norm": 0.1222745390564005, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 86.83695554733276 }, { "epoch": 104, "train_loss": 5.3208301354980465, "train_acc": 0.00928, "test_loss": 4.6642813407897945, "test_acc": 0.01, "lyapunov": 1.5443277465717873, "grad_norm": 0.12082325206764133, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 86.83465480804443 }, { "epoch": 105, "train_loss": 5.325607220458984, "train_acc": 0.00868, "test_loss": 4.797847722625733, "test_acc": 0.01, "lyapunov": 1.547427470421852, "grad_norm": 0.1467365865583852, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 86.92287278175354 }, { "epoch": 106, "train_loss": 5.327985736999512, "train_acc": 0.00948, "test_loss": 4.780700933837891, "test_acc": 0.01, "lyapunov": 1.5493294055504567, "grad_norm": 0.13200210447777874, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 86.93008136749268 }, { "epoch": 107, "train_loss": 5.319034835205078, "train_acc": 0.00946, "test_loss": 4.834465756225586, "test_acc": 0.01, "lyapunov": 1.5422752080366129, "grad_norm": 0.12777999612030252, "grad_max_sv": 0.02157975882291794, "grad_min_sv": 0.0, "grad_condition": 21579758822.91794, "lr": 0.0001894261098608447, "time_sec": 86.82852697372437 }, { "epoch": 108, "train_loss": 5.321411961364746, "train_acc": 0.00916, "test_loss": 4.814922105407715, "test_acc": 0.01, "lyapunov": 1.544609341475055, "grad_norm": 0.13197562787736147, "grad_max_sv": 0.015251889312639832, "grad_min_sv": 0.0, "grad_condition": 15251889312.639832, "lr": 0.000181288005125655, "time_sec": 86.85191607475281 }, { "epoch": 109, "train_loss": 5.322899269256592, "train_acc": 0.00876, "test_loss": 4.713241914367676, "test_acc": 0.01, "lyapunov": 1.54528974267223, "grad_norm": 0.12828276594838653, "grad_max_sv": 0.0006727563217282295, "grad_min_sv": 0.0, "grad_condition": 672756321.7282295, "lr": 0.0001732896980049473, "time_sec": 86.82081818580627 }, { "epoch": 110, "train_loss": 5.318816036987305, "train_acc": 0.0094, "test_loss": 4.679484854125977, "test_acc": 0.01, "lyapunov": 1.5422053230388084, "grad_norm": 0.12847280658733387, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 86.9124755859375 }, { "epoch": 111, "train_loss": 5.318745676116944, "train_acc": 0.00848, "test_loss": 4.795034047698975, "test_acc": 0.01, "lyapunov": 1.5421484263656695, "grad_norm": 0.1278982868324375, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 86.83268451690674 }, { "epoch": 112, "train_loss": 5.318630710906983, "train_acc": 0.00898, "test_loss": 4.784210496520996, "test_acc": 0.01, "lyapunov": 1.5420354778504433, "grad_norm": 0.13247976598300262, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 86.79545545578003 }, { "epoch": 113, "train_loss": 5.318998959655762, "train_acc": 0.00884, "test_loss": 4.768862895202637, "test_acc": 0.01, "lyapunov": 1.542412842021269, "grad_norm": 0.13154644614275643, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 86.8436176776886 }, { "epoch": 114, "train_loss": 5.3237989538574215, "train_acc": 0.00958, "test_loss": 4.739323009490967, "test_acc": 0.01, "lyapunov": 1.5463786896537333, "grad_norm": 0.14268776917647705, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 86.84370040893555 }, { "epoch": 115, "train_loss": 5.321883607025146, "train_acc": 0.00924, "test_loss": 4.724630879211426, "test_acc": 0.01, "lyapunov": 1.544751648707768, "grad_norm": 0.13724738045143065, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 86.83514404296875 }, { "epoch": 116, "train_loss": 5.317745707855225, "train_acc": 0.00926, "test_loss": 4.771264694213867, "test_acc": 0.01, "lyapunov": 1.5411124830050846, "grad_norm": 0.13439912972628948, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 86.83839774131775 }, { "epoch": 117, "train_loss": 5.318638670196533, "train_acc": 0.00944, "test_loss": 4.926259418487549, "test_acc": 0.01, "lyapunov": 1.5420454350273933, "grad_norm": 0.1301899172356262, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 86.81545162200928 }, { "epoch": 118, "train_loss": 5.317975592346191, "train_acc": 0.0091, "test_loss": 4.7584453956604005, "test_acc": 0.01, "lyapunov": 1.5413338939856995, "grad_norm": 0.1306510838756953, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 86.84224820137024 }, { "epoch": 119, "train_loss": 5.317512142944336, "train_acc": 0.00918, "test_loss": 4.75227194366455, "test_acc": 0.01, "lyapunov": 1.5408342912069062, "grad_norm": 0.13531431192184493, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 86.84121561050415 }, { "epoch": 120, "train_loss": 5.32096346862793, "train_acc": 0.00916, "test_loss": 4.783403231811524, "test_acc": 0.01, "lyapunov": 1.5443097962747754, "grad_norm": 0.1366841922730417, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 86.8264012336731 }, { "epoch": 121, "train_loss": 5.31987023651123, "train_acc": 0.009, "test_loss": 4.769460425567627, "test_acc": 0.01, "lyapunov": 1.5431054827502317, "grad_norm": 0.13796061159903233, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 86.83200931549072 }, { "epoch": 122, "train_loss": 5.317669274597168, "train_acc": 0.009, "test_loss": 4.726600196838379, "test_acc": 0.01, "lyapunov": 1.5410202537351252, "grad_norm": 0.13807476351768067, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 86.85096383094788 }, { "epoch": 123, "train_loss": 5.31959240447998, "train_acc": 0.00982, "test_loss": 4.731892253112793, "test_acc": 0.01, "lyapunov": 1.5430450296158071, "grad_norm": 0.14330032241201268, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 86.8001983165741 }, { "epoch": 124, "train_loss": 5.317501362304688, "train_acc": 0.00938, "test_loss": 4.782514060974121, "test_acc": 0.01, "lyapunov": 1.540854393673675, "grad_norm": 0.14059038369574442, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 86.87392091751099 }, { "epoch": 125, "train_loss": 5.318027396545411, "train_acc": 0.0095, "test_loss": 4.765302996826172, "test_acc": 0.01, "lyapunov": 1.5414052317514444, "grad_norm": 0.1418679045184447, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 86.82495832443237 }, { "epoch": 126, "train_loss": 5.318346632080078, "train_acc": 0.0092, "test_loss": 4.7442352600097655, "test_acc": 0.01, "lyapunov": 1.5417146911401578, "grad_norm": 0.142826590523136, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 86.79729580879211 }, { "epoch": 127, "train_loss": 5.318922318725586, "train_acc": 0.00974, "test_loss": 4.76433516998291, "test_acc": 0.01, "lyapunov": 1.542423507136762, "grad_norm": 0.14495446560643363, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 86.93182754516602 }, { "epoch": 128, "train_loss": 5.318007217102051, "train_acc": 0.00962, "test_loss": 4.764061611938477, "test_acc": 0.01, "lyapunov": 1.541390145831096, "grad_norm": 0.14153652471754832, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 86.8191487789154 }, { "epoch": 129, "train_loss": 5.318092449340821, "train_acc": 0.00968, "test_loss": 4.765155668640137, "test_acc": 0.01, "lyapunov": 1.5414884422746156, "grad_norm": 0.14863798950920318, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 86.92294239997864 }, { "epoch": 130, "train_loss": 5.318419138793946, "train_acc": 0.00922, "test_loss": 4.764954615783691, "test_acc": 0.01, "lyapunov": 1.541847081745372, "grad_norm": 0.14422350481698742, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 86.83364939689636 }, { "epoch": 131, "train_loss": 5.319330998535157, "train_acc": 0.00984, "test_loss": 4.749797338867188, "test_acc": 0.01, "lyapunov": 1.5428275848593553, "grad_norm": 0.1575339118534098, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 86.83805966377258 }, { "epoch": 132, "train_loss": 5.3225936277771, "train_acc": 0.00944, "test_loss": 4.753033805847168, "test_acc": 0.01, "lyapunov": 1.5456237704552653, "grad_norm": 0.1459542484301229, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 86.83223581314087 }, { "epoch": 133, "train_loss": 5.319478280029297, "train_acc": 0.00904, "test_loss": 4.726372310638427, "test_acc": 0.01, "lyapunov": 1.5427262319628234, "grad_norm": 0.15430065761057823, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 86.81233429908752 }, { "epoch": 134, "train_loss": 5.320157431182861, "train_acc": 0.00978, "test_loss": 4.729707991790772, "test_acc": 0.01, "lyapunov": 1.5434529592314035, "grad_norm": 0.14953623206124225, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 86.81813621520996 }, { "epoch": 135, "train_loss": 5.344091755371093, "train_acc": 0.00992, "test_loss": 4.742976405334472, "test_acc": 0.01, "lyapunov": 1.5575274945524953, "grad_norm": 0.17021644451164028, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 86.84416842460632 }, { "epoch": 136, "train_loss": 5.3179564929199215, "train_acc": 0.01, "test_loss": 4.757002459716797, "test_acc": 0.01, "lyapunov": 1.541358881289392, "grad_norm": 0.1455320955701897, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 86.83202290534973 }, { "epoch": 137, "train_loss": 5.319369739990234, "train_acc": 0.00978, "test_loss": 4.748977610015869, "test_acc": 0.01, "lyapunov": 1.5428897822299577, "grad_norm": 0.15104084037444107, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 86.81699085235596 }, { "epoch": 138, "train_loss": 5.318675216522217, "train_acc": 0.01, "test_loss": 4.713645321655274, "test_acc": 0.01, "lyapunov": 1.5421365197662198, "grad_norm": 0.14694031631290994, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 86.8898720741272 }, { "epoch": 139, "train_loss": 5.318637705383301, "train_acc": 0.01, "test_loss": 4.743732140350342, "test_acc": 0.01, "lyapunov": 1.5420801776754276, "grad_norm": 0.15086340410308036, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 86.82428193092346 }, { "epoch": 140, "train_loss": 5.318365608825683, "train_acc": 0.01, "test_loss": 4.738941632843018, "test_acc": 0.01, "lyapunov": 1.5417572262951784, "grad_norm": 0.1451696630670528, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 86.8176257610321 }, { "epoch": 141, "train_loss": 5.319074583282471, "train_acc": 0.01, "test_loss": 4.743734898376465, "test_acc": 0.01, "lyapunov": 1.5425543062522282, "grad_norm": 0.14883420989990226, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 86.81977844238281 }, { "epoch": 142, "train_loss": 5.321842821502686, "train_acc": 0.01, "test_loss": 4.742512757873535, "test_acc": 0.01, "lyapunov": 1.5452124737107846, "grad_norm": 0.14940314161589946, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 86.9058632850647 }, { "epoch": 143, "train_loss": 5.323013974456787, "train_acc": 0.01, "test_loss": 4.7366528335571285, "test_acc": 0.01, "lyapunov": 1.5466468251879564, "grad_norm": 0.48352294330900464, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 86.8274781703949 }, { "epoch": 144, "train_loss": 5.322230252380371, "train_acc": 0.01, "test_loss": 4.734474227905274, "test_acc": 0.01, "lyapunov": 1.5454154453619058, "grad_norm": 0.15060559526776118, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 86.83571076393127 }, { "epoch": 145, "train_loss": 5.318391214904785, "train_acc": 0.01, "test_loss": 4.740697119140625, "test_acc": 0.01, "lyapunov": 1.5418205120984245, "grad_norm": 0.14599666991367263, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 86.83404302597046 }, { "epoch": 146, "train_loss": 5.3190992230224605, "train_acc": 0.01, "test_loss": 4.740016835021972, "test_acc": 0.01, "lyapunov": 1.542624485462218, "grad_norm": 0.15263702906229243, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 86.86582016944885 }, { "epoch": 147, "train_loss": 5.318638049316406, "train_acc": 0.01, "test_loss": 4.740016804504394, "test_acc": 0.01, "lyapunov": 1.542047378352231, "grad_norm": 0.1501107976108878, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 86.7875075340271 }, { "epoch": 148, "train_loss": 5.318966191101074, "train_acc": 0.01, "test_loss": 4.740017098999023, "test_acc": 0.01, "lyapunov": 1.5423082866327231, "grad_norm": 0.1506843352752174, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 86.85878276824951 }, { "epoch": 149, "train_loss": 5.318281329040527, "train_acc": 0.01, "test_loss": 4.740017213439941, "test_acc": 0.01, "lyapunov": 1.5417110215672447, "grad_norm": 0.14832275166563608, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 87.06339812278748 }, { "epoch": 150, "train_loss": 5.318742103729248, "train_acc": 0.01, "test_loss": 4.740017121887207, "test_acc": 0.01, "lyapunov": 1.5422426760958894, "grad_norm": 0.1485832497803494, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 86.82008957862854 } ], "12": [ { "epoch": 1, "train_loss": 5.142427458190918, "train_acc": 0.01732, "test_loss": 4.915040765380859, "test_acc": 0.0102, "lyapunov": 2.4272339856228253, "grad_norm": 5.192250161678427, "grad_max_sv": 4.473296946287155, "grad_min_sv": 8.955331335380733e-08, "grad_condition": 71327028.89068338, "lr": 0.0009998903417374227, "time_sec": 132.13672518730164 }, { "epoch": 2, "train_loss": 4.874939300842285, "train_acc": 0.01776, "test_loss": 4.858658763122558, "test_acc": 0.0123, "lyapunov": 1.9352691591243305, "grad_norm": 3.5048458101816564, "grad_max_sv": 2.842214399576187, "grad_min_sv": 5.994522662700064e-08, "grad_condition": 56014607.037285045, "lr": 0.0009995614150494292, "time_sec": 132.1895821094513 }, { "epoch": 3, "train_loss": 4.780418332366944, "train_acc": 0.01696, "test_loss": 5.036572162628174, "test_acc": 0.013, "lyapunov": 1.6941773053020468, "grad_norm": 2.3576536383434044, "grad_max_sv": 1.8239452183246612, "grad_min_sv": 3.909134313473395e-08, "grad_condition": 54665529.32274648, "lr": 0.0009990133642141358, "time_sec": 132.14293670654297 }, { "epoch": 4, "train_loss": 4.74106760559082, "train_acc": 0.0156, "test_loss": 4.614977532958984, "test_acc": 0.01, "lyapunov": 1.667667641359217, "grad_norm": 1.2834888351442275, "grad_max_sv": 0.7230008448474109, "grad_min_sv": 1.1444949870584092e-08, "grad_condition": 21641297318.53074, "lr": 0.0009982464296247522, "time_sec": 132.18336057662964 }, { "epoch": 5, "train_loss": 4.765737413482666, "train_acc": 0.01652, "test_loss": 5.099783699798584, "test_acc": 0.01, "lyapunov": 1.6692155538617497, "grad_norm": 0.6681729594071041, "grad_max_sv": 0.4321929462254047, "grad_min_sv": 8.256420696048775e-10, "grad_condition": 130856413066.44238, "lr": 0.0009972609476841367, "time_sec": 132.0963535308838 }, { "epoch": 6, "train_loss": 4.802682023925781, "train_acc": 0.01584, "test_loss": 4.645143016052246, "test_acc": 0.01, "lyapunov": 1.6541148235121041, "grad_norm": 0.5601084813828376, "grad_max_sv": 0.3682811915874481, "grad_min_sv": 4.4830527621445066e-12, "grad_condition": 122810946704.98007, "lr": 0.000996057350657239, "time_sec": 132.08646774291992 }, { "epoch": 7, "train_loss": 4.861019936065674, "train_acc": 0.0145, "test_loss": 5.0593204246521, "test_acc": 0.012, "lyapunov": 1.6806474119196158, "grad_norm": 0.4786920265962189, "grad_max_sv": 0.36215363070368767, "grad_min_sv": 5.403665967264682e-10, "grad_condition": 157595569273.04913, "lr": 0.000994636166481494, "time_sec": 132.12457752227783 }, { "epoch": 8, "train_loss": 4.906115528869629, "train_acc": 0.01422, "test_loss": 4.609849331665039, "test_acc": 0.01, "lyapunov": 1.6933349569130431, "grad_norm": 0.5105557123165358, "grad_max_sv": 0.2962237525731325, "grad_min_sv": 1.5893412122574907e-12, "grad_condition": 162936272535.53033, "lr": 0.0009929980185352525, "time_sec": 132.0816192626953 }, { "epoch": 9, "train_loss": 4.948906524505615, "train_acc": 0.01298, "test_loss": 4.606528971099854, "test_acc": 0.01, "lyapunov": 1.684294082624528, "grad_norm": 0.4680820303299784, "grad_max_sv": 0.2727967657148838, "grad_min_sv": 6.175172652279376e-13, "grad_condition": 191797793138.9354, "lr": 0.0009911436253643444, "time_sec": 132.09475946426392 }, { "epoch": 10, "train_loss": 5.001812951354981, "train_acc": 0.01048, "test_loss": 4.605593468475342, "test_acc": 0.01, "lyapunov": 1.6371012395605102, "grad_norm": 0.4454332910853826, "grad_max_sv": 0.06080346256494522, "grad_min_sv": 1.1174912073463375e-13, "grad_condition": 43714632849.557816, "lr": 0.0009890738003669028, "time_sec": 132.12074422836304 }, { "epoch": 11, "train_loss": 5.020210814056396, "train_acc": 0.0096, "test_loss": 6.067085327148438, "test_acc": 0.01, "lyapunov": 1.55058368331636, "grad_norm": 0.43082604131055474, "grad_max_sv": 0.221556506305933, "grad_min_sv": 2.881964604461995e-09, "grad_condition": 154673733.23759162, "lr": 0.00098678945143658, "time_sec": 132.08557748794556 }, { "epoch": 12, "train_loss": 5.050462992553711, "train_acc": 0.0094, "test_loss": 4.605482531738281, "test_acc": 0.01, "lyapunov": 1.5398570713789568, "grad_norm": 0.381893916008903, "grad_max_sv": 0.2668355040252209, "grad_min_sv": 3.789388436370445e-09, "grad_condition": 42311880.80663426, "lr": 0.0009842915805643154, "time_sec": 132.05907773971558 }, { "epoch": 13, "train_loss": 5.067867939758301, "train_acc": 0.00924, "test_loss": 4.605311224365234, "test_acc": 0.01, "lyapunov": 1.539125974830764, "grad_norm": 0.1537321432498029, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000981581283398829, "time_sec": 132.1301724910736 }, { "epoch": 14, "train_loss": 5.122542482299805, "train_acc": 0.01028, "test_loss": 6.089662152862549, "test_acc": 0.01, "lyapunov": 1.5396406424929723, "grad_norm": 0.3505932006709459, "grad_max_sv": 0.24503438249230386, "grad_min_sv": 3.2204854292020023e-09, "grad_condition": 175828681.99119335, "lr": 0.0009786597487660333, "time_sec": 132.11422061920166 }, { "epoch": 15, "train_loss": 5.167975009613037, "train_acc": 0.00938, "test_loss": 6.145216786956787, "test_acc": 0.01, "lyapunov": 1.5421736868446136, "grad_norm": 0.460038063194906, "grad_max_sv": 0.37677369341254235, "grad_min_sv": 5.061586208499058e-09, "grad_condition": 83937837.74305013, "lr": 0.0009755282581475766, "time_sec": 132.15303254127502 }, { "epoch": 16, "train_loss": 5.185187667541504, "train_acc": 0.00964, "test_loss": 4.605292627716064, "test_acc": 0.01, "lyapunov": 1.5415043111347482, "grad_norm": 0.2749549655041811, "grad_max_sv": 0.13375916928052903, "grad_min_sv": 1.7694276155388877e-09, "grad_condition": 28413171.440939356, "lr": 0.0009721881851187403, "time_sec": 132.0988028049469 }, { "epoch": 17, "train_loss": 5.213513888549805, "train_acc": 0.00944, "test_loss": 4.605225193786621, "test_acc": 0.01, "lyapunov": 1.5439205886153005, "grad_norm": 0.15107835674594625, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009686409947459456, "time_sec": 132.06156492233276 }, { "epoch": 18, "train_loss": 5.259810456237793, "train_acc": 0.00946, "test_loss": 6.243620587158203, "test_acc": 0.01, "lyapunov": 1.5492180427321998, "grad_norm": 0.17993668118393238, "grad_max_sv": 0.02630040645599365, "grad_min_sv": 2.2052708131825583e-10, "grad_condition": 25149159.75180607, "lr": 0.0009648882429441254, "time_sec": 132.04172444343567 }, { "epoch": 19, "train_loss": 5.30400526260376, "train_acc": 0.01008, "test_loss": 6.052386779022217, "test_acc": 0.01, "lyapunov": 1.544384488974081, "grad_norm": 0.348063373631547, "grad_max_sv": 0.2475440863519907, "grad_min_sv": 2.704030184225853e-09, "grad_condition": 448939719.83669394, "lr": 0.00096093157579425, "time_sec": 132.16821956634521 }, { "epoch": 20, "train_loss": 5.344405227050781, "train_acc": 0.0094, "test_loss": 6.0689891357421875, "test_acc": 0.01, "lyapunov": 1.549183475087061, "grad_norm": 0.3941364600912924, "grad_max_sv": 0.28380888141691685, "grad_min_sv": 2.9937321677220295e-09, "grad_condition": 919686281.1330671, "lr": 0.0009567727288213001, "time_sec": 132.13486909866333 }, { "epoch": 21, "train_loss": 5.342385781860352, "train_acc": 0.00934, "test_loss": 5.634283610534668, "test_acc": 0.01, "lyapunov": 1.5489524468741454, "grad_norm": 0.35198337312808664, "grad_max_sv": 0.2675567839294672, "grad_min_sv": 2.7506563800988593e-09, "grad_condition": 137616088.9764635, "lr": 0.0009524135262330095, "time_sec": 132.15001010894775 }, { "epoch": 22, "train_loss": 5.340258148040771, "train_acc": 0.01038, "test_loss": 6.047631702423096, "test_acc": 0.01, "lyapunov": 1.5503142017232792, "grad_norm": 0.32912217146899386, "grad_max_sv": 0.23988064490258693, "grad_min_sv": 2.0088645359163383e-09, "grad_condition": 325233106.42990357, "lr": 0.0009478558801197061, "time_sec": 132.1328146457672 }, { "epoch": 23, "train_loss": 5.33926953994751, "train_acc": 0.00924, "test_loss": 6.389647571563721, "test_acc": 0.01, "lyapunov": 1.5511968355349568, "grad_norm": 0.3034442087369207, "grad_max_sv": 0.21002153679728508, "grad_min_sv": 7.416720458496191e-10, "grad_condition": 49849833895.91653, "lr": 0.000943101789615607, "time_sec": 132.11377239227295 }, { "epoch": 24, "train_loss": 5.342641763763428, "train_acc": 0.01046, "test_loss": 6.151307273101807, "test_acc": 0.01, "lyapunov": 1.5519740599805436, "grad_norm": 0.32351011233615656, "grad_max_sv": 0.24164889194071293, "grad_min_sv": 1.9842920796070418e-09, "grad_condition": 216397157.20139033, "lr": 0.0009381533400219313, "time_sec": 132.07816553115845 }, { "epoch": 25, "train_loss": 5.336951184997559, "train_acc": 0.00994, "test_loss": 5.9992121322631835, "test_acc": 0.01, "lyapunov": 1.5503220811219471, "grad_norm": 0.2784195734173852, "grad_max_sv": 0.19388381093740464, "grad_min_sv": 2.1356596568026515e-10, "grad_condition": 108561949775.06238, "lr": 0.0009330127018922189, "time_sec": 132.10879969596863 }, { "epoch": 26, "train_loss": 5.336466632537841, "train_acc": 0.01006, "test_loss": 5.7221336074829106, "test_acc": 0.01, "lyapunov": 1.5520486011529517, "grad_norm": 0.24825146645127755, "grad_max_sv": 0.17286810129880906, "grad_min_sv": 1.0904332706662028e-12, "grad_condition": 103853917717.00699, "lr": 0.000927682130080253, "time_sec": 132.1171510219574 }, { "epoch": 27, "train_loss": 5.336693968505859, "train_acc": 0.00944, "test_loss": 5.829081159210205, "test_acc": 0.01, "lyapunov": 1.5536211549168657, "grad_norm": 0.23362614927382305, "grad_max_sv": 0.15823216680437327, "grad_min_sv": 7.62931019239883e-13, "grad_condition": 111090272986.05489, "lr": 0.0009221639627510072, "time_sec": 132.13189697265625 }, { "epoch": 28, "train_loss": 5.336333346252442, "train_acc": 0.01034, "test_loss": 6.183766918945312, "test_acc": 0.01, "lyapunov": 1.5548379052325587, "grad_norm": 0.2252526539391841, "grad_max_sv": 0.1425440175458789, "grad_min_sv": 5.001494019507075e-14, "grad_condition": 136232139639.80547, "lr": 0.0009164606203550494, "time_sec": 132.0898892879486 }, { "epoch": 29, "train_loss": 5.3385375555419925, "train_acc": 0.01006, "test_loss": 18.741441845703125, "test_acc": 0.01, "lyapunov": 1.559137857478598, "grad_norm": 0.24309729358940327, "grad_max_sv": 0.1129613446071744, "grad_min_sv": 7.652494146034002e-15, "grad_condition": 112054629681.63525, "lr": 0.0009105746045668516, "time_sec": 132.19855189323425 }, { "epoch": 30, "train_loss": 5.337543925323486, "train_acc": 0.00958, "test_loss": 17.780749963378906, "test_acc": 0.01, "lyapunov": 1.5578542255684542, "grad_norm": 0.22390701226492316, "grad_max_sv": 0.10281856972724199, "grad_min_sv": 3.3459312089163837e-15, "grad_condition": 102453292464.96785, "lr": 0.0009045084971874733, "time_sec": 132.09549117088318 }, { "epoch": 31, "train_loss": 5.33479830078125, "train_acc": 0.00896, "test_loss": 18.024621951293945, "test_acc": 0.01, "lyapunov": 1.5561083588758697, "grad_norm": 0.2617176836095928, "grad_max_sv": 0.0911625299602747, "grad_min_sv": 1.0217219065908696e-15, "grad_condition": 91065349161.70517, "lr": 0.0008982649590120977, "time_sec": 132.07474184036255 }, { "epoch": 32, "train_loss": 5.336539338684082, "train_acc": 0.0096, "test_loss": 18.656125256347657, "test_acc": 0.01, "lyapunov": 1.558475110536951, "grad_norm": 0.2736415217941262, "grad_max_sv": 0.08601008746773005, "grad_min_sv": 8.793854624629887e-16, "grad_condition": 85922955415.14108, "lr": 0.0008918467286629196, "time_sec": 132.10801935195923 }, { "epoch": 33, "train_loss": 5.346367032775879, "train_acc": 0.00982, "test_loss": 16.179306204223632, "test_acc": 0.01, "lyapunov": 1.5642947364036384, "grad_norm": 0.26593824832856844, "grad_max_sv": 0.11054420564323664, "grad_min_sv": 1.4557409070313929e-10, "grad_condition": 86957832407.85573, "lr": 0.0008852566213878943, "time_sec": 132.09707188606262 }, { "epoch": 34, "train_loss": 5.366751658630371, "train_acc": 0.0095, "test_loss": 14.5320333984375, "test_acc": 0.01, "lyapunov": 1.5604360716422196, "grad_norm": 0.39203529519334207, "grad_max_sv": 0.3150600105524063, "grad_min_sv": 3.335271438415291e-09, "grad_condition": 437335317.70210946, "lr": 0.000878497527825878, "time_sec": 132.12472343444824 }, { "epoch": 35, "train_loss": 5.3540499374389645, "train_acc": 0.00914, "test_loss": 14.636802185058594, "test_acc": 0.01, "lyapunov": 1.5606954972762281, "grad_norm": 0.3377550426065231, "grad_max_sv": 0.2708315536379814, "grad_min_sv": 2.616331799126792e-09, "grad_condition": 145659046.06806198, "lr": 0.000871572412738697, "time_sec": 132.10315084457397 }, { "epoch": 36, "train_loss": 5.350296534576416, "train_acc": 0.00996, "test_loss": 15.48446300354004, "test_acc": 0.01, "lyapunov": 1.5607713335920173, "grad_norm": 0.29951473550525415, "grad_max_sv": 0.24341562166810035, "grad_min_sv": 1.5972995535181583e-09, "grad_condition": 1815700162.0467975, "lr": 0.0008644843137107055, "time_sec": 132.10273575782776 }, { "epoch": 37, "train_loss": 5.3520866116333, "train_acc": 0.00968, "test_loss": 14.972803247070312, "test_acc": 0.01, "lyapunov": 1.5632766884611087, "grad_norm": 0.33571017690288324, "grad_max_sv": 0.2274009022861719, "grad_min_sv": 6.642170352888692e-10, "grad_condition": 43022286203.22009, "lr": 0.0008572363398164014, "time_sec": 132.0913314819336 }, { "epoch": 38, "train_loss": 5.347811700897217, "train_acc": 0.00978, "test_loss": 15.4173666015625, "test_acc": 0.01, "lyapunov": 1.5653380673864614, "grad_norm": 0.23644614014625348, "grad_max_sv": 0.15670949593186378, "grad_min_sv": 3.485120328424339e-13, "grad_condition": 126042108666.44785, "lr": 0.0008498316702566826, "time_sec": 132.12694144248962 }, { "epoch": 39, "train_loss": 5.350918925933838, "train_acc": 0.01, "test_loss": 7.349865231323242, "test_acc": 0.01, "lyapunov": 1.5639865206330634, "grad_norm": 0.25831036099968246, "grad_max_sv": 0.18908596560359, "grad_min_sv": 3.4109730636612205e-10, "grad_condition": 109021837331.04056, "lr": 0.0008422735529643442, "time_sec": 132.15545773506165 }, { "epoch": 40, "train_loss": 5.350084358825684, "train_acc": 0.00968, "test_loss": 6.699221839904785, "test_acc": 0.01, "lyapunov": 1.5618754555197323, "grad_norm": 0.33240423060946156, "grad_max_sv": 0.16681117806583642, "grad_min_sv": 8.354353915913262e-10, "grad_condition": 29639133022.15968, "lr": 0.0008345653031794289, "time_sec": 132.0622968673706 }, { "epoch": 41, "train_loss": 5.348379842224121, "train_acc": 0.01014, "test_loss": 12.351808143615722, "test_acc": 0.01, "lyapunov": 1.5626876762760875, "grad_norm": 0.31832555128145307, "grad_max_sv": 0.20640474413521587, "grad_min_sv": 8.66528908347317e-13, "grad_condition": 129815385507.61075, "lr": 0.0008267103019950526, "time_sec": 132.2454056739807 }, { "epoch": 42, "train_loss": 5.34665752532959, "train_acc": 0.00974, "test_loss": 14.07037748260498, "test_acc": 0.01, "lyapunov": 1.5655529825278864, "grad_norm": 0.2561124376145529, "grad_max_sv": 0.10575219443999231, "grad_min_sv": 1.9916840597483354e-10, "grad_condition": 82384130296.00456, "lr": 0.0008187119948743447, "time_sec": 132.08385848999023 }, { "epoch": 43, "train_loss": 5.343207415618896, "train_acc": 0.0099, "test_loss": 13.306277600097657, "test_acc": 0.01, "lyapunov": 1.5653508831472958, "grad_norm": 0.19924932372474, "grad_max_sv": 0.096745721437037, "grad_min_sv": 1.0061398517570142e-15, "grad_condition": 96651724250.54889, "lr": 0.000810573890139155, "time_sec": 132.13167572021484 }, { "epoch": 44, "train_loss": 5.345402418518066, "train_acc": 0.00992, "test_loss": 7.869494395446777, "test_acc": 0.01, "lyapunov": 1.5646309980650996, "grad_norm": 0.21769658517748566, "grad_max_sv": 0.13879811409860848, "grad_min_sv": 1.6053037275992228e-14, "grad_condition": 135561498479.67575, "lr": 0.0008022995574311873, "time_sec": 132.21540069580078 }, { "epoch": 45, "train_loss": 5.346674517059326, "train_acc": 0.00986, "test_loss": 11.400154348754883, "test_acc": 0.01, "lyapunov": 1.5669585390164114, "grad_norm": 0.21055278107954878, "grad_max_sv": 0.12050471100956202, "grad_min_sv": 1.448653245665297e-14, "grad_condition": 117784195175.33076, "lr": 0.0007938926261462363, "time_sec": 132.13598537445068 }, { "epoch": 46, "train_loss": 5.350086312103271, "train_acc": 0.00912, "test_loss": 11.996928524780273, "test_acc": 0.01, "lyapunov": 1.5701792279777624, "grad_norm": 0.21008620048452556, "grad_max_sv": 0.08796360064297915, "grad_min_sv": 3.893309181110675e-16, "grad_condition": 87925759209.02908, "lr": 0.0007853567838422158, "time_sec": 132.10033679008484 }, { "epoch": 47, "train_loss": 5.342350235290527, "train_acc": 0.0087, "test_loss": 10.970650772094727, "test_acc": 0.01, "lyapunov": 1.564373235263483, "grad_norm": 0.1731163774631187, "grad_max_sv": 0.08237459398806095, "grad_min_sv": 2.1940905206855015e-16, "grad_condition": 82355183433.8488, "lr": 0.0007766957746216719, "time_sec": 132.1089198589325 }, { "epoch": 48, "train_loss": 5.34227012512207, "train_acc": 0.00988, "test_loss": 11.343988357543946, "test_acc": 0.01, "lyapunov": 1.5652936489685723, "grad_norm": 0.16074333900064897, "grad_max_sv": 0.07524463571608067, "grad_min_sv": 4.129742513509048e-34, "grad_condition": 75244635716.08066, "lr": 0.0007679133974894982, "time_sec": 132.16328692436218 }, { "epoch": 49, "train_loss": 5.344108670349121, "train_acc": 0.00988, "test_loss": 11.356095449829102, "test_acc": 0.01, "lyapunov": 1.5667558609677092, "grad_norm": 0.15860129770355044, "grad_max_sv": 0.07414976768195629, "grad_min_sv": 2.920054218147879e-21, "grad_condition": 74149767435.12958, "lr": 0.000759013504686565, "time_sec": 132.1159553527832 }, { "epoch": 50, "train_loss": 5.3415603378295895, "train_acc": 0.00976, "test_loss": 11.700657446289062, "test_acc": 0.01, "lyapunov": 1.5651936311551067, "grad_norm": 0.14626453498485173, "grad_max_sv": 0.05773629667237401, "grad_min_sv": 7.389830128226318e-40, "grad_condition": 57736296672.37401, "lr": 0.0007499999999999998, "time_sec": 132.10842418670654 }, { "epoch": 51, "train_loss": 5.345499488220215, "train_acc": 0.0091, "test_loss": 7.841943490600586, "test_acc": 0.01, "lyapunov": 1.5647823362399245, "grad_norm": 0.19931882783012003, "grad_max_sv": 0.13148421347141265, "grad_min_sv": 1.1399481724407015e-14, "grad_condition": 129966725437.33623, "lr": 0.0007408768370508575, "time_sec": 132.13836026191711 }, { "epoch": 52, "train_loss": 5.346541320800781, "train_acc": 0.01036, "test_loss": 8.251887129211426, "test_acc": 0.01, "lyapunov": 1.565840955280587, "grad_norm": 0.21227656722607438, "grad_max_sv": 0.14938069488853217, "grad_min_sv": 2.1186636603898966e-14, "grad_condition": 146306194841.0702, "lr": 0.0007316480175599307, "time_sec": 132.21652913093567 }, { "epoch": 53, "train_loss": 5.346332246856689, "train_acc": 0.00998, "test_loss": 8.80145364074707, "test_acc": 0.01, "lyapunov": 1.5666624332023094, "grad_norm": 0.2018507800384921, "grad_max_sv": 0.12567667234688998, "grad_min_sv": 4.6990583254762225e-15, "grad_condition": 125036911617.91772, "lr": 0.0007223175895924635, "time_sec": 132.1492202281952 }, { "epoch": 54, "train_loss": 5.344240028381348, "train_acc": 0.0096, "test_loss": 8.331844716644287, "test_acc": 0.01, "lyapunov": 1.5653653464963675, "grad_norm": 0.1977193203709713, "grad_max_sv": 0.12096917647868395, "grad_min_sv": 2.717621440740357e-15, "grad_condition": 120646434306.70581, "lr": 0.0007128896457825361, "time_sec": 132.13583779335022 }, { "epoch": 55, "train_loss": 5.34588626373291, "train_acc": 0.00938, "test_loss": 8.483297344970703, "test_acc": 0.01, "lyapunov": 1.5671809872093103, "grad_norm": 0.17917342896025326, "grad_max_sv": 0.10660264752805233, "grad_min_sv": 2.903017749905976e-15, "grad_condition": 106288369212.58371, "lr": 0.0007033683215378998, "time_sec": 132.12570214271545 }, { "epoch": 56, "train_loss": 5.347936657714844, "train_acc": 0.00928, "test_loss": 12.471004583740234, "test_acc": 0.01, "lyapunov": 1.5704145821768913, "grad_norm": 0.1585992442529963, "grad_max_sv": 0.05894996239803731, "grad_min_sv": 4.065829085829974e-17, "grad_condition": 58945476044.698166, "lr": 0.0006937577932260512, "time_sec": 132.08077478408813 }, { "epoch": 57, "train_loss": 5.350657684173584, "train_acc": 0.00942, "test_loss": 11.975766296386718, "test_acc": 0.01, "lyapunov": 1.572284730803936, "grad_norm": 0.16329462100720574, "grad_max_sv": 0.018565936107188465, "grad_min_sv": 0.0, "grad_condition": 18565936107.188465, "lr": 0.0006840622763423388, "time_sec": 132.12146091461182 }, { "epoch": 58, "train_loss": 5.342193555297851, "train_acc": 0.00952, "test_loss": 12.00783012084961, "test_acc": 0.01, "lyapunov": 1.5669191542183956, "grad_norm": 0.13144150243285688, "grad_max_sv": 0.014100767159834503, "grad_min_sv": 0.0, "grad_condition": 14100767159.834503, "lr": 0.0006742860236609073, "time_sec": 132.0214581489563 }, { "epoch": 59, "train_loss": 5.349671448669434, "train_acc": 0.0097, "test_loss": 12.08228343963623, "test_acc": 0.01, "lyapunov": 1.5733529234786168, "grad_norm": 0.15236031303960995, "grad_max_sv": 0.002432991983368993, "grad_min_sv": 0.0, "grad_condition": 2432991983.368993, "lr": 0.0006644333233692913, "time_sec": 131.98429799079895 }, { "epoch": 60, "train_loss": 5.343136109619141, "train_acc": 0.00986, "test_loss": 10.815134619140625, "test_acc": 0.01, "lyapunov": 1.567219941207515, "grad_norm": 0.13665097355727693, "grad_max_sv": 0.03331217863596976, "grad_min_sv": 4.039363544528912e-19, "grad_condition": 33312131775.42389, "lr": 0.0006545084971874734, "time_sec": 132.03068280220032 }, { "epoch": 61, "train_loss": 5.344384336853027, "train_acc": 0.01022, "test_loss": 11.902839001464844, "test_acc": 0.01, "lyapunov": 1.5653783214061767, "grad_norm": 0.18581223375617745, "grad_max_sv": 0.11722703091800213, "grad_min_sv": 1.8473140836599877e-15, "grad_condition": 117024266905.12569, "lr": 0.0006445158984722354, "time_sec": 132.11943864822388 }, { "epoch": 62, "train_loss": 5.346207113494873, "train_acc": 0.00964, "test_loss": 10.298070428466797, "test_acc": 0.01, "lyapunov": 1.5678635116123483, "grad_norm": 0.17212702314261866, "grad_max_sv": 0.11003287564963102, "grad_min_sv": 1.1830899390639064e-16, "grad_condition": 110021246721.88094, "lr": 0.0006344599103076324, "time_sec": 132.09185695648193 }, { "epoch": 63, "train_loss": 5.345449805297852, "train_acc": 0.00958, "test_loss": 9.716324475097656, "test_acc": 0.01, "lyapunov": 1.5676089863643012, "grad_norm": 0.15858824070117938, "grad_max_sv": 0.09742239024490118, "grad_min_sv": 2.2791221237746455e-16, "grad_condition": 97400387801.48373, "lr": 0.0006243449435824269, "time_sec": 132.09884762763977 }, { "epoch": 64, "train_loss": 5.347441923828125, "train_acc": 0.01, "test_loss": 9.248421519470215, "test_acc": 0.01, "lyapunov": 1.5703948257524338, "grad_norm": 0.14831464239510592, "grad_max_sv": 0.07895854022353888, "grad_min_sv": 1.0966957298749494e-34, "grad_condition": 78958540223.53888, "lr": 0.0006141754350553275, "time_sec": 132.1075723171234 }, { "epoch": 65, "train_loss": 5.3479963973999025, "train_acc": 0.00918, "test_loss": 11.96562194519043, "test_acc": 0.01, "lyapunov": 1.5711398328966497, "grad_norm": 0.13907361248234446, "grad_max_sv": 0.06278349282220005, "grad_min_sv": 0.0, "grad_condition": 62783492822.20006, "lr": 0.0006039558454088793, "time_sec": 132.1277093887329 }, { "epoch": 66, "train_loss": 5.343847501678467, "train_acc": 0.00942, "test_loss": 10.723486402893066, "test_acc": 0.01, "lyapunov": 1.5666573139102868, "grad_norm": 0.1348401569471477, "grad_max_sv": 0.07675737962126732, "grad_min_sv": 0.0, "grad_condition": 76757379621.2673, "lr": 0.000593690657292862, "time_sec": 132.15379786491394 }, { "epoch": 67, "train_loss": 5.348686145477295, "train_acc": 0.00928, "test_loss": 9.169928652954102, "test_acc": 0.01, "lyapunov": 1.5714481184854532, "grad_norm": 0.16082287392865435, "grad_max_sv": 0.09281166503205895, "grad_min_sv": 4.119931040700715e-29, "grad_condition": 92811665032.05894, "lr": 0.0005833843733580507, "time_sec": 132.15499711036682 }, { "epoch": 68, "train_loss": 5.346614480133057, "train_acc": 0.01036, "test_loss": 9.111311894226073, "test_acc": 0.01, "lyapunov": 1.5694071944717252, "grad_norm": 0.15530027367743043, "grad_max_sv": 0.09021252328529954, "grad_min_sv": 9.645277459794148e-41, "grad_condition": 90212523285.29953, "lr": 0.0005730415142812054, "time_sec": 132.0900914669037 }, { "epoch": 69, "train_loss": 5.345042231140137, "train_acc": 0.0094, "test_loss": 8.921395944213867, "test_acc": 0.01, "lyapunov": 1.5690713626954256, "grad_norm": 0.12882941842915957, "grad_max_sv": 0.05447775078937411, "grad_min_sv": 0.0, "grad_condition": 54477750789.374115, "lr": 0.0005626666167821517, "time_sec": 132.08048009872437 }, { "epoch": 70, "train_loss": 5.35093121887207, "train_acc": 0.00998, "test_loss": 9.45476280517578, "test_acc": 0.01, "lyapunov": 1.5726936317770683, "grad_norm": 0.15278112356314727, "grad_max_sv": 0.05165710533037782, "grad_min_sv": 0.0, "grad_condition": 51657105330.377815, "lr": 0.0005522642316338265, "time_sec": 132.26694178581238 }, { "epoch": 71, "train_loss": 5.349324496612549, "train_acc": 0.0099, "test_loss": 8.863416375732422, "test_acc": 0.01, "lyapunov": 1.572835110642416, "grad_norm": 0.13044312395716468, "grad_max_sv": 0.040168187906965615, "grad_min_sv": 0.0, "grad_condition": 40168187906.965614, "lr": 0.0005418389216661573, "time_sec": 132.09336495399475 }, { "epoch": 72, "train_loss": 5.344522937774658, "train_acc": 0.0098, "test_loss": 8.490674835205079, "test_acc": 0.01, "lyapunov": 1.5687179925191739, "grad_norm": 0.12245301057298638, "grad_max_sv": 0.05633250158280134, "grad_min_sv": 0.0, "grad_condition": 56332501582.801346, "lr": 0.0005313952597646563, "time_sec": 132.10885214805603 }, { "epoch": 73, "train_loss": 5.344547733154297, "train_acc": 0.0097, "test_loss": 8.686578596496583, "test_acc": 0.01, "lyapunov": 1.5687794383529508, "grad_norm": 0.11446001541385904, "grad_max_sv": 0.049419266358017924, "grad_min_sv": 0.0, "grad_condition": 49419266358.01792, "lr": 0.0005209378268645994, "time_sec": 132.04956126213074 }, { "epoch": 74, "train_loss": 5.3437795330810545, "train_acc": 0.0094, "test_loss": 8.874914520263673, "test_acc": 0.01, "lyapunov": 1.5682151988339241, "grad_norm": 0.1237497118091755, "grad_max_sv": 0.03953348807990551, "grad_min_sv": 0.0, "grad_condition": 39533488079.9055, "lr": 0.0005104712099416781, "time_sec": 132.10020518302917 }, { "epoch": 75, "train_loss": 5.343674107208252, "train_acc": 0.0092, "test_loss": 8.772430587768556, "test_acc": 0.01, "lyapunov": 1.5683565054403241, "grad_norm": 0.11349041239477198, "grad_max_sv": 0.026115051889792084, "grad_min_sv": 0.0, "grad_condition": 26115051889.792084, "lr": 0.0004999999999999996, "time_sec": 132.01686429977417 }, { "epoch": 76, "train_loss": 5.342641368255615, "train_acc": 0.00932, "test_loss": 8.705339865112304, "test_acc": 0.01, "lyapunov": 1.5662559923308585, "grad_norm": 0.12277695191025612, "grad_max_sv": 0.0629763058386743, "grad_min_sv": 0.0, "grad_condition": 62976305838.67432, "lr": 0.0004895287900583212, "time_sec": 132.05883979797363 }, { "epoch": 77, "train_loss": 5.341884041595459, "train_acc": 0.00968, "test_loss": 9.93609327545166, "test_acc": 0.01, "lyapunov": 1.566317234502729, "grad_norm": 0.11484157346336721, "grad_max_sv": 0.047401683824136856, "grad_min_sv": 0.0, "grad_condition": 47401683824.136856, "lr": 0.0004790621731353997, "time_sec": 132.05576992034912 }, { "epoch": 78, "train_loss": 5.343069399871826, "train_acc": 0.0102, "test_loss": 8.943976522827148, "test_acc": 0.01, "lyapunov": 1.5676431427221469, "grad_norm": 0.10629466820483455, "grad_max_sv": 0.034334157966077326, "grad_min_sv": 0.0, "grad_condition": 34334157966.077324, "lr": 0.000468604740235343, "time_sec": 132.03219604492188 }, { "epoch": 79, "train_loss": 5.342923241119385, "train_acc": 0.00894, "test_loss": 10.30071854095459, "test_acc": 0.01, "lyapunov": 1.5677035571364186, "grad_norm": 0.11729853273385192, "grad_max_sv": 0.018184055807068944, "grad_min_sv": 0.0, "grad_condition": 18184055807.068947, "lr": 0.00045816107833384175, "time_sec": 132.0335590839386 }, { "epoch": 80, "train_loss": 5.342889130249024, "train_acc": 0.00868, "test_loss": 9.292682635498046, "test_acc": 0.01, "lyapunov": 1.5676629153054085, "grad_norm": 0.10602422228730526, "grad_max_sv": 0.022180042415857314, "grad_min_sv": 0.0, "grad_condition": 22180042415.857315, "lr": 0.0004477357683661729, "time_sec": 132.04535913467407 }, { "epoch": 81, "train_loss": 5.3435448347473145, "train_acc": 0.01026, "test_loss": 10.646222018432617, "test_acc": 0.01, "lyapunov": 1.5682694253409306, "grad_norm": 0.10584507536046345, "grad_max_sv": 0.036097540194168685, "grad_min_sv": 0.0, "grad_condition": 36097540194.168686, "lr": 0.00043733338321784746, "time_sec": 132.0792417526245 }, { "epoch": 82, "train_loss": 5.346409954376221, "train_acc": 0.00938, "test_loss": 8.388480964660644, "test_acc": 0.01, "lyapunov": 1.5704751517766578, "grad_norm": 0.1594968968610417, "grad_max_sv": 0.05689305039122701, "grad_min_sv": 0.0, "grad_condition": 56893050391.227005, "lr": 0.0004269584857187939, "time_sec": 132.10688591003418 }, { "epoch": 83, "train_loss": 5.351143104705811, "train_acc": 0.00934, "test_loss": 10.536403848266602, "test_acc": 0.01, "lyapunov": 1.57418333660916, "grad_norm": 0.14631187426937112, "grad_max_sv": 0.043841119017452, "grad_min_sv": 0.0, "grad_condition": 43841119017.451996, "lr": 0.0004166156266419484, "time_sec": 132.08924984931946 }, { "epoch": 84, "train_loss": 5.345183093261719, "train_acc": 0.00942, "test_loss": 11.133738461303711, "test_acc": 0.01, "lyapunov": 1.5697272662311563, "grad_norm": 0.11663908627078753, "grad_max_sv": 0.04061344410292804, "grad_min_sv": 0.0, "grad_condition": 40613444102.92804, "lr": 0.0004063093427071373, "time_sec": 132.13465809822083 }, { "epoch": 85, "train_loss": 5.346176763000488, "train_acc": 0.01038, "test_loss": 11.12772626953125, "test_acc": 0.01, "lyapunov": 1.5703431422753102, "grad_norm": 0.1377494846746287, "grad_max_sv": 0.026653958344832064, "grad_min_sv": 0.0, "grad_condition": 26653958344.83206, "lr": 0.0003960441545911199, "time_sec": 132.03662395477295 }, { "epoch": 86, "train_loss": 5.343412326202393, "train_acc": 0.00966, "test_loss": 10.485674588012696, "test_acc": 0.01, "lyapunov": 1.568256547383945, "grad_norm": 0.11507124566756707, "grad_max_sv": 0.015460054902359844, "grad_min_sv": 0.0, "grad_condition": 15460054902.359842, "lr": 0.0003858245649446718, "time_sec": 132.30029678344727 }, { "epoch": 87, "train_loss": 5.343340453948975, "train_acc": 0.0093, "test_loss": 10.443886459350585, "test_acc": 0.01, "lyapunov": 1.5683554758501175, "grad_norm": 0.11491345749975401, "grad_max_sv": 0.01923052747733891, "grad_min_sv": 0.0, "grad_condition": 19230527477.33891, "lr": 0.00037565505641757235, "time_sec": 132.09554266929626 }, { "epoch": 88, "train_loss": 5.343219871826172, "train_acc": 0.00982, "test_loss": 9.331489477539062, "test_acc": 0.01, "lyapunov": 1.5680722632371555, "grad_norm": 0.10357957499765331, "grad_max_sv": 0.03583596190437675, "grad_min_sv": 0.0, "grad_condition": 35835961904.37675, "lr": 0.00036554008969236695, "time_sec": 132.38618564605713 }, { "epoch": 89, "train_loss": 5.345059629974365, "train_acc": 0.00942, "test_loss": 9.705012353515626, "test_acc": 0.01, "lyapunov": 1.5701254081848028, "grad_norm": 0.13335748884903612, "grad_max_sv": 0.01991720902733505, "grad_min_sv": 0.0, "grad_condition": 19917209027.335045, "lr": 0.0003554841015277638, "time_sec": 132.10200333595276 }, { "epoch": 90, "train_loss": 5.346582987670899, "train_acc": 0.00936, "test_loss": 9.92761245727539, "test_acc": 0.01, "lyapunov": 1.570894326395391, "grad_norm": 0.12917945353905133, "grad_max_sv": 0.005056336428970099, "grad_min_sv": 0.0, "grad_condition": 5056336428.9700985, "lr": 0.000345491502812526, "time_sec": 132.01398086547852 }, { "epoch": 91, "train_loss": 5.343077623138428, "train_acc": 0.00948, "test_loss": 9.892114511108398, "test_acc": 0.01, "lyapunov": 1.5679589848384223, "grad_norm": 0.10089565070900397, "grad_max_sv": 0.024783097906038165, "grad_min_sv": 0.0, "grad_condition": 24783097906.038166, "lr": 0.0003355666766307081, "time_sec": 132.0552315711975 }, { "epoch": 92, "train_loss": 5.344612928619385, "train_acc": 0.00984, "test_loss": 9.036325561523437, "test_acc": 0.01, "lyapunov": 1.5697500227052537, "grad_norm": 0.13133583896592352, "grad_max_sv": 0.017823219764977694, "grad_min_sv": 0.0, "grad_condition": 17823219764.977695, "lr": 0.00032571397633909225, "time_sec": 132.07679438591003 }, { "epoch": 93, "train_loss": 5.346883224182129, "train_acc": 0.0096, "test_loss": 8.63075946044922, "test_acc": 0.01, "lyapunov": 1.5719260608448702, "grad_norm": 0.09641577817960369, "grad_max_sv": 0.003358140075579286, "grad_min_sv": 0.0, "grad_condition": 3358140075.5792856, "lr": 0.00031593772365766094, "time_sec": 132.0291886329651 }, { "epoch": 94, "train_loss": 5.343683553771973, "train_acc": 0.00968, "test_loss": 8.73685708618164, "test_acc": 0.01, "lyapunov": 1.5686328389760478, "grad_norm": 0.09724660681276874, "grad_max_sv": 0.018295074068009853, "grad_min_sv": 0.0, "grad_condition": 18295074068.00985, "lr": 0.0003062422067739483, "time_sec": 132.12304759025574 }, { "epoch": 95, "train_loss": 5.343045575866699, "train_acc": 0.0086, "test_loss": 8.563214770507813, "test_acc": 0.01, "lyapunov": 1.5680832335406252, "grad_norm": 0.09663765425859253, "grad_max_sv": 0.0011947159189730882, "grad_min_sv": 0.0, "grad_condition": 1194715918.9730883, "lr": 0.00029663167846209965, "time_sec": 132.08247256278992 }, { "epoch": 96, "train_loss": 5.342066871490479, "train_acc": 0.00906, "test_loss": 8.190421600341796, "test_acc": 0.01, "lyapunov": 1.5670246782205295, "grad_norm": 0.10563473423950201, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 132.00989890098572 }, { "epoch": 97, "train_loss": 5.344517989196778, "train_acc": 0.00956, "test_loss": 7.861407074737548, "test_acc": 0.01, "lyapunov": 1.5693480187974622, "grad_norm": 0.11742062064295959, "grad_max_sv": 0.0026324169710278513, "grad_min_sv": 0.0, "grad_condition": 2632416971.027851, "lr": 0.00027768241040753615, "time_sec": 132.0594036579132 }, { "epoch": 98, "train_loss": 5.347235653991699, "train_acc": 0.0093, "test_loss": 7.575284122467041, "test_acc": 0.01, "lyapunov": 1.571171855682607, "grad_norm": 0.09980977977399007, "grad_max_sv": 0.02286601336672902, "grad_min_sv": 0.0, "grad_condition": 22866013366.729023, "lr": 0.00026835198244006903, "time_sec": 132.04233193397522 }, { "epoch": 99, "train_loss": 5.343029342498779, "train_acc": 0.00906, "test_loss": 7.45513014831543, "test_acc": 0.01, "lyapunov": 1.5681262549841801, "grad_norm": 0.09342461116650493, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 131.9914095401764 }, { "epoch": 100, "train_loss": 5.3494312777709965, "train_acc": 0.00946, "test_loss": 7.298580384063721, "test_acc": 0.01, "lyapunov": 1.573579462897747, "grad_norm": 0.11907283705246616, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 131.99966597557068 }, { "epoch": 101, "train_loss": 5.342477266693115, "train_acc": 0.00948, "test_loss": 7.23597857055664, "test_acc": 0.01, "lyapunov": 1.5675478393159559, "grad_norm": 0.09720728561760718, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 131.99136352539062 }, { "epoch": 102, "train_loss": 5.341832947845459, "train_acc": 0.00952, "test_loss": 6.885648638916016, "test_acc": 0.01, "lyapunov": 1.5668759388691933, "grad_norm": 0.09041804951245885, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 131.99253511428833 }, { "epoch": 103, "train_loss": 5.342141702270508, "train_acc": 0.00956, "test_loss": 7.227639694976807, "test_acc": 0.01, "lyapunov": 1.5670329186007799, "grad_norm": 0.09504910369326992, "grad_max_sv": 0.02663951087743044, "grad_min_sv": 0.0, "grad_condition": 26639510877.43044, "lr": 0.0002233042253783278, "time_sec": 132.1089026927948 }, { "epoch": 104, "train_loss": 5.342686755828858, "train_acc": 0.00952, "test_loss": 7.590157605743408, "test_acc": 0.01, "lyapunov": 1.5676686721079796, "grad_norm": 0.09647661834231228, "grad_max_sv": 0.024380091251805423, "grad_min_sv": 0.0, "grad_condition": 24380091251.805428, "lr": 0.000214643216157784, "time_sec": 132.06964230537415 }, { "epoch": 105, "train_loss": 5.344026827392578, "train_acc": 0.0095, "test_loss": 7.26397318649292, "test_acc": 0.01, "lyapunov": 1.569079797895973, "grad_norm": 0.09462212649965553, "grad_max_sv": 0.025716999545693398, "grad_min_sv": 0.0, "grad_condition": 25716999545.693398, "lr": 0.00020610737385376332, "time_sec": 132.05113744735718 }, { "epoch": 106, "train_loss": 5.343383273925781, "train_acc": 0.00984, "test_loss": 7.472719841003418, "test_acc": 0.01, "lyapunov": 1.5685262430049574, "grad_norm": 0.09652945369879859, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 132.04551148414612 }, { "epoch": 107, "train_loss": 5.343959386138916, "train_acc": 0.00958, "test_loss": 7.445523268127442, "test_acc": 0.01, "lyapunov": 1.5691688893091342, "grad_norm": 0.11388204494439719, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 132.02328181266785 }, { "epoch": 108, "train_loss": 5.342418379516602, "train_acc": 0.00956, "test_loss": 7.7173920944213865, "test_acc": 0.01, "lyapunov": 1.5675345683646629, "grad_norm": 0.09095832390063928, "grad_max_sv": 0.0006004700437188149, "grad_min_sv": 0.0, "grad_condition": 600470043.7188148, "lr": 0.000181288005125655, "time_sec": 132.05611062049866 }, { "epoch": 109, "train_loss": 5.343011405029297, "train_acc": 0.00944, "test_loss": 7.669947085571289, "test_acc": 0.01, "lyapunov": 1.5680827374958322, "grad_norm": 0.09262475373763442, "grad_max_sv": 0.005615572584792972, "grad_min_sv": 0.0, "grad_condition": 5615572584.792972, "lr": 0.0001732896980049473, "time_sec": 132.0278182029724 }, { "epoch": 110, "train_loss": 5.343270805511475, "train_acc": 0.00902, "test_loss": 7.524606921386718, "test_acc": 0.01, "lyapunov": 1.5684265477578048, "grad_norm": 0.0929528487372896, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 132.01432704925537 }, { "epoch": 111, "train_loss": 5.3430648620605465, "train_acc": 0.00908, "test_loss": 7.709186791992187, "test_acc": 0.01, "lyapunov": 1.568246929236995, "grad_norm": 0.08919578457075998, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 131.99741911888123 }, { "epoch": 112, "train_loss": 5.343547642822266, "train_acc": 0.00982, "test_loss": 7.633082518005371, "test_acc": 0.01, "lyapunov": 1.56872364535661, "grad_norm": 0.09053282340492008, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 131.9864740371704 }, { "epoch": 113, "train_loss": 5.349385154571533, "train_acc": 0.00926, "test_loss": 7.402510799407959, "test_acc": 0.01, "lyapunov": 1.573695613295221, "grad_norm": 0.1331401826658418, "grad_max_sv": 0.007452957844361663, "grad_min_sv": 0.0, "grad_condition": 7452957844.361662, "lr": 0.00014276366018359834, "time_sec": 131.9871220588684 }, { "epoch": 114, "train_loss": 5.3475169880676265, "train_acc": 0.00952, "test_loss": 7.718253441619873, "test_acc": 0.01, "lyapunov": 1.5723201231578428, "grad_norm": 0.12289444805074258, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 131.98372554779053 }, { "epoch": 115, "train_loss": 5.344510088806152, "train_acc": 0.0094, "test_loss": 7.667512203216552, "test_acc": 0.01, "lyapunov": 1.569762335713867, "grad_norm": 0.09241242910799227, "grad_max_sv": 0.008661840902641415, "grad_min_sv": 0.0, "grad_condition": 8661840902.641415, "lr": 0.00012842758726130276, "time_sec": 132.05068254470825 }, { "epoch": 116, "train_loss": 5.343971741943359, "train_acc": 0.00908, "test_loss": 7.700549072265625, "test_acc": 0.01, "lyapunov": 1.5691710436130728, "grad_norm": 0.10830143197848235, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 132.05018138885498 }, { "epoch": 117, "train_loss": 5.34632839920044, "train_acc": 0.00976, "test_loss": 7.761262622070313, "test_acc": 0.01, "lyapunov": 1.5713817326309125, "grad_norm": 0.11435501476976112, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 131.99043989181519 }, { "epoch": 118, "train_loss": 5.343400028686523, "train_acc": 0.0092, "test_loss": 7.794083961486816, "test_acc": 0.01, "lyapunov": 1.5685766228019733, "grad_norm": 0.08899614535065951, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 131.99262475967407 }, { "epoch": 119, "train_loss": 5.343056818084717, "train_acc": 0.00994, "test_loss": 7.639262364196777, "test_acc": 0.01, "lyapunov": 1.5682302356680946, "grad_norm": 0.08977728685492378, "grad_max_sv": 0.0006828804966062307, "grad_min_sv": 0.0, "grad_condition": 682880496.6062307, "lr": 0.00010173504098790182, "time_sec": 132.01868438720703 }, { "epoch": 120, "train_loss": 5.343217134552002, "train_acc": 0.00976, "test_loss": 7.660574660491943, "test_acc": 0.01, "lyapunov": 1.5684062449828438, "grad_norm": 0.09249377742678497, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 132.00144267082214 }, { "epoch": 121, "train_loss": 5.344638092651367, "train_acc": 0.00922, "test_loss": 7.663163458251953, "test_acc": 0.01, "lyapunov": 1.5699151044001665, "grad_norm": 0.1218726255205378, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 132.01804733276367 }, { "epoch": 122, "train_loss": 5.348134873046875, "train_acc": 0.00886, "test_loss": 7.884050512695312, "test_acc": 0.01, "lyapunov": 1.5724969224246872, "grad_norm": 0.09050076665656355, "grad_max_sv": 0.006364198122173548, "grad_min_sv": 0.0, "grad_condition": 6364198122.173548, "lr": 8.353937964495024e-05, "time_sec": 132.0272445678711 }, { "epoch": 123, "train_loss": 5.345365750579834, "train_acc": 0.00954, "test_loss": 7.118724527740478, "test_acc": 0.01, "lyapunov": 1.5703083133453604, "grad_norm": 0.09069370794057488, "grad_max_sv": 0.011258925357833505, "grad_min_sv": 0.0, "grad_condition": 11258925357.833506, "lr": 7.783603724899243e-05, "time_sec": 132.11900568008423 }, { "epoch": 124, "train_loss": 5.3431124142456055, "train_acc": 0.01036, "test_loss": 7.23227484741211, "test_acc": 0.01, "lyapunov": 1.568215018952899, "grad_norm": 0.09217613058420869, "grad_max_sv": 0.022803956363350152, "grad_min_sv": 0.0, "grad_condition": 22803956363.35015, "lr": 7.231786991974666e-05, "time_sec": 132.04238414764404 }, { "epoch": 125, "train_loss": 5.343697594146729, "train_acc": 0.00968, "test_loss": 7.098866456604004, "test_acc": 0.01, "lyapunov": 1.5689014327495605, "grad_norm": 0.09081931856189392, "grad_max_sv": 0.0006075550802052021, "grad_min_sv": 0.0, "grad_condition": 607555080.2052021, "lr": 6.698729810778072e-05, "time_sec": 132.0574872493744 }, { "epoch": 126, "train_loss": 5.34278548538208, "train_acc": 0.00934, "test_loss": 7.256412179565429, "test_acc": 0.01, "lyapunov": 1.5679547353778653, "grad_norm": 0.09038480638705418, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 132.04981470108032 }, { "epoch": 127, "train_loss": 5.342774636230469, "train_acc": 0.0091, "test_loss": 7.211266984558105, "test_acc": 0.01, "lyapunov": 1.567944114470421, "grad_norm": 0.089217745438497, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 132.0332305431366 }, { "epoch": 128, "train_loss": 5.343552632446289, "train_acc": 0.00974, "test_loss": 7.4164355209350585, "test_acc": 0.01, "lyapunov": 1.5687480887488636, "grad_norm": 0.11327584151012998, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 132.0342137813568 }, { "epoch": 129, "train_loss": 5.343920302124023, "train_acc": 0.00956, "test_loss": 7.272874592590332, "test_acc": 0.01, "lyapunov": 1.5691817562903285, "grad_norm": 0.09015948976899717, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 132.10112881660461 }, { "epoch": 130, "train_loss": 5.3440144625854495, "train_acc": 0.01, "test_loss": 7.378188175964356, "test_acc": 0.01, "lyapunov": 1.5693023784081344, "grad_norm": 0.08928317026508968, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 132.07870721817017 }, { "epoch": 131, "train_loss": 5.343164742889404, "train_acc": 0.01, "test_loss": 7.42498392944336, "test_acc": 0.01, "lyapunov": 1.5683802131496731, "grad_norm": 0.08938231829702648, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 132.035484790802 }, { "epoch": 132, "train_loss": 5.343568996734619, "train_acc": 0.01, "test_loss": 7.3698252609252926, "test_acc": 0.01, "lyapunov": 1.5688252653307317, "grad_norm": 0.08905121975076379, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 132.03120112419128 }, { "epoch": 133, "train_loss": 5.343650721282959, "train_acc": 0.01, "test_loss": 7.399177293395996, "test_acc": 0.01, "lyapunov": 1.568874374070131, "grad_norm": 0.08945297165320838, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 132.04973649978638 }, { "epoch": 134, "train_loss": 5.344010626678466, "train_acc": 0.01, "test_loss": 7.451564918518066, "test_acc": 0.01, "lyapunov": 1.569275133750018, "grad_norm": 0.08901909798719944, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 132.0272672176361 }, { "epoch": 135, "train_loss": 5.3513097511291505, "train_acc": 0.01, "test_loss": 7.494620336914062, "test_acc": 0.01, "lyapunov": 1.5749251406515956, "grad_norm": 0.11347426013089548, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 132.07217669487 }, { "epoch": 136, "train_loss": 5.344121324768066, "train_acc": 0.01, "test_loss": 7.466115431976318, "test_acc": 0.01, "lyapunov": 1.5693210134725741, "grad_norm": 0.13961703652050822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 132.09098315238953 }, { "epoch": 137, "train_loss": 5.3435055235290525, "train_acc": 0.01, "test_loss": 7.356763949584961, "test_acc": 0.01, "lyapunov": 1.5687689787286627, "grad_norm": 0.08881051948095202, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 132.01117372512817 }, { "epoch": 138, "train_loss": 5.343292431945801, "train_acc": 0.01, "test_loss": 7.423162863159179, "test_acc": 0.01, "lyapunov": 1.5685121305763263, "grad_norm": 0.08882639322875942, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 132.0426745414734 }, { "epoch": 139, "train_loss": 5.345961066894532, "train_acc": 0.01, "test_loss": 7.442799024963379, "test_acc": 0.01, "lyapunov": 1.5709345974885593, "grad_norm": 0.11315656196544904, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 132.11658310890198 }, { "epoch": 140, "train_loss": 5.343492304992676, "train_acc": 0.01, "test_loss": 7.444627010345459, "test_acc": 0.01, "lyapunov": 1.5687398992840895, "grad_norm": 0.08884505400987935, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 132.04373836517334 }, { "epoch": 141, "train_loss": 5.344924531860352, "train_acc": 0.01, "test_loss": 7.465608943176269, "test_acc": 0.01, "lyapunov": 1.570182631387735, "grad_norm": 0.0880861679030681, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 132.03311824798584 }, { "epoch": 142, "train_loss": 5.343007263793945, "train_acc": 0.01, "test_loss": 7.4812581214904785, "test_acc": 0.01, "lyapunov": 1.5682257471791923, "grad_norm": 0.08813951319538865, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 132.02575135231018 }, { "epoch": 143, "train_loss": 5.343106704711914, "train_acc": 0.01, "test_loss": 7.437115397644043, "test_acc": 0.01, "lyapunov": 1.5683247204631796, "grad_norm": 0.10158596989760496, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 132.05020785331726 }, { "epoch": 144, "train_loss": 5.34294032119751, "train_acc": 0.01, "test_loss": 7.48037815246582, "test_acc": 0.01, "lyapunov": 1.5681621552733205, "grad_norm": 0.08833317407426634, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 132.06616115570068 }, { "epoch": 145, "train_loss": 5.3438012377929685, "train_acc": 0.01, "test_loss": 7.496150346374511, "test_acc": 0.01, "lyapunov": 1.5690925231065287, "grad_norm": 0.08791012889132134, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 132.04411220550537 }, { "epoch": 146, "train_loss": 5.342738318328857, "train_acc": 0.01, "test_loss": 7.490428826141358, "test_acc": 0.01, "lyapunov": 1.5679414330236137, "grad_norm": 0.08841039102397012, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 132.08523440361023 }, { "epoch": 147, "train_loss": 5.3446823258972165, "train_acc": 0.01, "test_loss": 7.497726692199707, "test_acc": 0.01, "lyapunov": 1.5699935627105597, "grad_norm": 0.08776043049557726, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 132.03058862686157 }, { "epoch": 148, "train_loss": 5.343377943572998, "train_acc": 0.01, "test_loss": 7.49042504272461, "test_acc": 0.01, "lyapunov": 1.5686415504006779, "grad_norm": 0.08845953592324265, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 132.1206715106964 }, { "epoch": 149, "train_loss": 5.342948052978516, "train_acc": 0.01, "test_loss": 7.490426095581054, "test_acc": 0.01, "lyapunov": 1.5681962311420294, "grad_norm": 0.08842267718527619, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 132.15464973449707 }, { "epoch": 150, "train_loss": 5.341931441345215, "train_acc": 0.01, "test_loss": 7.487130715942383, "test_acc": 0.01, "lyapunov": 1.567085372822364, "grad_norm": 0.0882430826444348, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 132.04750204086304 } ], "16": [ { "epoch": 1, "train_loss": 5.159331872253418, "train_acc": 0.01526, "test_loss": 4.873309817504883, "test_acc": 0.0093, "lyapunov": 2.4743038653717626, "grad_norm": 5.258705722697472, "grad_max_sv": 4.479718285799026, "grad_min_sv": 8.709666913797598e-08, "grad_condition": 86685976.9902235, "lr": 0.0009998903417374227, "time_sec": 177.3543930053711 }, { "epoch": 2, "train_loss": 4.886084578857422, "train_acc": 0.01782, "test_loss": 4.853029528808594, "test_acc": 0.01, "lyapunov": 1.9916716545744015, "grad_norm": 3.460383424161388, "grad_max_sv": 2.7798140585422515, "grad_min_sv": 5.706028290974885e-08, "grad_condition": 56364730.82112197, "lr": 0.0009995614150494292, "time_sec": 177.3599088191986 }, { "epoch": 3, "train_loss": 4.784042566375732, "train_acc": 0.01776, "test_loss": 4.790321257781982, "test_acc": 0.0116, "lyapunov": 1.7964752174704277, "grad_norm": 2.38204770499042, "grad_max_sv": 1.8151098906993866, "grad_min_sv": 3.787766869461917e-08, "grad_condition": 87913704.86086728, "lr": 0.0009990133642141358, "time_sec": 177.30120587348938 }, { "epoch": 4, "train_loss": 4.7238768682861325, "train_acc": 0.017, "test_loss": 4.624422996520996, "test_acc": 0.01, "lyapunov": 1.708475301332791, "grad_norm": 1.1762359291788405, "grad_max_sv": 0.7854173953674035, "grad_min_sv": 9.800736290438679e-09, "grad_condition": 32224269144.49076, "lr": 0.0009982464296247522, "time_sec": 177.37837982177734 }, { "epoch": 5, "train_loss": 4.755855419616699, "train_acc": 0.01562, "test_loss": 4.610174011230469, "test_acc": 0.01, "lyapunov": 1.675043061871053, "grad_norm": 0.7259009952417778, "grad_max_sv": 0.5301507465541363, "grad_min_sv": 5.1440461827152224e-11, "grad_condition": 105915112802.73376, "lr": 0.0009972609476841367, "time_sec": 177.381986618042 }, { "epoch": 6, "train_loss": 4.81643141998291, "train_acc": 0.01288, "test_loss": 4.60545783996582, "test_acc": 0.01, "lyapunov": 1.6532284676876214, "grad_norm": 0.4607532772533372, "grad_max_sv": 0.3609377399086952, "grad_min_sv": 5.305074951633812e-13, "grad_condition": 279971546429.15295, "lr": 0.000996057350657239, "time_sec": 177.434068441391 }, { "epoch": 7, "train_loss": 4.86136633392334, "train_acc": 0.01224, "test_loss": 5.360651237487793, "test_acc": 0.01, "lyapunov": 1.6404305040988776, "grad_norm": 0.3680696909769052, "grad_max_sv": 0.316419655829668, "grad_min_sv": 4.076535490995613e-14, "grad_condition": 307643620830.443, "lr": 0.000994636166481494, "time_sec": 177.2750985622406 }, { "epoch": 8, "train_loss": 4.912417060089111, "train_acc": 0.01054, "test_loss": 9.9219926071167, "test_acc": 0.01, "lyapunov": 1.6378350980446468, "grad_norm": 0.4461762738170382, "grad_max_sv": 0.26778712812811134, "grad_min_sv": 1.894336000793759e-10, "grad_condition": 230695726821.5417, "lr": 0.0009929980185352525, "time_sec": 177.29276037216187 }, { "epoch": 9, "train_loss": 4.968367258911133, "train_acc": 0.00954, "test_loss": 7.827674491882324, "test_acc": 0.01, "lyapunov": 1.624799670465767, "grad_norm": 0.5375330781925154, "grad_max_sv": 0.19412051439285277, "grad_min_sv": 1.2617160814236554e-09, "grad_condition": 49059473464.09962, "lr": 0.0009911436253643444, "time_sec": 177.24522376060486 }, { "epoch": 10, "train_loss": 5.062082354125977, "train_acc": 0.01038, "test_loss": 5.569893667602539, "test_acc": 0.01, "lyapunov": 1.6864765662976238, "grad_norm": 0.753548419446606, "grad_max_sv": 0.4160853669047356, "grad_min_sv": 5.35826894499278e-09, "grad_condition": 10262508595.882322, "lr": 0.0009890738003669028, "time_sec": 177.3631317615509 }, { "epoch": 11, "train_loss": 5.058011302032471, "train_acc": 0.00952, "test_loss": 5.087331884002686, "test_acc": 0.01, "lyapunov": 1.6062763267770752, "grad_norm": 0.6603912459051273, "grad_max_sv": 0.3468701772391796, "grad_min_sv": 4.421987463785291e-09, "grad_condition": 31727265214.824364, "lr": 0.00098678945143658, "time_sec": 177.38562989234924 }, { "epoch": 12, "train_loss": 5.058439118957519, "train_acc": 0.00978, "test_loss": 5.082496954345703, "test_acc": 0.01, "lyapunov": 1.5697322474111377, "grad_norm": 0.3523516525308902, "grad_max_sv": 0.15937897935509682, "grad_min_sv": 1.873834291129129e-09, "grad_condition": 2759306059.465498, "lr": 0.0009842915805643154, "time_sec": 177.36675763130188 }, { "epoch": 13, "train_loss": 5.109822076416016, "train_acc": 0.00966, "test_loss": 5.692898876953125, "test_acc": 0.01, "lyapunov": 1.5695562542551924, "grad_norm": 0.4593422563560374, "grad_max_sv": 0.35409238263964654, "grad_min_sv": 4.71099455383317e-09, "grad_condition": 127958722.61296721, "lr": 0.000981581283398829, "time_sec": 177.44806337356567 }, { "epoch": 14, "train_loss": 5.165816433410645, "train_acc": 0.01014, "test_loss": 7.84957985534668, "test_acc": 0.01, "lyapunov": 1.5709327590435058, "grad_norm": 0.5694077536605798, "grad_max_sv": 0.4453627858310938, "grad_min_sv": 5.610913853565864e-09, "grad_condition": 15313856896.7998, "lr": 0.0009786597487660333, "time_sec": 177.33772945404053 }, { "epoch": 15, "train_loss": 5.173155229797363, "train_acc": 0.00972, "test_loss": 5.157973370361328, "test_acc": 0.01, "lyapunov": 1.5706551062786365, "grad_norm": 0.43055135839909847, "grad_max_sv": 0.21150126457214355, "grad_min_sv": 1.4762666979190565e-09, "grad_condition": 47799778820.01504, "lr": 0.0009755282581475766, "time_sec": 177.33515882492065 }, { "epoch": 16, "train_loss": 5.207788455657959, "train_acc": 0.00962, "test_loss": 7.759160287475586, "test_acc": 0.01, "lyapunov": 1.5720331275554569, "grad_norm": 0.3894440758556563, "grad_max_sv": 0.1499915760010481, "grad_min_sv": 1.4193079274022143e-09, "grad_condition": 19769526881.522236, "lr": 0.0009721881851187403, "time_sec": 177.28159952163696 }, { "epoch": 17, "train_loss": 5.25385222076416, "train_acc": 0.00914, "test_loss": 4.720599290466309, "test_acc": 0.01, "lyapunov": 1.579244610293747, "grad_norm": 0.3647403085884025, "grad_max_sv": 0.17017204388976098, "grad_min_sv": 1.3479770702114132e-09, "grad_condition": 29838909132.92096, "lr": 0.0009686409947459456, "time_sec": 177.3482620716095 }, { "epoch": 18, "train_loss": 5.290630603790283, "train_acc": 0.00966, "test_loss": 4.818104879760742, "test_acc": 0.01, "lyapunov": 1.572280853300753, "grad_norm": 0.42846936793954693, "grad_max_sv": 0.2142110202461481, "grad_min_sv": 2.2586123961791682e-09, "grad_condition": 6069325065.621381, "lr": 0.0009648882429441254, "time_sec": 177.32465243339539 }, { "epoch": 19, "train_loss": 5.347908495483399, "train_acc": 0.00976, "test_loss": 4.680776121520996, "test_acc": 0.01, "lyapunov": 1.575872380715197, "grad_norm": 0.575049551174443, "grad_max_sv": 0.43422624468803406, "grad_min_sv": 4.46815191792408e-09, "grad_condition": 771924430.9754374, "lr": 0.00096093157579425, "time_sec": 177.39169430732727 }, { "epoch": 20, "train_loss": 5.372361971588135, "train_acc": 0.0092, "test_loss": 4.661239500427246, "test_acc": 0.01, "lyapunov": 1.5752952742149762, "grad_norm": 0.48504969680471643, "grad_max_sv": 0.3245972327888012, "grad_min_sv": 3.24804563384129e-09, "grad_condition": 111189476.23947105, "lr": 0.0009567727288213001, "time_sec": 177.45550775527954 }, { "epoch": 21, "train_loss": 5.37029109954834, "train_acc": 0.00994, "test_loss": 4.667470470428467, "test_acc": 0.01, "lyapunov": 1.5776933690775996, "grad_norm": 0.5453589213556644, "grad_max_sv": 0.3167274951934814, "grad_min_sv": 1.839770059066596e-09, "grad_condition": 35181903296.3187, "lr": 0.0009524135262330095, "time_sec": 177.39379477500916 }, { "epoch": 22, "train_loss": 5.364489818725586, "train_acc": 0.01004, "test_loss": 4.650138076782227, "test_acc": 0.01, "lyapunov": 1.5788932602728725, "grad_norm": 0.41535739480122674, "grad_max_sv": 0.2576656248420477, "grad_min_sv": 1.5858205317854233e-12, "grad_condition": 141035021433.30975, "lr": 0.0009478558801197061, "time_sec": 177.35208559036255 }, { "epoch": 23, "train_loss": 5.354643789978027, "train_acc": 0.0095, "test_loss": 4.695660099029541, "test_acc": 0.01, "lyapunov": 1.5758325334095284, "grad_norm": 0.30581042910039435, "grad_max_sv": 0.09805708080530166, "grad_min_sv": 6.027597976882962e-11, "grad_condition": 58654490617.71743, "lr": 0.000943101789615607, "time_sec": 177.3221151828766 }, { "epoch": 24, "train_loss": 5.353882457122802, "train_acc": 0.00926, "test_loss": 4.697132012939453, "test_acc": 0.01, "lyapunov": 1.578979221756196, "grad_norm": 0.24237849220724425, "grad_max_sv": 0.008070914912968874, "grad_min_sv": 0.0, "grad_condition": 8070914912.968875, "lr": 0.0009381533400219313, "time_sec": 177.2640483379364 }, { "epoch": 25, "train_loss": 5.351721515655518, "train_acc": 0.00882, "test_loss": 4.700634111022949, "test_acc": 0.01, "lyapunov": 1.5769606035993533, "grad_norm": 0.299683664855393, "grad_max_sv": 0.0009750408120453357, "grad_min_sv": 0.0, "grad_condition": 975040812.0453358, "lr": 0.0009330127018922189, "time_sec": 177.26898193359375 }, { "epoch": 26, "train_loss": 5.350724313659668, "train_acc": 0.00882, "test_loss": 4.976845028686523, "test_acc": 0.01, "lyapunov": 1.5759871856635794, "grad_norm": 0.25282322824422004, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000927682130080253, "time_sec": 177.23982048034668 }, { "epoch": 27, "train_loss": 5.3572762519836425, "train_acc": 0.00916, "test_loss": 4.699456916046143, "test_acc": 0.01, "lyapunov": 1.5826555691716615, "grad_norm": 0.3870563147260469, "grad_max_sv": 0.0008042730391025543, "grad_min_sv": 0.0, "grad_condition": 804273039.1025543, "lr": 0.0009221639627510072, "time_sec": 177.22700691223145 }, { "epoch": 28, "train_loss": 5.352617038269043, "train_acc": 0.0083, "test_loss": 4.97811413192749, "test_acc": 0.01, "lyapunov": 1.5779867312487434, "grad_norm": 0.23788834158418645, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009164606203550494, "time_sec": 177.21826004981995 }, { "epoch": 29, "train_loss": 5.361850127716065, "train_acc": 0.00882, "test_loss": 4.701448201751709, "test_acc": 0.01, "lyapunov": 1.5833598887524032, "grad_norm": 0.42995748870040046, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009105746045668516, "time_sec": 177.21908974647522 }, { "epoch": 30, "train_loss": 5.358213574829102, "train_acc": 0.00904, "test_loss": 5.412950395202636, "test_acc": 0.01, "lyapunov": 1.5822858404930291, "grad_norm": 0.331672095140798, "grad_max_sv": 0.0007659861817955971, "grad_min_sv": 0.0, "grad_condition": 765986181.7955971, "lr": 0.0009045084971874733, "time_sec": 177.25155925750732 }, { "epoch": 31, "train_loss": 5.359104016113282, "train_acc": 0.00934, "test_loss": 4.669879191589356, "test_acc": 0.01, "lyapunov": 1.5799903305595184, "grad_norm": 0.2952731697889261, "grad_max_sv": 0.07996195461601019, "grad_min_sv": 1.8027052930896337e-13, "grad_condition": 65774856592.69602, "lr": 0.0008982649590120977, "time_sec": 177.35512685775757 }, { "epoch": 32, "train_loss": 5.376470304718017, "train_acc": 0.0094, "test_loss": 5.556229885864258, "test_acc": 0.01, "lyapunov": 1.5852845087075782, "grad_norm": 0.34062130802734397, "grad_max_sv": 0.1435967419296503, "grad_min_sv": 4.671640446328522e-10, "grad_condition": 42736336798.66166, "lr": 0.0008918467286629196, "time_sec": 177.3573558330536 }, { "epoch": 33, "train_loss": 5.354219467468262, "train_acc": 0.00872, "test_loss": 5.552221805572509, "test_acc": 0.01, "lyapunov": 1.5796612647488295, "grad_norm": 0.24724638679639113, "grad_max_sv": 0.012037708284333348, "grad_min_sv": 0.0, "grad_condition": 12037708284.333347, "lr": 0.0008852566213878943, "time_sec": 177.34085536003113 }, { "epoch": 34, "train_loss": 5.358693110198975, "train_acc": 0.00966, "test_loss": 5.034206434631348, "test_acc": 0.01, "lyapunov": 1.5802869622969566, "grad_norm": 0.26366751089242085, "grad_max_sv": 0.08639110988005996, "grad_min_sv": 4.474218043386011e-15, "grad_condition": 85802279590.28976, "lr": 0.000878497527825878, "time_sec": 177.4128155708313 }, { "epoch": 35, "train_loss": 5.366087015075683, "train_acc": 0.00934, "test_loss": 4.936266462707519, "test_acc": 0.01, "lyapunov": 1.584944297285641, "grad_norm": 0.3376396372917839, "grad_max_sv": 0.1203163092955947, "grad_min_sv": 2.7491684533434274e-14, "grad_condition": 116380291473.68535, "lr": 0.000871572412738697, "time_sec": 177.40404987335205 }, { "epoch": 36, "train_loss": 5.361581598358154, "train_acc": 0.01024, "test_loss": 4.950734414672851, "test_acc": 0.01, "lyapunov": 1.5822551268750749, "grad_norm": 0.35809443213096964, "grad_max_sv": 0.13039383399300278, "grad_min_sv": 9.003150469885764e-15, "grad_condition": 129198667968.56705, "lr": 0.0008644843137107055, "time_sec": 177.38117098808289 }, { "epoch": 37, "train_loss": 5.367499517974854, "train_acc": 0.00976, "test_loss": 5.498499377441406, "test_acc": 0.01, "lyapunov": 1.58695989923404, "grad_norm": 0.3008050326299743, "grad_max_sv": 0.1228790944442153, "grad_min_sv": 5.822944316845422e-15, "grad_condition": 122173960457.34317, "lr": 0.0008572363398164014, "time_sec": 177.40381455421448 }, { "epoch": 38, "train_loss": 5.360039620361328, "train_acc": 0.0097, "test_loss": 5.010895380401611, "test_acc": 0.01, "lyapunov": 1.5823902507572223, "grad_norm": 0.28800004102415633, "grad_max_sv": 0.10303753465414048, "grad_min_sv": 1.7600771723101566e-15, "grad_condition": 102819314675.69463, "lr": 0.0008498316702566826, "time_sec": 177.36353826522827 }, { "epoch": 39, "train_loss": 5.361895691375732, "train_acc": 0.00962, "test_loss": 5.47797232055664, "test_acc": 0.01, "lyapunov": 1.5826790979146348, "grad_norm": 0.3607282899922051, "grad_max_sv": 0.1270065199583769, "grad_min_sv": 5.8177677532204334e-15, "grad_condition": 126306540301.11067, "lr": 0.0008422735529643442, "time_sec": 177.36847496032715 }, { "epoch": 40, "train_loss": 5.360779151458741, "train_acc": 0.00974, "test_loss": 4.913441442871094, "test_acc": 0.01, "lyapunov": 1.5841997578320905, "grad_norm": 0.30144541489536497, "grad_max_sv": 0.08766317497938872, "grad_min_sv": 3.1235879522614164e-15, "grad_condition": 87300355595.9631, "lr": 0.0008345653031794289, "time_sec": 177.39417672157288 }, { "epoch": 41, "train_loss": 5.361253643188476, "train_acc": 0.00952, "test_loss": 5.392577352905273, "test_acc": 0.01, "lyapunov": 1.584902299334631, "grad_norm": 0.33710076786895654, "grad_max_sv": 0.07017813064157963, "grad_min_sv": 1.8795491026783212e-20, "grad_condition": 70178128751.4103, "lr": 0.0008267103019950526, "time_sec": 177.4070680141449 }, { "epoch": 42, "train_loss": 5.359663697814941, "train_acc": 0.00966, "test_loss": 5.435651000976563, "test_acc": 0.01, "lyapunov": 1.583795747793544, "grad_norm": 0.44265142669444985, "grad_max_sv": 0.06058515841141343, "grad_min_sv": 8.532913146218004e-39, "grad_condition": 60585158411.41343, "lr": 0.0008187119948743447, "time_sec": 177.301589012146 }, { "epoch": 43, "train_loss": 5.361796244659423, "train_acc": 0.0104, "test_loss": 5.4946890060424805, "test_acc": 0.01, "lyapunov": 1.5847100778613858, "grad_norm": 0.6384686198807327, "grad_max_sv": 0.08455213336274028, "grad_min_sv": 1.854097809152722e-15, "grad_condition": 84328075575.36731, "lr": 0.000810573890139155, "time_sec": 177.35142517089844 }, { "epoch": 44, "train_loss": 5.364447811279297, "train_acc": 0.01014, "test_loss": 5.332209419250488, "test_acc": 0.01, "lyapunov": 1.5854847031786008, "grad_norm": 0.675284019586962, "grad_max_sv": 0.11337836356833578, "grad_min_sv": 1.7049374807524963e-14, "grad_condition": 111308573138.52168, "lr": 0.0008022995574311873, "time_sec": 177.3521008491516 }, { "epoch": 45, "train_loss": 5.360489757080078, "train_acc": 0.00976, "test_loss": 5.304935124206543, "test_acc": 0.01, "lyapunov": 1.5837746992745363, "grad_norm": 0.5718003616383085, "grad_max_sv": 0.08602348966524005, "grad_min_sv": 3.0378301121606614e-16, "grad_condition": 85997891115.73683, "lr": 0.0007938926261462363, "time_sec": 177.33692407608032 }, { "epoch": 46, "train_loss": 5.361809297485352, "train_acc": 0.01014, "test_loss": 4.89552943725586, "test_acc": 0.01, "lyapunov": 1.585215172194459, "grad_norm": 0.44412809114793517, "grad_max_sv": 0.0825215914286673, "grad_min_sv": 1.1713936618830865e-15, "grad_condition": 82407893767.02434, "lr": 0.0007853567838422158, "time_sec": 177.35017251968384 }, { "epoch": 47, "train_loss": 5.361848121795655, "train_acc": 0.00954, "test_loss": 4.982022219848633, "test_acc": 0.01, "lyapunov": 1.5858572995876108, "grad_norm": 0.4284143094057381, "grad_max_sv": 0.06426824014633895, "grad_min_sv": 5.420102114032563e-18, "grad_condition": 64267673459.65764, "lr": 0.0007766957746216719, "time_sec": 177.3225803375244 }, { "epoch": 48, "train_loss": 5.360097906646729, "train_acc": 0.0101, "test_loss": 5.039643939208984, "test_acc": 0.01, "lyapunov": 1.5852815909763736, "grad_norm": 0.21919166507419222, "grad_max_sv": 0.02766723851673305, "grad_min_sv": 0.0, "grad_condition": 27667238516.73305, "lr": 0.0007679133974894982, "time_sec": 177.3571081161499 }, { "epoch": 49, "train_loss": 5.361355583496094, "train_acc": 0.00912, "test_loss": 4.70521968460083, "test_acc": 0.01, "lyapunov": 1.587215112603229, "grad_norm": 0.31401296813167406, "grad_max_sv": 0.0012400273233652114, "grad_min_sv": 0.0, "grad_condition": 1240027323.3652115, "lr": 0.000759013504686565, "time_sec": 177.23792433738708 }, { "epoch": 50, "train_loss": 5.374890024871826, "train_acc": 0.00998, "test_loss": 5.3741009857177735, "test_acc": 0.01, "lyapunov": 1.5953726881300396, "grad_norm": 0.3238754552354357, "grad_max_sv": 0.04934265548363328, "grad_min_sv": 2.6824701739898724e-33, "grad_condition": 49342655483.63328, "lr": 0.0007499999999999998, "time_sec": 177.3176691532135 }, { "epoch": 51, "train_loss": 5.359442653961182, "train_acc": 0.0091, "test_loss": 5.708284506988526, "test_acc": 0.01, "lyapunov": 1.5848879155600468, "grad_norm": 0.19742833159549178, "grad_max_sv": 0.019448843877762557, "grad_min_sv": 4.3389140032583084e-41, "grad_condition": 19448843877.762554, "lr": 0.0007408768370508575, "time_sec": 177.30614399909973 }, { "epoch": 52, "train_loss": 5.357807418670654, "train_acc": 0.00892, "test_loss": 5.598787411499023, "test_acc": 0.01, "lyapunov": 1.5835388462866664, "grad_norm": 0.22895282871195646, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007316480175599307, "time_sec": 177.23059678077698 }, { "epoch": 53, "train_loss": 5.364920553588867, "train_acc": 0.00838, "test_loss": 5.555523378753662, "test_acc": 0.01, "lyapunov": 1.5897833791840108, "grad_norm": 0.27349172628604307, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007223175895924635, "time_sec": 177.23636078834534 }, { "epoch": 54, "train_loss": 5.360137451934815, "train_acc": 0.00904, "test_loss": 5.4607298324584965, "test_acc": 0.01, "lyapunov": 1.585875649586358, "grad_norm": 0.3494380261105508, "grad_max_sv": 0.009265018161386251, "grad_min_sv": 0.0, "grad_condition": 9265018161.386251, "lr": 0.0007128896457825361, "time_sec": 177.3195767402649 }, { "epoch": 55, "train_loss": 5.361894327392578, "train_acc": 0.01076, "test_loss": 5.3967264434814455, "test_acc": 0.01, "lyapunov": 1.5858059591039673, "grad_norm": 0.32616838064335635, "grad_max_sv": 0.06554236207157374, "grad_min_sv": 3.9627266810538444e-22, "grad_condition": 65542362038.60982, "lr": 0.0007033683215378998, "time_sec": 177.4070463180542 }, { "epoch": 56, "train_loss": 5.361103507232666, "train_acc": 0.00966, "test_loss": 5.396138972473144, "test_acc": 0.01, "lyapunov": 1.585260014399848, "grad_norm": 0.24476233592152788, "grad_max_sv": 0.053304498083889484, "grad_min_sv": 8.107207506846484e-17, "grad_condition": 53297506440.79659, "lr": 0.0006937577932260512, "time_sec": 177.3034119606018 }, { "epoch": 57, "train_loss": 5.3623845806884765, "train_acc": 0.00962, "test_loss": 5.060037421417237, "test_acc": 0.01, "lyapunov": 1.5866734694946758, "grad_norm": 0.28857632314696974, "grad_max_sv": 0.06447782786563039, "grad_min_sv": 1.9607974133287156e-16, "grad_condition": 64457267604.59035, "lr": 0.0006840622763423388, "time_sec": 177.35450506210327 }, { "epoch": 58, "train_loss": 5.361771304779053, "train_acc": 0.01002, "test_loss": 5.0901702087402345, "test_acc": 0.01, "lyapunov": 1.586991887873091, "grad_norm": 0.23271259978105882, "grad_max_sv": 0.04189403969794512, "grad_min_sv": 2.1019476964872255e-46, "grad_condition": 41894039697.945114, "lr": 0.0006742860236609073, "time_sec": 177.32643222808838 }, { "epoch": 59, "train_loss": 5.360649804382324, "train_acc": 0.00986, "test_loss": 5.02971961517334, "test_acc": 0.01, "lyapunov": 1.5858081442010983, "grad_norm": 0.25490660325152764, "grad_max_sv": 0.04079276975244284, "grad_min_sv": 0.0, "grad_condition": 40792769752.44284, "lr": 0.0006644333233692913, "time_sec": 177.3179268836975 }, { "epoch": 60, "train_loss": 5.364020364685058, "train_acc": 0.00904, "test_loss": 4.7199004196167, "test_acc": 0.01, "lyapunov": 1.5886733891713956, "grad_norm": 0.22342122942097759, "grad_max_sv": 0.027459373604506253, "grad_min_sv": 0.0, "grad_condition": 27459373604.506256, "lr": 0.0006545084971874734, "time_sec": 177.30202984809875 }, { "epoch": 61, "train_loss": 5.363523327484131, "train_acc": 0.00934, "test_loss": 4.7266477081298826, "test_acc": 0.01, "lyapunov": 1.5883313112551598, "grad_norm": 0.20389335925530302, "grad_max_sv": 0.045495460741221905, "grad_min_sv": 1.4012984643248171e-46, "grad_condition": 45495460741.2219, "lr": 0.0006445158984722354, "time_sec": 177.32515287399292 }, { "epoch": 62, "train_loss": 5.367948243408203, "train_acc": 0.0091, "test_loss": 4.75396729888916, "test_acc": 0.01, "lyapunov": 1.5914591578266504, "grad_norm": 0.255614489528913, "grad_max_sv": 0.03248326424509287, "grad_min_sv": 1.3219893653396629e-33, "grad_condition": 32483264245.092873, "lr": 0.0006344599103076324, "time_sec": 177.34726858139038 }, { "epoch": 63, "train_loss": 5.360079801940918, "train_acc": 0.0094, "test_loss": 5.19269112701416, "test_acc": 0.01, "lyapunov": 1.5859909679578699, "grad_norm": 0.247568680367887, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 177.2823510169983 }, { "epoch": 64, "train_loss": 5.359493107910156, "train_acc": 0.00876, "test_loss": 5.2250466796875, "test_acc": 0.01, "lyapunov": 1.585366655188753, "grad_norm": 0.2769224967661722, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 177.23246479034424 }, { "epoch": 65, "train_loss": 5.361286865844726, "train_acc": 0.00938, "test_loss": 5.298229453277588, "test_acc": 0.01, "lyapunov": 1.5870976630988938, "grad_norm": 0.24716357558635968, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006039558454088793, "time_sec": 177.274742603302 }, { "epoch": 66, "train_loss": 5.360220510559082, "train_acc": 0.00942, "test_loss": 5.1931522216796875, "test_acc": 0.01, "lyapunov": 1.5856442792946115, "grad_norm": 0.21643181506904438, "grad_max_sv": 0.028073416696861385, "grad_min_sv": 0.0, "grad_condition": 28073416696.86139, "lr": 0.000593690657292862, "time_sec": 177.3214614391327 }, { "epoch": 67, "train_loss": 5.3634411520385745, "train_acc": 0.01004, "test_loss": 4.726324760437012, "test_acc": 0.01, "lyapunov": 1.5876712076499333, "grad_norm": 0.19917891606110388, "grad_max_sv": 0.06480920519679785, "grad_min_sv": 5.826939700269216e-27, "grad_condition": 64809205196.797485, "lr": 0.0005833843733580507, "time_sec": 177.30631113052368 }, { "epoch": 68, "train_loss": 5.3627893775939945, "train_acc": 0.0096, "test_loss": 4.78324942779541, "test_acc": 0.01, "lyapunov": 1.5872700497927263, "grad_norm": 0.17814025282763096, "grad_max_sv": 0.05710890954360366, "grad_min_sv": 1.642725198984103e-39, "grad_condition": 57108909543.60366, "lr": 0.0005730415142812054, "time_sec": 177.28468227386475 }, { "epoch": 69, "train_loss": 5.36284663772583, "train_acc": 0.01016, "test_loss": 4.65924833908081, "test_acc": 0.01, "lyapunov": 1.5882405993883566, "grad_norm": 0.18974647851723686, "grad_max_sv": 0.03764563817530871, "grad_min_sv": 0.0, "grad_condition": 37645638175.3087, "lr": 0.0005626666167821517, "time_sec": 177.30268549919128 }, { "epoch": 70, "train_loss": 5.365585427398682, "train_acc": 0.00962, "test_loss": 4.667314112854004, "test_acc": 0.01, "lyapunov": 1.58941994451196, "grad_norm": 0.17127250466631513, "grad_max_sv": 0.043766821082681415, "grad_min_sv": 0.0, "grad_condition": 43766821082.68142, "lr": 0.0005522642316338265, "time_sec": 177.31375312805176 }, { "epoch": 71, "train_loss": 5.360834673461914, "train_acc": 0.0103, "test_loss": 4.691217092895508, "test_acc": 0.01, "lyapunov": 1.5854695108540529, "grad_norm": 0.15750040762462056, "grad_max_sv": 0.05662639001384377, "grad_min_sv": 0.0, "grad_condition": 56626390013.84377, "lr": 0.0005418389216661573, "time_sec": 177.3107042312622 }, { "epoch": 72, "train_loss": 5.360965846557617, "train_acc": 0.01014, "test_loss": 4.686003870391846, "test_acc": 0.01, "lyapunov": 1.586221619945048, "grad_norm": 0.1761841219237378, "grad_max_sv": 0.051002619601786134, "grad_min_sv": 0.0, "grad_condition": 51002619601.78613, "lr": 0.0005313952597646563, "time_sec": 177.28891253471375 }, { "epoch": 73, "train_loss": 5.365758000946045, "train_acc": 0.00988, "test_loss": 4.678875315856933, "test_acc": 0.01, "lyapunov": 1.5900602660825491, "grad_norm": 0.21832467373191636, "grad_max_sv": 0.06282770875841379, "grad_min_sv": 0.0, "grad_condition": 62827708758.413795, "lr": 0.0005209378268645994, "time_sec": 177.3162078857422 }, { "epoch": 74, "train_loss": 5.365496074371338, "train_acc": 0.0093, "test_loss": 4.655053031921387, "test_acc": 0.01, "lyapunov": 1.589696585979608, "grad_norm": 0.23086253967925782, "grad_max_sv": 0.060001683793962, "grad_min_sv": 0.0, "grad_condition": 60001683793.962, "lr": 0.0005104712099416781, "time_sec": 177.30215072631836 }, { "epoch": 75, "train_loss": 5.364179220275879, "train_acc": 0.0099, "test_loss": 4.638170684051514, "test_acc": 0.01, "lyapunov": 1.5883820352651883, "grad_norm": 0.3049112090346521, "grad_max_sv": 0.05380613347515464, "grad_min_sv": 0.0, "grad_condition": 53806133475.15464, "lr": 0.0004999999999999996, "time_sec": 177.36862349510193 }, { "epoch": 76, "train_loss": 5.359675194854736, "train_acc": 0.01046, "test_loss": 4.649093914794922, "test_acc": 0.01, "lyapunov": 1.5854026216375248, "grad_norm": 0.2119481091202284, "grad_max_sv": 0.03726704930886626, "grad_min_sv": 0.0, "grad_condition": 37267049308.86626, "lr": 0.0004895287900583212, "time_sec": 177.32284903526306 }, { "epoch": 77, "train_loss": 5.360474863128662, "train_acc": 0.00958, "test_loss": 4.605349244689942, "test_acc": 0.01, "lyapunov": 1.5860518323795876, "grad_norm": 0.20492250658984978, "grad_max_sv": 0.010520621668547392, "grad_min_sv": 0.0, "grad_condition": 10520621668.54739, "lr": 0.0004790621731353997, "time_sec": 177.27856492996216 }, { "epoch": 78, "train_loss": 5.3626285870361325, "train_acc": 0.0096, "test_loss": 4.636105052185059, "test_acc": 0.01, "lyapunov": 1.5883512807928997, "grad_norm": 0.16200768770528595, "grad_max_sv": 0.01769152507185936, "grad_min_sv": 0.0, "grad_condition": 17691525071.85936, "lr": 0.000468604740235343, "time_sec": 177.26149678230286 }, { "epoch": 79, "train_loss": 5.361725220947266, "train_acc": 0.00962, "test_loss": 4.642175579071045, "test_acc": 0.01, "lyapunov": 1.5874589931629504, "grad_norm": 0.1671711869857159, "grad_max_sv": 0.027231273613870143, "grad_min_sv": 0.0, "grad_condition": 27231273613.870144, "lr": 0.00045816107833384175, "time_sec": 177.28059816360474 }, { "epoch": 80, "train_loss": 5.359847649841309, "train_acc": 0.00934, "test_loss": 4.646283575439453, "test_acc": 0.01, "lyapunov": 1.5854374237377624, "grad_norm": 0.15090527056955186, "grad_max_sv": 0.02150285104289651, "grad_min_sv": 0.0, "grad_condition": 21502851042.896507, "lr": 0.0004477357683661729, "time_sec": 177.27379083633423 }, { "epoch": 81, "train_loss": 5.3600718869018555, "train_acc": 0.01048, "test_loss": 4.752709213256836, "test_acc": 0.01, "lyapunov": 1.585394742238857, "grad_norm": 0.17187344605967436, "grad_max_sv": 0.043320519663393495, "grad_min_sv": 0.0, "grad_condition": 43320519663.39349, "lr": 0.00043733338321784746, "time_sec": 177.62933731079102 }, { "epoch": 82, "train_loss": 5.362194033813476, "train_acc": 0.00908, "test_loss": 4.769781411743164, "test_acc": 0.01, "lyapunov": 1.5872593858967656, "grad_norm": 0.17685474969644083, "grad_max_sv": 0.043185068760067225, "grad_min_sv": 0.0, "grad_condition": 43185068760.06722, "lr": 0.0004269584857187939, "time_sec": 177.36878728866577 }, { "epoch": 83, "train_loss": 5.360512623901367, "train_acc": 0.00896, "test_loss": 4.634495629882813, "test_acc": 0.01, "lyapunov": 1.585809985999866, "grad_norm": 0.17569851085947658, "grad_max_sv": 0.048822146560996774, "grad_min_sv": 0.0, "grad_condition": 48822146560.99677, "lr": 0.0004166156266419484, "time_sec": 177.35730743408203 }, { "epoch": 84, "train_loss": 5.360660369110107, "train_acc": 0.01062, "test_loss": 4.635055514526367, "test_acc": 0.01, "lyapunov": 1.5863755276745848, "grad_norm": 0.1734959766637803, "grad_max_sv": 0.03708101906813681, "grad_min_sv": 0.0, "grad_condition": 37081019068.13681, "lr": 0.0004063093427071373, "time_sec": 177.31386804580688 }, { "epoch": 85, "train_loss": 5.359581319885254, "train_acc": 0.00962, "test_loss": 4.680524919128418, "test_acc": 0.01, "lyapunov": 1.585432373349319, "grad_norm": 0.19633262712151112, "grad_max_sv": 0.016985992342233656, "grad_min_sv": 0.0, "grad_condition": 16985992342.233658, "lr": 0.0003960441545911199, "time_sec": 177.29162740707397 }, { "epoch": 86, "train_loss": 5.364330820922851, "train_acc": 0.00994, "test_loss": 4.640988105010987, "test_acc": 0.01, "lyapunov": 1.5893402819133475, "grad_norm": 0.17010660799200755, "grad_max_sv": 0.005552049493417144, "grad_min_sv": 0.0, "grad_condition": 5552049493.417144, "lr": 0.0003858245649446718, "time_sec": 177.2697069644928 }, { "epoch": 87, "train_loss": 5.36001446975708, "train_acc": 0.0091, "test_loss": 4.6622309997558595, "test_acc": 0.01, "lyapunov": 1.5858566068932223, "grad_norm": 0.18253684720194474, "grad_max_sv": 0.009605350159108638, "grad_min_sv": 0.0, "grad_condition": 9605350159.108639, "lr": 0.00037565505641757235, "time_sec": 177.2729914188385 }, { "epoch": 88, "train_loss": 5.363334915313721, "train_acc": 0.00928, "test_loss": 4.651910215759277, "test_acc": 0.01, "lyapunov": 1.5891908779168678, "grad_norm": 0.25285970261724394, "grad_max_sv": 0.014622378209605814, "grad_min_sv": 0.0, "grad_condition": 14622378209.605814, "lr": 0.00036554008969236695, "time_sec": 177.25673460960388 }, { "epoch": 89, "train_loss": 5.366140861053466, "train_acc": 0.0098, "test_loss": 4.632004132843018, "test_acc": 0.01, "lyapunov": 1.5918613025904311, "grad_norm": 0.3793803057886311, "grad_max_sv": 0.0227991352789104, "grad_min_sv": 0.0, "grad_condition": 22799135278.9104, "lr": 0.0003554841015277638, "time_sec": 177.28270602226257 }, { "epoch": 90, "train_loss": 5.358956403503418, "train_acc": 0.00908, "test_loss": 4.634336037445069, "test_acc": 0.01, "lyapunov": 1.5845078528689607, "grad_norm": 0.16129836844937653, "grad_max_sv": 0.030955695733428, "grad_min_sv": 0.0, "grad_condition": 30955695733.428, "lr": 0.000345491502812526, "time_sec": 177.34664869308472 }, { "epoch": 91, "train_loss": 5.370377727966309, "train_acc": 0.01008, "test_loss": 4.641486628723144, "test_acc": 0.01, "lyapunov": 1.5915974838959286, "grad_norm": 0.23056801493799003, "grad_max_sv": 0.021973734814673664, "grad_min_sv": 0.0, "grad_condition": 21973734814.673664, "lr": 0.0003355666766307081, "time_sec": 177.30071926116943 }, { "epoch": 92, "train_loss": 5.35953079574585, "train_acc": 0.0104, "test_loss": 4.654357167816162, "test_acc": 0.01, "lyapunov": 1.5854123461886744, "grad_norm": 0.2133357061554603, "grad_max_sv": 0.01584432367235422, "grad_min_sv": 0.0, "grad_condition": 15844323672.354221, "lr": 0.00032571397633909225, "time_sec": 177.30744338035583 }, { "epoch": 93, "train_loss": 5.359757648162842, "train_acc": 0.01004, "test_loss": 4.635669487762451, "test_acc": 0.01, "lyapunov": 1.5857275602457774, "grad_norm": 0.21123088900545153, "grad_max_sv": 0.022326651168987154, "grad_min_sv": 0.0, "grad_condition": 22326651168.98716, "lr": 0.00031593772365766094, "time_sec": 177.30698537826538 }, { "epoch": 94, "train_loss": 5.358649451293945, "train_acc": 0.00924, "test_loss": 4.650500559997559, "test_acc": 0.01, "lyapunov": 1.584580004367682, "grad_norm": 0.22156955822269123, "grad_max_sv": 0.0036812785547226667, "grad_min_sv": 0.0, "grad_condition": 3681278554.7226667, "lr": 0.0003062422067739483, "time_sec": 177.29391837120056 }, { "epoch": 95, "train_loss": 5.368402194519043, "train_acc": 0.0096, "test_loss": 4.631659384155274, "test_acc": 0.01, "lyapunov": 1.5918427952720076, "grad_norm": 0.19012319147558024, "grad_max_sv": 0.01328945653513074, "grad_min_sv": 0.0, "grad_condition": 13289456535.130741, "lr": 0.00029663167846209965, "time_sec": 177.28295135498047 }, { "epoch": 96, "train_loss": 5.360648808441162, "train_acc": 0.00988, "test_loss": 4.642071528625488, "test_acc": 0.01, "lyapunov": 1.586560007251437, "grad_norm": 0.16157307254883244, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 177.2989547252655 }, { "epoch": 97, "train_loss": 5.358733374786377, "train_acc": 0.00914, "test_loss": 4.639485282897949, "test_acc": 0.01, "lyapunov": 1.5846895253871713, "grad_norm": 0.14480973228900776, "grad_max_sv": 0.00837345547042787, "grad_min_sv": 0.0, "grad_condition": 8373455470.427872, "lr": 0.00027768241040753615, "time_sec": 177.27525234222412 }, { "epoch": 98, "train_loss": 5.360293337707519, "train_acc": 0.0099, "test_loss": 4.644459535980225, "test_acc": 0.01, "lyapunov": 1.5861705498927086, "grad_norm": 0.18867802153244584, "grad_max_sv": 0.026158737391233443, "grad_min_sv": 0.0, "grad_condition": 26158737391.23344, "lr": 0.00026835198244006903, "time_sec": 177.2919957637787 }, { "epoch": 99, "train_loss": 5.360852672576904, "train_acc": 0.00976, "test_loss": 4.641770568847656, "test_acc": 0.01, "lyapunov": 1.5866629604793265, "grad_norm": 0.2490166385107765, "grad_max_sv": 0.025310791656374933, "grad_min_sv": 0.0, "grad_condition": 25310791656.37493, "lr": 0.0002591231629491421, "time_sec": 177.28516483306885 }, { "epoch": 100, "train_loss": 5.359503317260742, "train_acc": 0.0096, "test_loss": 4.633657774353027, "test_acc": 0.01, "lyapunov": 1.5852865261190079, "grad_norm": 0.31764569596084014, "grad_max_sv": 0.03201284250244498, "grad_min_sv": 0.0, "grad_condition": 32012842502.444984, "lr": 0.0002499999999999997, "time_sec": 177.3286590576172 }, { "epoch": 101, "train_loss": 5.3610862644958495, "train_acc": 0.01004, "test_loss": 4.627243125915528, "test_acc": 0.01, "lyapunov": 1.586990461934863, "grad_norm": 0.3077979208978545, "grad_max_sv": 0.022488519130274654, "grad_min_sv": 0.0, "grad_condition": 22488519130.274654, "lr": 0.00024098649531343477, "time_sec": 177.27038407325745 }, { "epoch": 102, "train_loss": 5.359221751708985, "train_acc": 0.0099, "test_loss": 4.6350917106628415, "test_acc": 0.01, "lyapunov": 1.5852433824173324, "grad_norm": 0.17125449319078032, "grad_max_sv": 0.0006372035015374423, "grad_min_sv": 0.0, "grad_condition": 637203501.5374422, "lr": 0.0002320866025105016, "time_sec": 177.26434516906738 }, { "epoch": 103, "train_loss": 5.359845841064453, "train_acc": 0.00998, "test_loss": 4.644444650268555, "test_acc": 0.01, "lyapunov": 1.5859144453502372, "grad_norm": 0.15906823668777442, "grad_max_sv": 0.0012175182346254587, "grad_min_sv": 0.0, "grad_condition": 1217518234.6254587, "lr": 0.0002233042253783278, "time_sec": 177.29427409172058 }, { "epoch": 104, "train_loss": 5.359393982086182, "train_acc": 0.00964, "test_loss": 4.629140382385254, "test_acc": 0.01, "lyapunov": 1.5853588230469648, "grad_norm": 0.18868988717884208, "grad_max_sv": 0.007832410791888834, "grad_min_sv": 0.0, "grad_condition": 7832410791.888834, "lr": 0.000214643216157784, "time_sec": 177.3122420310974 }, { "epoch": 105, "train_loss": 5.376110725402832, "train_acc": 0.00958, "test_loss": 4.641193688201905, "test_acc": 0.01, "lyapunov": 1.594091626079491, "grad_norm": 0.21866401239429448, "grad_max_sv": 0.01763616520911455, "grad_min_sv": 0.0, "grad_condition": 17636165209.11455, "lr": 0.00020610737385376332, "time_sec": 177.33545303344727 }, { "epoch": 106, "train_loss": 5.360543824005127, "train_acc": 0.00952, "test_loss": 4.63230926361084, "test_acc": 0.01, "lyapunov": 1.586505341407893, "grad_norm": 0.19148423296709022, "grad_max_sv": 0.007322627399116754, "grad_min_sv": 0.0, "grad_condition": 7322627399.116755, "lr": 0.00019770044256881242, "time_sec": 177.29128861427307 }, { "epoch": 107, "train_loss": 5.359816354370118, "train_acc": 0.00964, "test_loss": 4.628876644897461, "test_acc": 0.01, "lyapunov": 1.5858964429182165, "grad_norm": 0.16953893016049196, "grad_max_sv": 0.005570205627009273, "grad_min_sv": 0.0, "grad_condition": 5570205627.009273, "lr": 0.0001894261098608447, "time_sec": 177.26312851905823 }, { "epoch": 108, "train_loss": 5.360526904602051, "train_acc": 0.009, "test_loss": 4.630769221496582, "test_acc": 0.01, "lyapunov": 1.5865018233618773, "grad_norm": 0.18006495124030458, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 177.246666431427 }, { "epoch": 109, "train_loss": 5.361382939453125, "train_acc": 0.0098, "test_loss": 4.626291159820557, "test_acc": 0.01, "lyapunov": 1.586926028856536, "grad_norm": 0.2328474503629796, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 177.25811576843262 }, { "epoch": 110, "train_loss": 5.358514823455811, "train_acc": 0.00986, "test_loss": 4.6495152236938475, "test_acc": 0.01, "lyapunov": 1.5844445182844196, "grad_norm": 0.31612028134160525, "grad_max_sv": 0.010267550591379404, "grad_min_sv": 0.0, "grad_condition": 10267550591.379404, "lr": 0.00016543469682057076, "time_sec": 177.28474497795105 }, { "epoch": 111, "train_loss": 5.366782173309327, "train_acc": 0.00906, "test_loss": 4.620611762237549, "test_acc": 0.01, "lyapunov": 1.5906709133816497, "grad_norm": 0.40151776348821855, "grad_max_sv": 0.010553297400474549, "grad_min_sv": 0.0, "grad_condition": 10553297400.474548, "lr": 0.00015772644703565552, "time_sec": 177.3135175704956 }, { "epoch": 112, "train_loss": 5.359567135009765, "train_acc": 0.00886, "test_loss": 4.628111135101318, "test_acc": 0.01, "lyapunov": 1.5856597996733683, "grad_norm": 0.3009012541884835, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 177.25540447235107 }, { "epoch": 113, "train_loss": 5.358919576873779, "train_acc": 0.00968, "test_loss": 4.627276501464844, "test_acc": 0.01, "lyapunov": 1.5849643582883088, "grad_norm": 0.3242366139837751, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 177.27025246620178 }, { "epoch": 114, "train_loss": 5.3586665776062015, "train_acc": 0.00944, "test_loss": 4.620662684631347, "test_acc": 0.01, "lyapunov": 1.5846976368018733, "grad_norm": 0.2903374978600601, "grad_max_sv": 0.004233767790719867, "grad_min_sv": 0.0, "grad_condition": 4233767790.7198668, "lr": 0.00013551568628929425, "time_sec": 177.26198053359985 }, { "epoch": 115, "train_loss": 5.3605953396606445, "train_acc": 0.00902, "test_loss": 4.621528549194336, "test_acc": 0.01, "lyapunov": 1.586485847792662, "grad_norm": 0.331820693233947, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 177.23981928825378 }, { "epoch": 116, "train_loss": 5.359012928771973, "train_acc": 0.00958, "test_loss": 4.619492964172363, "test_acc": 0.01, "lyapunov": 1.585117801376011, "grad_norm": 0.2797157160809922, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 177.225914478302 }, { "epoch": 117, "train_loss": 5.359644413146973, "train_acc": 0.00924, "test_loss": 4.621938159942627, "test_acc": 0.01, "lyapunov": 1.5857579552608987, "grad_norm": 0.2795622109437437, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 177.22438168525696 }, { "epoch": 118, "train_loss": 5.359761270446778, "train_acc": 0.00924, "test_loss": 4.6217840301513675, "test_acc": 0.01, "lyapunov": 1.5858274750087573, "grad_norm": 0.24852001797471837, "grad_max_sv": 0.0012709970586001873, "grad_min_sv": 0.0, "grad_condition": 1270997058.6001873, "lr": 0.00010815327133708009, "time_sec": 177.2276487350464 }, { "epoch": 119, "train_loss": 5.357662630462647, "train_acc": 0.0091, "test_loss": 4.622296886444092, "test_acc": 0.01, "lyapunov": 1.5836935113458073, "grad_norm": 0.24372977816065178, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 177.25115942955017 }, { "epoch": 120, "train_loss": 5.361358259277344, "train_acc": 0.00944, "test_loss": 4.622046688079834, "test_acc": 0.01, "lyapunov": 1.587042825301285, "grad_norm": 0.22330891574384296, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 177.27366518974304 }, { "epoch": 121, "train_loss": 5.35905032409668, "train_acc": 0.00908, "test_loss": 4.622121089935303, "test_acc": 0.01, "lyapunov": 1.5851479878510966, "grad_norm": 0.20960225247372524, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 177.23317313194275 }, { "epoch": 122, "train_loss": 5.361670205078125, "train_acc": 0.0093, "test_loss": 4.622285698699951, "test_acc": 0.01, "lyapunov": 1.5875935237425978, "grad_norm": 0.21843560272800885, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 177.2194859981537 }, { "epoch": 123, "train_loss": 5.360625909729004, "train_acc": 0.01, "test_loss": 4.6224393463134765, "test_acc": 0.01, "lyapunov": 1.5867376934232005, "grad_norm": 0.2137074208505857, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 177.2682557106018 }, { "epoch": 124, "train_loss": 5.358632594451905, "train_acc": 0.0093, "test_loss": 4.680952319335938, "test_acc": 0.01, "lyapunov": 1.5847194472237316, "grad_norm": 0.1870926810471898, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 177.23400807380676 }, { "epoch": 125, "train_loss": 5.360412776184082, "train_acc": 0.0089, "test_loss": 4.73941685333252, "test_acc": 0.01, "lyapunov": 1.5865021639162926, "grad_norm": 0.21273250180362335, "grad_max_sv": 0.0014166037552058696, "grad_min_sv": 0.0, "grad_condition": 1416603755.2058697, "lr": 6.698729810778072e-05, "time_sec": 177.24382710456848 }, { "epoch": 126, "train_loss": 5.358947314758301, "train_acc": 0.0097, "test_loss": 4.672125242614746, "test_acc": 0.01, "lyapunov": 1.584972734646419, "grad_norm": 0.23341550723215748, "grad_max_sv": 0.001309919636696577, "grad_min_sv": 0.0, "grad_condition": 1309919636.696577, "lr": 6.184665997806817e-05, "time_sec": 177.26921725273132 }, { "epoch": 127, "train_loss": 5.359260606536865, "train_acc": 0.00982, "test_loss": 4.664470828247071, "test_acc": 0.01, "lyapunov": 1.585314722012376, "grad_norm": 0.265210981123156, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 177.23559665679932 }, { "epoch": 128, "train_loss": 5.361228064270019, "train_acc": 0.0096, "test_loss": 4.79210078125, "test_acc": 0.01, "lyapunov": 1.5868884224416044, "grad_norm": 0.284706461729636, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 177.23232126235962 }, { "epoch": 129, "train_loss": 5.358762674407959, "train_acc": 0.00948, "test_loss": 4.767799957275391, "test_acc": 0.01, "lyapunov": 1.5848681917580802, "grad_norm": 0.27692568211643537, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 177.2341754436493 }, { "epoch": 130, "train_loss": 5.360010164489746, "train_acc": 0.00926, "test_loss": 4.671016343688965, "test_acc": 0.01, "lyapunov": 1.5858237874477417, "grad_norm": 0.2706962686573412, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 177.24218034744263 }, { "epoch": 131, "train_loss": 5.3587316012573245, "train_acc": 0.00928, "test_loss": 4.748648097229004, "test_acc": 0.01, "lyapunov": 1.5848381055895324, "grad_norm": 0.23937263927645328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 177.2330150604248 }, { "epoch": 132, "train_loss": 5.35890893157959, "train_acc": 0.00964, "test_loss": 4.8125279388427735, "test_acc": 0.01, "lyapunov": 1.5850241647656922, "grad_norm": 0.2489556767273508, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 177.22991752624512 }, { "epoch": 133, "train_loss": 5.361185835876465, "train_acc": 0.00952, "test_loss": 4.643449569702148, "test_acc": 0.01, "lyapunov": 1.5871033570955477, "grad_norm": 0.31193315187891146, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 177.2139208316803 }, { "epoch": 134, "train_loss": 5.358732033691406, "train_acc": 0.00876, "test_loss": 4.706984965515137, "test_acc": 0.01, "lyapunov": 1.5848448145420044, "grad_norm": 0.25839982964286506, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 177.22592782974243 }, { "epoch": 135, "train_loss": 5.359151672363281, "train_acc": 0.00906, "test_loss": 4.7044763816833495, "test_acc": 0.01, "lyapunov": 1.5852836605228122, "grad_norm": 0.2598696228178214, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 177.2558205127716 }, { "epoch": 136, "train_loss": 5.359703632965088, "train_acc": 0.01, "test_loss": 4.721178560638427, "test_acc": 0.01, "lyapunov": 1.5858281173974351, "grad_norm": 0.26109222250019687, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 177.24931955337524 }, { "epoch": 137, "train_loss": 5.359647062225342, "train_acc": 0.00956, "test_loss": 4.705288150024414, "test_acc": 0.01, "lyapunov": 1.585799050453069, "grad_norm": 0.2430419176031886, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 177.20098423957825 }, { "epoch": 138, "train_loss": 5.370798114471436, "train_acc": 0.01, "test_loss": 4.711322469329834, "test_acc": 0.01, "lyapunov": 1.592538814105646, "grad_norm": 0.23717985848250528, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 177.27925276756287 }, { "epoch": 139, "train_loss": 5.358164114685058, "train_acc": 0.0097, "test_loss": 4.713753561401367, "test_acc": 0.01, "lyapunov": 1.5842537294568309, "grad_norm": 0.21577381809039398, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 177.2640838623047 }, { "epoch": 140, "train_loss": 5.359127445678711, "train_acc": 0.00982, "test_loss": 4.702644599914551, "test_acc": 0.01, "lyapunov": 1.5852683206348468, "grad_norm": 0.22693874606806255, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 177.26845002174377 }, { "epoch": 141, "train_loss": 5.358451212463379, "train_acc": 0.01, "test_loss": 4.709589306640625, "test_acc": 0.01, "lyapunov": 1.5845830724062517, "grad_norm": 0.21686215956311627, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 177.26886224746704 }, { "epoch": 142, "train_loss": 5.359413949279785, "train_acc": 0.01, "test_loss": 4.713582644653321, "test_acc": 0.01, "lyapunov": 1.5855683030374825, "grad_norm": 0.2386062253915984, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 177.24717164039612 }, { "epoch": 143, "train_loss": 5.380280564575195, "train_acc": 0.01, "test_loss": 4.7039310775756835, "test_acc": 0.01, "lyapunov": 1.59827317331758, "grad_norm": 0.281062533044562, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 177.23896765708923 }, { "epoch": 144, "train_loss": 5.359466158905029, "train_acc": 0.01, "test_loss": 4.690676583862305, "test_acc": 0.01, "lyapunov": 1.5856200407837968, "grad_norm": 0.18794718433603225, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 177.22590732574463 }, { "epoch": 145, "train_loss": 5.358838105926513, "train_acc": 0.01, "test_loss": 4.686097943115234, "test_acc": 0.01, "lyapunov": 1.5849668324146124, "grad_norm": 0.18762604455384463, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 177.2236692905426 }, { "epoch": 146, "train_loss": 5.358961830444336, "train_acc": 0.01, "test_loss": 4.6859198120117185, "test_acc": 0.01, "lyapunov": 1.5850938287232539, "grad_norm": 0.20367093372209882, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 177.23711729049683 }, { "epoch": 147, "train_loss": 5.359495299530029, "train_acc": 0.01, "test_loss": 4.686381504821777, "test_acc": 0.01, "lyapunov": 1.585582929194126, "grad_norm": 0.1846519425292254, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 177.23132824897766 }, { "epoch": 148, "train_loss": 5.358631723632812, "train_acc": 0.01, "test_loss": 4.686381640625, "test_acc": 0.01, "lyapunov": 1.5847509065857324, "grad_norm": 0.21479574972052035, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 177.25513577461243 }, { "epoch": 149, "train_loss": 5.359418527679443, "train_acc": 0.01, "test_loss": 4.6863815933227535, "test_acc": 0.01, "lyapunov": 1.585573171105836, "grad_norm": 0.18053721718052793, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 177.26594400405884 }, { "epoch": 150, "train_loss": 5.358559367828369, "train_acc": 0.01, "test_loss": 4.686381562042237, "test_acc": 0.01, "lyapunov": 1.584673622075249, "grad_norm": 0.17806465386525372, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 177.21632599830627 } ] } }