{ "vanilla": { "4": [ { "epoch": 1, "train_loss": 4.346117241363525, "train_acc": 0.09834, "test_loss": 3.550243005371094, "test_acc": 0.1705, "lyapunov": null, "grad_norm": 6.371099905681965, "grad_max_sv": 5.004546135663986, "grad_min_sv": 1.1479638856171093e-07, "grad_condition": 101906528.03771546, "lr": 0.0009998903417374227, "time_sec": 16.05687952041626 }, { "epoch": 2, "train_loss": 3.5102988652038576, "train_acc": 0.18534, "test_loss": 3.5716390384674073, "test_acc": 0.2002, "lyapunov": null, "grad_norm": 4.572810771811442, "grad_max_sv": 3.3247465908527376, "grad_min_sv": 8.398422393085526e-08, "grad_condition": 76227232.13894418, "lr": 0.0009995614150494292, "time_sec": 15.448272466659546 }, { "epoch": 3, "train_loss": 3.054396768722534, "train_acc": 0.25274, "test_loss": 2.993664514160156, "test_acc": 0.2763, "lyapunov": null, "grad_norm": 3.5860981037463016, "grad_max_sv": 2.402756503224373, "grad_min_sv": 6.775348947440918e-08, "grad_condition": 42769838.6817436, "lr": 0.0009990133642141358, "time_sec": 15.465861558914185 }, { "epoch": 4, "train_loss": 2.722675824432373, "train_acc": 0.3136, "test_loss": 2.728995104598999, "test_acc": 0.3281, "lyapunov": null, "grad_norm": 2.9852975671602957, "grad_max_sv": 1.8682193964719773, "grad_min_sv": 5.5938930086305014e-08, "grad_condition": 328348281.0445617, "lr": 0.0009982464296247522, "time_sec": 15.43475079536438 }, { "epoch": 5, "train_loss": 2.508175393676758, "train_acc": 0.3569, "test_loss": 3.419650896835327, "test_acc": 0.2461, "lyapunov": null, "grad_norm": 2.6358092556880783, "grad_max_sv": 1.6064732760190963, "grad_min_sv": 4.9754905795396096e-08, "grad_condition": 44385388.81342572, "lr": 0.0009972609476841367, "time_sec": 15.444115400314331 }, { "epoch": 6, "train_loss": 2.3319723847961424, "train_acc": 0.39276, "test_loss": 2.5260577701568603, "test_acc": 0.373, "lyapunov": null, "grad_norm": 2.4120452283895926, "grad_max_sv": 1.3716692090034486, "grad_min_sv": 4.6226219474476696e-08, "grad_condition": 36175494.06179842, "lr": 0.000996057350657239, "time_sec": 15.43784475326538 }, { "epoch": 7, "train_loss": 2.190326895675659, "train_acc": 0.42378, "test_loss": 2.579724459838867, "test_acc": 0.3695, "lyapunov": null, "grad_norm": 2.2437900964501787, "grad_max_sv": 1.2385427325963974, "grad_min_sv": 4.28970178392718e-08, "grad_condition": 190661418.56414273, "lr": 0.000994636166481494, "time_sec": 15.455140829086304 }, { "epoch": 8, "train_loss": 2.070303360748291, "train_acc": 0.44962, "test_loss": 2.7414955226898194, "test_acc": 0.3392, "lyapunov": null, "grad_norm": 2.0940271772848607, "grad_max_sv": 1.1511073380708694, "grad_min_sv": 4.056795894439441e-08, "grad_condition": 707337590.06387, "lr": 0.0009929980185352525, "time_sec": 15.463218450546265 }, { "epoch": 9, "train_loss": 1.9642453713607788, "train_acc": 0.47356, "test_loss": 2.222684016609192, "test_acc": 0.4312, "lyapunov": null, "grad_norm": 1.964494515952547, "grad_max_sv": 1.0273158520460128, "grad_min_sv": 3.78966669392633e-08, "grad_condition": 428475326.2676049, "lr": 0.0009911436253643444, "time_sec": 15.443583011627197 }, { "epoch": 10, "train_loss": 1.8679190033721924, "train_acc": 0.49384, "test_loss": 2.2569959682464598, "test_acc": 0.4227, "lyapunov": null, "grad_norm": 1.863426925292341, "grad_max_sv": 0.9406855523586273, "grad_min_sv": 3.563859525823609e-08, "grad_condition": 44606817.73724544, "lr": 0.0009890738003669028, "time_sec": 15.442885637283325 }, { "epoch": 11, "train_loss": 1.7814382321929931, "train_acc": 0.51302, "test_loss": 2.504388472366333, "test_acc": 0.3946, "lyapunov": null, "grad_norm": 1.7723102238636992, "grad_max_sv": 0.8945659548044205, "grad_min_sv": 3.425328631706526e-08, "grad_condition": 109308981.21335419, "lr": 0.00098678945143658, "time_sec": 15.459418535232544 }, { "epoch": 12, "train_loss": 1.7159840296936035, "train_acc": 0.53146, "test_loss": 2.508260029220581, "test_acc": 0.3935, "lyapunov": null, "grad_norm": 1.686140929704303, "grad_max_sv": 0.8295574262738228, "grad_min_sv": 3.2012488864613386e-08, "grad_condition": 89179142.85485055, "lr": 0.0009842915805643154, "time_sec": 15.439209461212158 }, { "epoch": 13, "train_loss": 1.6503846585845947, "train_acc": 0.54474, "test_loss": 2.1456974792480468, "test_acc": 0.4502, "lyapunov": null, "grad_norm": 1.619802250264676, "grad_max_sv": 0.7797225803136826, "grad_min_sv": 3.0749212220730626e-08, "grad_condition": 285444721.0869424, "lr": 0.000981581283398829, "time_sec": 15.433976173400879 }, { "epoch": 14, "train_loss": 1.5905582858276368, "train_acc": 0.5585, "test_loss": 2.3602350467681883, "test_acc": 0.4172, "lyapunov": null, "grad_norm": 1.5586059487347217, "grad_max_sv": 0.7570723682641983, "grad_min_sv": 2.990113052159238e-08, "grad_condition": 33337603.41083364, "lr": 0.0009786597487660333, "time_sec": 15.430689811706543 }, { "epoch": 15, "train_loss": 1.5257548734283448, "train_acc": 0.57394, "test_loss": 2.2596036737442016, "test_acc": 0.4401, "lyapunov": null, "grad_norm": 1.494958992831554, "grad_max_sv": 0.7011767938733101, "grad_min_sv": 2.8093294829334425e-08, "grad_condition": 215948380.66679326, "lr": 0.0009755282581475766, "time_sec": 15.445661544799805 }, { "epoch": 16, "train_loss": 1.4769169562911988, "train_acc": 0.58454, "test_loss": 2.1792555765151977, "test_acc": 0.4464, "lyapunov": null, "grad_norm": 1.4433947117799557, "grad_max_sv": 0.6677212715148926, "grad_min_sv": 2.683760501054344e-08, "grad_condition": 45818352.96134277, "lr": 0.0009721881851187403, "time_sec": 15.456706523895264 }, { "epoch": 17, "train_loss": 1.429377403755188, "train_acc": 0.5973, "test_loss": 1.954601181793213, "test_acc": 0.4919, "lyapunov": null, "grad_norm": 1.402899746172417, "grad_max_sv": 0.6569379523396492, "grad_min_sv": 2.6772942612884876e-08, "grad_condition": 33425629.606939513, "lr": 0.0009686409947459456, "time_sec": 15.437876462936401 }, { "epoch": 18, "train_loss": 1.3954533521652221, "train_acc": 0.60348, "test_loss": 2.0381541999816895, "test_acc": 0.4877, "lyapunov": null, "grad_norm": 1.3646767773598742, "grad_max_sv": 0.6277542792260646, "grad_min_sv": 2.5360278501545055e-08, "grad_condition": 1276893214.2885015, "lr": 0.0009648882429441254, "time_sec": 15.442293643951416 }, { "epoch": 19, "train_loss": 1.34601386013031, "train_acc": 0.61788, "test_loss": 2.016515805435181, "test_acc": 0.4879, "lyapunov": null, "grad_norm": 1.3307426948998278, "grad_max_sv": 0.6192222326993942, "grad_min_sv": 2.5143750027184496e-08, "grad_condition": 86894504.02450311, "lr": 0.00096093157579425, "time_sec": 15.452877044677734 }, { "epoch": 20, "train_loss": 1.3103528637313844, "train_acc": 0.6263, "test_loss": 1.9570331373214722, "test_acc": 0.5034, "lyapunov": null, "grad_norm": 1.3019068672950393, "grad_max_sv": 0.5866124749183654, "grad_min_sv": 2.432551227254942e-08, "grad_condition": 79675782.79073408, "lr": 0.0009567727288213001, "time_sec": 15.442177057266235 }, { "epoch": 21, "train_loss": 1.2698568128204346, "train_acc": 0.6344, "test_loss": 2.4308045747756957, "test_acc": 0.4364, "lyapunov": null, "grad_norm": 1.268768380545349, "grad_max_sv": 0.5797948583960533, "grad_min_sv": 2.4104086050920348e-08, "grad_condition": 252776511.74393004, "lr": 0.0009524135262330095, "time_sec": 15.434435844421387 }, { "epoch": 22, "train_loss": 1.2418579862976074, "train_acc": 0.64312, "test_loss": 2.0848071727752684, "test_acc": 0.4867, "lyapunov": null, "grad_norm": 1.2415784803203374, "grad_max_sv": 0.5592644922435284, "grad_min_sv": 2.333180208254765e-08, "grad_condition": 407593245.7962709, "lr": 0.0009478558801197061, "time_sec": 15.460945129394531 }, { "epoch": 23, "train_loss": 1.2006691330718995, "train_acc": 0.65526, "test_loss": 2.041600823402405, "test_acc": 0.4981, "lyapunov": null, "grad_norm": 1.2102718857806654, "grad_max_sv": 0.5479752145707607, "grad_min_sv": 2.2646243507534748e-08, "grad_condition": 185681115.951604, "lr": 0.000943101789615607, "time_sec": 15.44005274772644 }, { "epoch": 24, "train_loss": 1.172968614616394, "train_acc": 0.66154, "test_loss": 1.9552119861602784, "test_acc": 0.513, "lyapunov": null, "grad_norm": 1.1987019399549284, "grad_max_sv": 0.5312893047928811, "grad_min_sv": 2.1980094488081857e-08, "grad_condition": 1318897337.4819613, "lr": 0.0009381533400219313, "time_sec": 15.440562009811401 }, { "epoch": 25, "train_loss": 1.1449218238067627, "train_acc": 0.6641, "test_loss": 2.128752773284912, "test_acc": 0.4906, "lyapunov": null, "grad_norm": 1.1778317272519585, "grad_max_sv": 0.5174455069005489, "grad_min_sv": 2.167262270237613e-08, "grad_condition": 94067067.14088301, "lr": 0.0009330127018922189, "time_sec": 15.443851232528687 }, { "epoch": 26, "train_loss": 1.1113452094268799, "train_acc": 0.67438, "test_loss": 1.8866374584197998, "test_acc": 0.5238, "lyapunov": null, "grad_norm": 1.1514970963524438, "grad_max_sv": 0.5059572130441665, "grad_min_sv": 2.105146406777836e-08, "grad_condition": 50748348.81685668, "lr": 0.000927682130080253, "time_sec": 15.436878681182861 }, { "epoch": 27, "train_loss": 1.0829708759689332, "train_acc": 0.68438, "test_loss": 1.9943335615158082, "test_acc": 0.5124, "lyapunov": null, "grad_norm": 1.1319771840855883, "grad_max_sv": 0.4948433578014374, "grad_min_sv": 2.0725160652934616e-08, "grad_condition": 77507476.80554287, "lr": 0.0009221639627510072, "time_sec": 15.441301822662354 }, { "epoch": 28, "train_loss": 1.0513020403671265, "train_acc": 0.6904, "test_loss": 1.9359693916320801, "test_acc": 0.5214, "lyapunov": null, "grad_norm": 1.1163749465170618, "grad_max_sv": 0.48814368024468424, "grad_min_sv": 2.0212865362197185e-08, "grad_condition": 298941066.3217323, "lr": 0.0009164606203550494, "time_sec": 15.441382646560669 }, { "epoch": 29, "train_loss": 1.029607636756897, "train_acc": 0.69482, "test_loss": 1.8560630758285523, "test_acc": 0.5431, "lyapunov": null, "grad_norm": 1.0928580221633342, "grad_max_sv": 0.5047290526330471, "grad_min_sv": 2.040681175013992e-08, "grad_condition": 48855533.517919585, "lr": 0.0009105746045668516, "time_sec": 15.460914373397827 }, { "epoch": 30, "train_loss": 1.0061684103393556, "train_acc": 0.70324, "test_loss": 1.8417754476547241, "test_acc": 0.5501, "lyapunov": null, "grad_norm": 1.0821004976322715, "grad_max_sv": 0.4740450643002987, "grad_min_sv": 1.9723761995882327e-08, "grad_condition": 57054017.19113614, "lr": 0.0009045084971874733, "time_sec": 15.458839178085327 }, { "epoch": 31, "train_loss": 0.9935745064163208, "train_acc": 0.70312, "test_loss": 1.9427630338668824, "test_acc": 0.522, "lyapunov": null, "grad_norm": 1.0722093249603526, "grad_max_sv": 0.46733852848410606, "grad_min_sv": 1.9939205435706707e-08, "grad_condition": 112229781.98396464, "lr": 0.0008982649590120977, "time_sec": 15.452664375305176 }, { "epoch": 32, "train_loss": 0.9721898876953124, "train_acc": 0.70988, "test_loss": 1.9291723361968993, "test_acc": 0.5365, "lyapunov": null, "grad_norm": 1.0493640798096933, "grad_max_sv": 0.451675596088171, "grad_min_sv": 1.9157993355872065e-08, "grad_condition": 369697835.9253775, "lr": 0.0008918467286629196, "time_sec": 15.447975158691406 }, { "epoch": 33, "train_loss": 0.9359502591705322, "train_acc": 0.71948, "test_loss": 1.8434128448486329, "test_acc": 0.544, "lyapunov": null, "grad_norm": 1.0350388755850537, "grad_max_sv": 0.4494323328137398, "grad_min_sv": 1.8973058482987804e-08, "grad_condition": 171928795.69725567, "lr": 0.0008852566213878943, "time_sec": 15.466245889663696 }, { "epoch": 34, "train_loss": 0.9224456702995301, "train_acc": 0.72168, "test_loss": 1.9599631881713868, "test_acc": 0.5373, "lyapunov": null, "grad_norm": 1.0242311025233581, "grad_max_sv": 0.44513428434729574, "grad_min_sv": 1.8523945613654545e-08, "grad_condition": 888195654.0727282, "lr": 0.000878497527825878, "time_sec": 15.461785316467285 }, { "epoch": 35, "train_loss": 0.9021567019844056, "train_acc": 0.72618, "test_loss": 1.9999154584884644, "test_acc": 0.5252, "lyapunov": null, "grad_norm": 1.0039865896001459, "grad_max_sv": 0.43928237855434416, "grad_min_sv": 1.8592035315456722e-08, "grad_condition": 59743908.57133106, "lr": 0.000871572412738697, "time_sec": 15.456985473632812 }, { "epoch": 36, "train_loss": 0.873283097190857, "train_acc": 0.73628, "test_loss": 1.982330265045166, "test_acc": 0.5279, "lyapunov": null, "grad_norm": 0.9875825554026111, "grad_max_sv": 0.42813498005270956, "grad_min_sv": 1.7983777930719037e-08, "grad_condition": 38527409.79900636, "lr": 0.0008644843137107055, "time_sec": 15.460105419158936 }, { "epoch": 37, "train_loss": 0.855709279346466, "train_acc": 0.74242, "test_loss": 1.9136155584335328, "test_acc": 0.5472, "lyapunov": null, "grad_norm": 0.9742310219337682, "grad_max_sv": 0.4270216949284077, "grad_min_sv": 1.8125810764824114e-08, "grad_condition": 40840950.73216411, "lr": 0.0008572363398164014, "time_sec": 15.459755897521973 }, { "epoch": 38, "train_loss": 0.8404359550476074, "train_acc": 0.74404, "test_loss": 1.9389733367919921, "test_acc": 0.543, "lyapunov": null, "grad_norm": 0.9722202503028375, "grad_max_sv": 0.42485796511173246, "grad_min_sv": 1.783134123689578e-08, "grad_condition": 35194167.51271446, "lr": 0.0008498316702566826, "time_sec": 15.465211629867554 }, { "epoch": 39, "train_loss": 0.8240101078987122, "train_acc": 0.7481, "test_loss": 1.8307217979431152, "test_acc": 0.5614, "lyapunov": null, "grad_norm": 0.9595502877351665, "grad_max_sv": 0.42209447696805, "grad_min_sv": 1.767885368514355e-08, "grad_condition": 49656386.85866156, "lr": 0.0008422735529643442, "time_sec": 15.455949544906616 }, { "epoch": 40, "train_loss": 0.8046207006645203, "train_acc": 0.75466, "test_loss": 1.850761813545227, "test_acc": 0.5635, "lyapunov": null, "grad_norm": 0.9479757240987767, "grad_max_sv": 0.4134661167860031, "grad_min_sv": 1.7007238412025672e-08, "grad_condition": 126702887.42727256, "lr": 0.0008345653031794289, "time_sec": 15.462433099746704 }, { "epoch": 41, "train_loss": 0.7895244974899291, "train_acc": 0.7586, "test_loss": 1.8032215663909912, "test_acc": 0.5672, "lyapunov": null, "grad_norm": 0.9378242670136524, "grad_max_sv": 0.3964280657470226, "grad_min_sv": 1.6944396442897246e-08, "grad_condition": 56052359.18882908, "lr": 0.0008267103019950526, "time_sec": 15.461899757385254 }, { "epoch": 42, "train_loss": 0.7817759350585938, "train_acc": 0.76056, "test_loss": 1.8505826110839845, "test_acc": 0.5582, "lyapunov": null, "grad_norm": 0.9337187835649021, "grad_max_sv": 0.40529350489377974, "grad_min_sv": 1.6676117367206422e-08, "grad_condition": 104849301.5445062, "lr": 0.0008187119948743447, "time_sec": 15.4581778049469 }, { "epoch": 43, "train_loss": 0.7522177431297302, "train_acc": 0.77, "test_loss": 1.8242130517959594, "test_acc": 0.5664, "lyapunov": null, "grad_norm": 0.9099555522847652, "grad_max_sv": 0.3934644728899002, "grad_min_sv": 1.6434511908997028e-08, "grad_condition": 61342068.969211556, "lr": 0.000810573890139155, "time_sec": 15.447810411453247 }, { "epoch": 44, "train_loss": 0.7323650365447998, "train_acc": 0.77464, "test_loss": 1.8068662160873412, "test_acc": 0.5687, "lyapunov": null, "grad_norm": 0.9037556138602378, "grad_max_sv": 0.38610322400927544, "grad_min_sv": 1.6304181772903992e-08, "grad_condition": 167736758.90882486, "lr": 0.0008022995574311873, "time_sec": 15.458601951599121 }, { "epoch": 45, "train_loss": 0.7159886347198486, "train_acc": 0.77928, "test_loss": 1.8823264539718627, "test_acc": 0.5645, "lyapunov": null, "grad_norm": 0.8924866037240323, "grad_max_sv": 0.3947519548237324, "grad_min_sv": 1.6336485028634052e-08, "grad_condition": 69167052.26120928, "lr": 0.0007938926261462363, "time_sec": 15.471583843231201 }, { "epoch": 46, "train_loss": 0.7136952446365357, "train_acc": 0.78054, "test_loss": 1.7574677402496337, "test_acc": 0.5825, "lyapunov": null, "grad_norm": 0.8931942393361509, "grad_max_sv": 0.37973910570144653, "grad_min_sv": 1.6153765381235476e-08, "grad_condition": 489329276.9292526, "lr": 0.0007853567838422158, "time_sec": 15.471785068511963 }, { "epoch": 47, "train_loss": 0.6837898429489135, "train_acc": 0.78762, "test_loss": 1.813544430541992, "test_acc": 0.5725, "lyapunov": null, "grad_norm": 0.8815821036419627, "grad_max_sv": 0.3751175247132778, "grad_min_sv": 1.5766544728818e-08, "grad_condition": 56980767.9665909, "lr": 0.0007766957746216719, "time_sec": 15.457926750183105 }, { "epoch": 48, "train_loss": 0.6856673602676392, "train_acc": 0.78888, "test_loss": 1.990400904083252, "test_acc": 0.5508, "lyapunov": null, "grad_norm": 0.8744462547536074, "grad_max_sv": 0.3799706071615219, "grad_min_sv": 1.6096928557272904e-08, "grad_condition": 303945380.88277286, "lr": 0.0007679133974894982, "time_sec": 15.456810712814331 }, { "epoch": 49, "train_loss": 0.667086083278656, "train_acc": 0.792, "test_loss": 1.8513258657455445, "test_acc": 0.5727, "lyapunov": null, "grad_norm": 0.8677773875250141, "grad_max_sv": 0.3783408857882023, "grad_min_sv": 1.5666924351245835e-08, "grad_condition": 353923080.3313891, "lr": 0.000759013504686565, "time_sec": 15.462752342224121 }, { "epoch": 50, "train_loss": 0.6466483051490783, "train_acc": 0.79742, "test_loss": 2.043276873779297, "test_acc": 0.5419, "lyapunov": null, "grad_norm": 0.8555816651124006, "grad_max_sv": 0.3675771526992321, "grad_min_sv": 1.5045219146090152e-08, "grad_condition": 536508015.45004594, "lr": 0.0007499999999999998, "time_sec": 15.458629846572876 }, { "epoch": 51, "train_loss": 0.6258693974494934, "train_acc": 0.80236, "test_loss": 1.954080751991272, "test_acc": 0.5622, "lyapunov": null, "grad_norm": 0.8469179426728266, "grad_max_sv": 0.377849230915308, "grad_min_sv": 1.5333696528480045e-08, "grad_condition": 117912957.37628272, "lr": 0.0007408768370508575, "time_sec": 15.46766972541809 }, { "epoch": 52, "train_loss": 0.6236670018768311, "train_acc": 0.80516, "test_loss": 1.8472453788757324, "test_acc": 0.5858, "lyapunov": null, "grad_norm": 0.8404179479578597, "grad_max_sv": 0.3541756056249142, "grad_min_sv": 1.5022051764665422e-08, "grad_condition": 129884434.5908782, "lr": 0.0007316480175599307, "time_sec": 15.461432695388794 }, { "epoch": 53, "train_loss": 0.6075375831794739, "train_acc": 0.80952, "test_loss": 1.9628248615264892, "test_acc": 0.5673, "lyapunov": null, "grad_norm": 0.8367502172326149, "grad_max_sv": 0.3639704927802086, "grad_min_sv": 1.532564684603166e-08, "grad_condition": 35699441.49240203, "lr": 0.0007223175895924635, "time_sec": 15.46337342262268 }, { "epoch": 54, "train_loss": 0.5996641965866089, "train_acc": 0.81216, "test_loss": 1.8179010778427125, "test_acc": 0.5843, "lyapunov": null, "grad_norm": 0.8307418709294171, "grad_max_sv": 0.3613003775477409, "grad_min_sv": 1.4895932505510321e-08, "grad_condition": 875528249.2472179, "lr": 0.0007128896457825361, "time_sec": 15.465355396270752 }, { "epoch": 55, "train_loss": 0.5882498831176758, "train_acc": 0.81494, "test_loss": 1.8813747344970704, "test_acc": 0.582, "lyapunov": null, "grad_norm": 0.8235931888813899, "grad_max_sv": 0.3551651187241077, "grad_min_sv": 1.469800572865415e-08, "grad_condition": 484027587.3941019, "lr": 0.0007033683215378998, "time_sec": 15.460170984268188 }, { "epoch": 56, "train_loss": 0.5707145217132569, "train_acc": 0.82072, "test_loss": 1.840101174545288, "test_acc": 0.5813, "lyapunov": null, "grad_norm": 0.8086603393569909, "grad_max_sv": 0.34960880503058434, "grad_min_sv": 1.4356627959719037e-08, "grad_condition": 198153063.82803452, "lr": 0.0006937577932260512, "time_sec": 15.455865383148193 }, { "epoch": 57, "train_loss": 0.5646172902584076, "train_acc": 0.82002, "test_loss": 1.8341705081939697, "test_acc": 0.5873, "lyapunov": null, "grad_norm": 0.810642435475112, "grad_max_sv": 0.3562955237925053, "grad_min_sv": 1.4607543052502087e-08, "grad_condition": 226679350.92895135, "lr": 0.0006840622763423388, "time_sec": 15.474364757537842 }, { "epoch": 58, "train_loss": 0.5469015620231629, "train_acc": 0.82858, "test_loss": 1.9427689083099364, "test_acc": 0.5739, "lyapunov": null, "grad_norm": 0.7944800992028263, "grad_max_sv": 0.33950445652008054, "grad_min_sv": 1.368517551399162e-08, "grad_condition": 347795127.79131866, "lr": 0.0006742860236609073, "time_sec": 15.464811563491821 }, { "epoch": 59, "train_loss": 0.5445322315883636, "train_acc": 0.82716, "test_loss": 1.8801843715667725, "test_acc": 0.5792, "lyapunov": null, "grad_norm": 0.7916664309528131, "grad_max_sv": 0.3434500187635422, "grad_min_sv": 1.4393026628520266e-08, "grad_condition": 315625887.3364844, "lr": 0.0006644333233692913, "time_sec": 15.463439702987671 }, { "epoch": 60, "train_loss": 0.5323922993850708, "train_acc": 0.8299, "test_loss": 1.9002599145889283, "test_acc": 0.5809, "lyapunov": null, "grad_norm": 0.7870533377985126, "grad_max_sv": 0.34093547612428665, "grad_min_sv": 1.4214920851518542e-08, "grad_condition": 91722689.16411342, "lr": 0.0006545084971874734, "time_sec": 15.450496912002563 }, { "epoch": 61, "train_loss": 0.519907633266449, "train_acc": 0.83526, "test_loss": 1.9299441148757934, "test_acc": 0.5794, "lyapunov": null, "grad_norm": 0.7766553414478388, "grad_max_sv": 0.3247631438076496, "grad_min_sv": 1.3660971805162792e-08, "grad_condition": 158255223.31341702, "lr": 0.0006445158984722354, "time_sec": 15.486064910888672 }, { "epoch": 62, "train_loss": 0.5158719365882873, "train_acc": 0.83688, "test_loss": 1.8924803583145142, "test_acc": 0.5838, "lyapunov": null, "grad_norm": 0.7769879212152438, "grad_max_sv": 0.34014692306518557, "grad_min_sv": 1.4163850685366964e-08, "grad_condition": 69424987.38028774, "lr": 0.0006344599103076324, "time_sec": 15.469778776168823 }, { "epoch": 63, "train_loss": 0.5016013371658326, "train_acc": 0.83886, "test_loss": 1.9557724254608155, "test_acc": 0.578, "lyapunov": null, "grad_norm": 0.7667097633814496, "grad_max_sv": 0.3396275587379932, "grad_min_sv": 1.3258012922148093e-08, "grad_condition": 246523332.7028369, "lr": 0.0006243449435824269, "time_sec": 15.490433692932129 }, { "epoch": 64, "train_loss": 0.4887677048301697, "train_acc": 0.84204, "test_loss": 1.919124504852295, "test_acc": 0.5841, "lyapunov": null, "grad_norm": 0.7573654062297513, "grad_max_sv": 0.32946483269333837, "grad_min_sv": 1.3579194014026741e-08, "grad_condition": 122613286.93525049, "lr": 0.0006141754350553275, "time_sec": 15.473332166671753 }, { "epoch": 65, "train_loss": 0.4757623895263672, "train_acc": 0.84768, "test_loss": 1.9984818859100342, "test_acc": 0.5761, "lyapunov": null, "grad_norm": 0.748014318960053, "grad_max_sv": 0.33319817706942556, "grad_min_sv": 1.3326467683972414e-08, "grad_condition": 623990635.8236978, "lr": 0.0006039558454088793, "time_sec": 15.485574960708618 }, { "epoch": 66, "train_loss": 0.4649162304496765, "train_acc": 0.85152, "test_loss": 1.9724672309875488, "test_acc": 0.576, "lyapunov": null, "grad_norm": 0.7417116384839675, "grad_max_sv": 0.3309340290725231, "grad_min_sv": 1.334454621318426e-08, "grad_condition": 142248731.7186973, "lr": 0.000593690657292862, "time_sec": 15.480328559875488 }, { "epoch": 67, "train_loss": 0.4583131973075867, "train_acc": 0.85314, "test_loss": 1.911379218673706, "test_acc": 0.5815, "lyapunov": null, "grad_norm": 0.737726746568229, "grad_max_sv": 0.32083366960287096, "grad_min_sv": 1.2965913287477093e-08, "grad_condition": 78597953.03928533, "lr": 0.0005833843733580507, "time_sec": 15.469099283218384 }, { "epoch": 68, "train_loss": 0.44331007887840274, "train_acc": 0.85794, "test_loss": 1.9728064548492432, "test_acc": 0.5854, "lyapunov": null, "grad_norm": 0.7274207800935486, "grad_max_sv": 0.3188414238393307, "grad_min_sv": 1.2804001882360528e-08, "grad_condition": 55555678.95357393, "lr": 0.0005730415142812054, "time_sec": 15.481547117233276 }, { "epoch": 69, "train_loss": 0.43979987537384035, "train_acc": 0.85974, "test_loss": 1.919715219116211, "test_acc": 0.5884, "lyapunov": null, "grad_norm": 0.7242391218539499, "grad_max_sv": 0.3140024244785309, "grad_min_sv": 1.275962300552845e-08, "grad_condition": 326554514.7187793, "lr": 0.0005626666167821517, "time_sec": 15.48648977279663 }, { "epoch": 70, "train_loss": 0.4322844411468506, "train_acc": 0.86176, "test_loss": 2.0117150314331056, "test_acc": 0.5834, "lyapunov": null, "grad_norm": 0.7186156540948507, "grad_max_sv": 0.31351484879851343, "grad_min_sv": 1.2888502469096674e-08, "grad_condition": 178788272.1664782, "lr": 0.0005522642316338265, "time_sec": 15.48006272315979 }, { "epoch": 71, "train_loss": 0.42623882338523866, "train_acc": 0.86272, "test_loss": 1.9539510818481445, "test_acc": 0.5875, "lyapunov": null, "grad_norm": 0.7137008149677833, "grad_max_sv": 0.31342701613903046, "grad_min_sv": 1.2595162532727522e-08, "grad_condition": 302205097.8444015, "lr": 0.0005418389216661573, "time_sec": 15.492274284362793 }, { "epoch": 72, "train_loss": 0.41300243412017823, "train_acc": 0.86584, "test_loss": 1.9104324056625366, "test_acc": 0.5874, "lyapunov": null, "grad_norm": 0.7058331032866322, "grad_max_sv": 0.3122198607772589, "grad_min_sv": 1.2484183565045215e-08, "grad_condition": 249411647.9543108, "lr": 0.0005313952597646563, "time_sec": 15.472809076309204 }, { "epoch": 73, "train_loss": 0.4090885982322693, "train_acc": 0.86766, "test_loss": 1.9304109241485596, "test_acc": 0.5896, "lyapunov": null, "grad_norm": 0.7030000923329225, "grad_max_sv": 0.3075466021895409, "grad_min_sv": 1.252222159744791e-08, "grad_condition": 331808797.86113906, "lr": 0.0005209378268645994, "time_sec": 15.497188806533813 }, { "epoch": 74, "train_loss": 0.40033238063812254, "train_acc": 0.87144, "test_loss": 1.985810231399536, "test_acc": 0.5849, "lyapunov": null, "grad_norm": 0.6995855816146154, "grad_max_sv": 0.31191978715360164, "grad_min_sv": 1.2527367021682167e-08, "grad_condition": 263818262.83558512, "lr": 0.0005104712099416781, "time_sec": 15.483733892440796 }, { "epoch": 75, "train_loss": 0.39340143531799315, "train_acc": 0.87318, "test_loss": 1.9034859148025514, "test_acc": 0.5988, "lyapunov": null, "grad_norm": 0.6917443264462005, "grad_max_sv": 0.3097103513777256, "grad_min_sv": 1.2234487580323195e-08, "grad_condition": 189402494.46869463, "lr": 0.0004999999999999996, "time_sec": 15.491854667663574 }, { "epoch": 76, "train_loss": 0.38218573943138123, "train_acc": 0.87562, "test_loss": 1.9674748405456544, "test_acc": 0.5897, "lyapunov": null, "grad_norm": 0.6848552863949536, "grad_max_sv": 0.306015183404088, "grad_min_sv": 1.2231246879906843e-08, "grad_condition": 67368302.47465871, "lr": 0.0004895287900583212, "time_sec": 15.475126504898071 }, { "epoch": 77, "train_loss": 0.37298857500076293, "train_acc": 0.8782, "test_loss": 1.9116508392333984, "test_acc": 0.5973, "lyapunov": null, "grad_norm": 0.676733354734531, "grad_max_sv": 0.30364411063492297, "grad_min_sv": 1.2298366306937036e-08, "grad_condition": 113213891.7010752, "lr": 0.0004790621731353997, "time_sec": 15.476521015167236 }, { "epoch": 78, "train_loss": 0.3701143793487549, "train_acc": 0.88078, "test_loss": 2.085685297012329, "test_acc": 0.5795, "lyapunov": null, "grad_norm": 0.6755741762416969, "grad_max_sv": 0.30699342787265776, "grad_min_sv": 1.205234841629107e-08, "grad_condition": 3030668677.964108, "lr": 0.000468604740235343, "time_sec": 15.484160423278809 }, { "epoch": 79, "train_loss": 0.36959360103607175, "train_acc": 0.87916, "test_loss": 1.9509956113815308, "test_acc": 0.601, "lyapunov": null, "grad_norm": 0.6757618176434513, "grad_max_sv": 0.3065595250576735, "grad_min_sv": 1.2097158442331279e-08, "grad_condition": 77210703.25088154, "lr": 0.00045816107833384175, "time_sec": 15.480469226837158 }, { "epoch": 80, "train_loss": 0.3621886194419861, "train_acc": 0.88318, "test_loss": 1.9287394012451171, "test_acc": 0.5985, "lyapunov": null, "grad_norm": 0.6691339361755074, "grad_max_sv": 0.3024368964135647, "grad_min_sv": 1.2120088314785185e-08, "grad_condition": 405016123.1402856, "lr": 0.0004477357683661729, "time_sec": 15.493567705154419 }, { "epoch": 81, "train_loss": 0.35030229503631594, "train_acc": 0.88624, "test_loss": 2.00673182220459, "test_acc": 0.5919, "lyapunov": null, "grad_norm": 0.6596224304671231, "grad_max_sv": 0.29136806540191174, "grad_min_sv": 1.127730693450046e-08, "grad_condition": 1639288832.1236253, "lr": 0.00043733338321784746, "time_sec": 15.493369817733765 }, { "epoch": 82, "train_loss": 0.34493877026557923, "train_acc": 0.8872, "test_loss": 2.030837797164917, "test_acc": 0.5955, "lyapunov": null, "grad_norm": 0.656267153049647, "grad_max_sv": 0.28955256529152396, "grad_min_sv": 1.1868315586143104e-08, "grad_condition": 869246762.0746359, "lr": 0.0004269584857187939, "time_sec": 15.51423978805542 }, { "epoch": 83, "train_loss": 0.33515030410289764, "train_acc": 0.89166, "test_loss": 2.0619586929321287, "test_acc": 0.5889, "lyapunov": null, "grad_norm": 0.6433611607654642, "grad_max_sv": 0.28342132121324537, "grad_min_sv": 1.1435175364601923e-08, "grad_condition": 62926422.11698373, "lr": 0.0004166156266419484, "time_sec": 15.476901769638062 }, { "epoch": 84, "train_loss": 0.33155179508209226, "train_acc": 0.8925, "test_loss": 2.021995645713806, "test_acc": 0.5931, "lyapunov": null, "grad_norm": 0.6432295423646542, "grad_max_sv": 0.29169376716017725, "grad_min_sv": 1.1024380705050054e-08, "grad_condition": 1442816426.8026254, "lr": 0.0004063093427071373, "time_sec": 15.489609479904175 }, { "epoch": 85, "train_loss": 0.32435158078193665, "train_acc": 0.89488, "test_loss": 2.013304320335388, "test_acc": 0.5916, "lyapunov": null, "grad_norm": 0.6387569144998656, "grad_max_sv": 0.29359805807471273, "grad_min_sv": 1.1595539084474638e-08, "grad_condition": 189598831.94028363, "lr": 0.0003960441545911199, "time_sec": 15.501060247421265 }, { "epoch": 86, "train_loss": 0.3179238869667053, "train_acc": 0.89698, "test_loss": 1.9903604904174805, "test_acc": 0.5974, "lyapunov": null, "grad_norm": 0.6339090393643317, "grad_max_sv": 0.2939893651753664, "grad_min_sv": 1.1321056620980375e-08, "grad_condition": 126309584.77428427, "lr": 0.0003858245649446718, "time_sec": 15.473534345626831 }, { "epoch": 87, "train_loss": 0.3082590392589569, "train_acc": 0.90084, "test_loss": 1.9719016357421875, "test_acc": 0.5973, "lyapunov": null, "grad_norm": 0.6204648872897773, "grad_max_sv": 0.2808060821145773, "grad_min_sv": 1.1003370339922671e-08, "grad_condition": 295054731.1552657, "lr": 0.00037565505641757235, "time_sec": 15.489596128463745 }, { "epoch": 88, "train_loss": 0.30407683875083924, "train_acc": 0.9015, "test_loss": 2.046679413032532, "test_acc": 0.5983, "lyapunov": null, "grad_norm": 0.6232550099645187, "grad_max_sv": 0.2919613588601351, "grad_min_sv": 1.106688122280361e-08, "grad_condition": 322143674.85252506, "lr": 0.00036554008969236695, "time_sec": 15.49986457824707 }, { "epoch": 89, "train_loss": 0.3027446964073181, "train_acc": 0.90118, "test_loss": 2.086252244949341, "test_acc": 0.5888, "lyapunov": null, "grad_norm": 0.6190288324649083, "grad_max_sv": 0.28052753023803234, "grad_min_sv": 1.0900322809496467e-08, "grad_condition": 566479183.315316, "lr": 0.0003554841015277638, "time_sec": 15.504590034484863 }, { "epoch": 90, "train_loss": 0.29228587161064146, "train_acc": 0.9047, "test_loss": 2.0138395809173586, "test_acc": 0.5944, "lyapunov": null, "grad_norm": 0.6096912272320082, "grad_max_sv": 0.28337894156575205, "grad_min_sv": 1.0885550369042416e-08, "grad_condition": 2055184394.3102565, "lr": 0.000345491502812526, "time_sec": 15.49034571647644 }, { "epoch": 91, "train_loss": 0.2902773824119568, "train_acc": 0.9069, "test_loss": 2.0066411319732667, "test_acc": 0.6022, "lyapunov": null, "grad_norm": 0.6066794741118794, "grad_max_sv": 0.27967384792864325, "grad_min_sv": 1.113149796019841e-08, "grad_condition": 126085093.27825883, "lr": 0.0003355666766307081, "time_sec": 15.486260652542114 }, { "epoch": 92, "train_loss": 0.2833449110221863, "train_acc": 0.90814, "test_loss": 2.077221655654907, "test_acc": 0.5914, "lyapunov": null, "grad_norm": 0.6042052133918574, "grad_max_sv": 0.27325271964073183, "grad_min_sv": 1.057503346621057e-08, "grad_condition": 3596600642.934755, "lr": 0.00032571397633909225, "time_sec": 15.505445957183838 }, { "epoch": 93, "train_loss": 0.275921519203186, "train_acc": 0.91156, "test_loss": 2.0253973026275633, "test_acc": 0.6011, "lyapunov": null, "grad_norm": 0.596345487343705, "grad_max_sv": 0.27955980561673643, "grad_min_sv": 1.0745895713884512e-08, "grad_condition": 99226565.9342475, "lr": 0.00031593772365766094, "time_sec": 15.494666337966919 }, { "epoch": 94, "train_loss": 0.27615388660430906, "train_acc": 0.90982, "test_loss": 2.0751438976287844, "test_acc": 0.5926, "lyapunov": null, "grad_norm": 0.5987218023474344, "grad_max_sv": 0.27597025111317636, "grad_min_sv": 1.0580089662877434e-08, "grad_condition": 377084496.3903383, "lr": 0.0003062422067739483, "time_sec": 15.47998309135437 }, { "epoch": 95, "train_loss": 0.26991701264381407, "train_acc": 0.9106, "test_loss": 2.065015655708313, "test_acc": 0.5995, "lyapunov": null, "grad_norm": 0.591359331692498, "grad_max_sv": 0.280801360309124, "grad_min_sv": 1.058501965522929e-08, "grad_condition": 177268235.5442259, "lr": 0.00029663167846209965, "time_sec": 15.503370761871338 }, { "epoch": 96, "train_loss": 0.26606324160575867, "train_acc": 0.9137, "test_loss": 2.0547151592254638, "test_acc": 0.6024, "lyapunov": null, "grad_norm": 0.5902198713479344, "grad_max_sv": 0.2709753967821598, "grad_min_sv": 1.0618598106555168e-08, "grad_condition": 842340240.5160465, "lr": 0.00028711035421746345, "time_sec": 15.498698949813843 }, { "epoch": 97, "train_loss": 0.25566293501853943, "train_acc": 0.91732, "test_loss": 2.007575707626343, "test_acc": 0.5994, "lyapunov": null, "grad_norm": 0.5817467490050799, "grad_max_sv": 0.2697387088090181, "grad_min_sv": 1.025438704743524e-08, "grad_condition": 463836797.56778467, "lr": 0.00027768241040753615, "time_sec": 15.489367485046387 }, { "epoch": 98, "train_loss": 0.2515622547864914, "train_acc": 0.91842, "test_loss": 2.04601014251709, "test_acc": 0.6008, "lyapunov": null, "grad_norm": 0.5794799592204589, "grad_max_sv": 0.26677791140973567, "grad_min_sv": 1.029050446439174e-08, "grad_condition": 588388249.9313815, "lr": 0.00026835198244006903, "time_sec": 15.474334001541138 }, { "epoch": 99, "train_loss": 0.24500514444351196, "train_acc": 0.92196, "test_loss": 2.086534292602539, "test_acc": 0.6033, "lyapunov": null, "grad_norm": 0.5694490714138027, "grad_max_sv": 0.2623301979154348, "grad_min_sv": 9.966415031648947e-09, "grad_condition": 1015125356.3291184, "lr": 0.0002591231629491421, "time_sec": 15.491194248199463 }, { "epoch": 100, "train_loss": 0.24579128606796263, "train_acc": 0.92022, "test_loss": 2.033238724517822, "test_acc": 0.6073, "lyapunov": null, "grad_norm": 0.5680720755555388, "grad_max_sv": 0.25963654592633245, "grad_min_sv": 9.939859338002274e-09, "grad_condition": 445557731.47806203, "lr": 0.0002499999999999997, "time_sec": 15.490838050842285 }, { "epoch": 101, "train_loss": 0.24127339096069336, "train_acc": 0.92306, "test_loss": 2.1002378002166746, "test_acc": 0.6036, "lyapunov": null, "grad_norm": 0.5641906297524981, "grad_max_sv": 0.27549757733941077, "grad_min_sv": 1.0068470844863327e-08, "grad_condition": 409101783.765684, "lr": 0.00024098649531343477, "time_sec": 15.490317106246948 }, { "epoch": 102, "train_loss": 0.2390659130167961, "train_acc": 0.9225, "test_loss": 2.0233927448272704, "test_acc": 0.6081, "lyapunov": null, "grad_norm": 0.5658609942304538, "grad_max_sv": 0.2694991033524275, "grad_min_sv": 9.839277652549483e-09, "grad_condition": 3844646046.5289702, "lr": 0.0002320866025105016, "time_sec": 15.493839740753174 }, { "epoch": 103, "train_loss": 0.23365470203876496, "train_acc": 0.92546, "test_loss": 2.007601522064209, "test_acc": 0.6095, "lyapunov": null, "grad_norm": 0.5584257053092218, "grad_max_sv": 0.2743960417807102, "grad_min_sv": 1.0207792428690299e-08, "grad_condition": 250547163.15828475, "lr": 0.0002233042253783278, "time_sec": 15.469611167907715 }, { "epoch": 104, "train_loss": 0.22797604578971864, "train_acc": 0.92666, "test_loss": 1.9921390232086182, "test_acc": 0.6104, "lyapunov": null, "grad_norm": 0.5477060234172001, "grad_max_sv": 0.2509814579039812, "grad_min_sv": 9.610087979301102e-09, "grad_condition": 2430635198.302944, "lr": 0.000214643216157784, "time_sec": 15.485874652862549 }, { "epoch": 105, "train_loss": 0.2194866455602646, "train_acc": 0.92896, "test_loss": 2.065049479866028, "test_acc": 0.6048, "lyapunov": null, "grad_norm": 0.5427601977062464, "grad_max_sv": 0.24938638992607592, "grad_min_sv": 9.552283189700334e-09, "grad_condition": 249820703.92123896, "lr": 0.00020610737385376332, "time_sec": 15.492459058761597 }, { "epoch": 106, "train_loss": 0.22127391705036165, "train_acc": 0.9277, "test_loss": 2.0674615295410157, "test_acc": 0.6066, "lyapunov": null, "grad_norm": 0.545565415204051, "grad_max_sv": 0.252237818390131, "grad_min_sv": 9.870081852563286e-09, "grad_condition": 1730317003.0799267, "lr": 0.00019770044256881242, "time_sec": 15.494806051254272 }, { "epoch": 107, "train_loss": 0.21957805599212646, "train_acc": 0.92936, "test_loss": 2.069959518432617, "test_acc": 0.6059, "lyapunov": null, "grad_norm": 0.5427102510735407, "grad_max_sv": 0.26037181839346885, "grad_min_sv": 9.796433978262464e-09, "grad_condition": 619659373.2197987, "lr": 0.0001894261098608447, "time_sec": 15.494577169418335 }, { "epoch": 108, "train_loss": 0.21802687605857848, "train_acc": 0.92854, "test_loss": 2.069862120437622, "test_acc": 0.6064, "lyapunov": null, "grad_norm": 0.5412145734801318, "grad_max_sv": 0.26357722133398054, "grad_min_sv": 9.731102705856913e-09, "grad_condition": 4896886016.781491, "lr": 0.000181288005125655, "time_sec": 15.492915630340576 }, { "epoch": 109, "train_loss": 0.2105085688495636, "train_acc": 0.9329, "test_loss": 2.0300133407592775, "test_acc": 0.6118, "lyapunov": null, "grad_norm": 0.5316865416598037, "grad_max_sv": 0.24584890641272067, "grad_min_sv": 9.288343090713484e-09, "grad_condition": 1467162755.386783, "lr": 0.0001732896980049473, "time_sec": 15.496263980865479 }, { "epoch": 110, "train_loss": 0.20778575693130494, "train_acc": 0.9324, "test_loss": 2.033147290420532, "test_acc": 0.6113, "lyapunov": null, "grad_norm": 0.5310273370102141, "grad_max_sv": 0.25715232640504837, "grad_min_sv": 9.619756366117082e-09, "grad_condition": 909703469.1889927, "lr": 0.00016543469682057076, "time_sec": 15.48079514503479 }, { "epoch": 111, "train_loss": 0.2022018117570877, "train_acc": 0.93408, "test_loss": 2.0903577659606936, "test_acc": 0.6097, "lyapunov": null, "grad_norm": 0.5248885212713278, "grad_max_sv": 0.25115896202623844, "grad_min_sv": 9.449230327059423e-09, "grad_condition": 654306379.114652, "lr": 0.00015772644703565552, "time_sec": 15.481376886367798 }, { "epoch": 112, "train_loss": 0.2012022008705139, "train_acc": 0.93478, "test_loss": 2.1256960330963133, "test_acc": 0.6062, "lyapunov": null, "grad_norm": 0.5259715208516651, "grad_max_sv": 0.25880570262670516, "grad_min_sv": 9.483339922537942e-09, "grad_condition": 3450539548.1120477, "lr": 0.00015016832974331713, "time_sec": 15.474645853042603 }, { "epoch": 113, "train_loss": 0.20022091041088105, "train_acc": 0.9359, "test_loss": 2.0813249099731443, "test_acc": 0.6127, "lyapunov": null, "grad_norm": 0.518582122023061, "grad_max_sv": 0.25183347687125207, "grad_min_sv": 9.362834274724563e-09, "grad_condition": 206343345.02075773, "lr": 0.00014276366018359834, "time_sec": 15.51976227760315 }, { "epoch": 114, "train_loss": 0.20003674240589142, "train_acc": 0.93548, "test_loss": 2.059957353401184, "test_acc": 0.6113, "lyapunov": null, "grad_norm": 0.5204510649985771, "grad_max_sv": 0.24840169511735438, "grad_min_sv": 9.433198861711483e-09, "grad_condition": 156281157.83753783, "lr": 0.00013551568628929425, "time_sec": 15.486659526824951 }, { "epoch": 115, "train_loss": 0.19450239594459534, "train_acc": 0.9368, "test_loss": 2.081795527267456, "test_acc": 0.613, "lyapunov": null, "grad_norm": 0.513222572000434, "grad_max_sv": 0.25595347620546816, "grad_min_sv": 9.54867237041787e-09, "grad_condition": 768174194.3770015, "lr": 0.00012842758726130276, "time_sec": 15.51030945777893 }, { "epoch": 116, "train_loss": 0.19022185802936553, "train_acc": 0.93888, "test_loss": 2.0910057247161866, "test_acc": 0.6109, "lyapunov": null, "grad_norm": 0.509950221902217, "grad_max_sv": 0.24649180248379707, "grad_min_sv": 9.286189562706521e-09, "grad_condition": 190506622.94702727, "lr": 0.0001215024721741218, "time_sec": 15.4960777759552 }, { "epoch": 117, "train_loss": 0.18697156070709228, "train_acc": 0.9409, "test_loss": 2.1048245140075683, "test_acc": 0.6113, "lyapunov": null, "grad_norm": 0.5023066665762482, "grad_max_sv": 0.24158176295459272, "grad_min_sv": 9.132921396148092e-09, "grad_condition": 4603577974.011314, "lr": 0.00011474337861210538, "time_sec": 15.499973773956299 }, { "epoch": 118, "train_loss": 0.1897142271566391, "train_acc": 0.93756, "test_loss": 2.0972971321105955, "test_acc": 0.611, "lyapunov": null, "grad_norm": 0.5079589956238173, "grad_max_sv": 0.23757222667336464, "grad_min_sv": 8.902529727208147e-09, "grad_condition": 203658547.6693558, "lr": 0.00010815327133708009, "time_sec": 15.504847049713135 }, { "epoch": 119, "train_loss": 0.1865368722629547, "train_acc": 0.93914, "test_loss": 2.071676664352417, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.503144489128604, "grad_max_sv": 0.24214695654809476, "grad_min_sv": 9.078004823076872e-09, "grad_condition": 401272428.2934058, "lr": 0.00010173504098790182, "time_sec": 15.494940042495728 }, { "epoch": 120, "train_loss": 0.18263185959339143, "train_acc": 0.9413, "test_loss": 2.0995028049468996, "test_acc": 0.61, "lyapunov": null, "grad_norm": 0.49963467133223916, "grad_max_sv": 0.2448117069900036, "grad_min_sv": 9.255170430218228e-09, "grad_condition": 840960640.7523018, "lr": 9.549150281252629e-05, "time_sec": 15.50493049621582 }, { "epoch": 121, "train_loss": 0.17661990516662598, "train_acc": 0.94376, "test_loss": 2.0479217910766603, "test_acc": 0.6139, "lyapunov": null, "grad_norm": 0.49017967274439106, "grad_max_sv": 0.24487083926796913, "grad_min_sv": 9.062790381261093e-09, "grad_condition": 297900363.86286056, "lr": 8.942539543314794e-05, "time_sec": 15.500595331192017 }, { "epoch": 122, "train_loss": 0.17436686351299285, "train_acc": 0.94568, "test_loss": 2.1033685138702394, "test_acc": 0.6076, "lyapunov": null, "grad_norm": 0.4850908453719191, "grad_max_sv": 0.24267951920628547, "grad_min_sv": 9.175133607909614e-09, "grad_condition": 151651082.8966439, "lr": 8.353937964495024e-05, "time_sec": 15.500707149505615 }, { "epoch": 123, "train_loss": 0.17420966561317444, "train_acc": 0.94574, "test_loss": 2.0771576751708984, "test_acc": 0.6091, "lyapunov": null, "grad_norm": 0.48697820878218756, "grad_max_sv": 0.24934822954237462, "grad_min_sv": 9.043736691862272e-09, "grad_condition": 342563176.44086933, "lr": 7.783603724899243e-05, "time_sec": 15.506757974624634 }, { "epoch": 124, "train_loss": 0.1725812414932251, "train_acc": 0.94486, "test_loss": 2.135185445022583, "test_acc": 0.608, "lyapunov": null, "grad_norm": 0.4844109930695783, "grad_max_sv": 0.24152979552745818, "grad_min_sv": 9.037162034160328e-09, "grad_condition": 142594941.29597357, "lr": 7.231786991974666e-05, "time_sec": 15.495522499084473 }, { "epoch": 125, "train_loss": 0.17122176954269408, "train_acc": 0.94558, "test_loss": 2.1152863483428956, "test_acc": 0.612, "lyapunov": null, "grad_norm": 0.4826385410866865, "grad_max_sv": 0.24549916423857213, "grad_min_sv": 8.782795131207118e-09, "grad_condition": 1347993858.355885, "lr": 6.698729810778072e-05, "time_sec": 15.489627361297607 }, { "epoch": 126, "train_loss": 0.17058868828058243, "train_acc": 0.94662, "test_loss": 2.1105800861358643, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.48281055678110163, "grad_max_sv": 0.24400779306888581, "grad_min_sv": 8.881911921611655e-09, "grad_condition": 907798367.550338, "lr": 6.184665997806817e-05, "time_sec": 15.487231254577637 }, { "epoch": 127, "train_loss": 0.16842705961704255, "train_acc": 0.94676, "test_loss": 2.075766274642944, "test_acc": 0.6129, "lyapunov": null, "grad_norm": 0.4814153543267475, "grad_max_sv": 0.24004302807152272, "grad_min_sv": 8.701755094839368e-09, "grad_condition": 2608046426.213746, "lr": 5.6898210384392595e-05, "time_sec": 15.498921394348145 }, { "epoch": 128, "train_loss": 0.16494292568683624, "train_acc": 0.94768, "test_loss": 2.151611907196045, "test_acc": 0.6047, "lyapunov": null, "grad_norm": 0.4763822150733386, "grad_max_sv": 0.22842325568199157, "grad_min_sv": 8.631154578726818e-09, "grad_condition": 260686423.05458745, "lr": 5.214411988029363e-05, "time_sec": 15.489452600479126 }, { "epoch": 129, "train_loss": 0.16430129640102387, "train_acc": 0.94824, "test_loss": 2.0951647556304933, "test_acc": 0.6128, "lyapunov": null, "grad_norm": 0.4754481221102857, "grad_max_sv": 0.23247553929686546, "grad_min_sv": 8.414460946461547e-09, "grad_condition": 437817787.9214033, "lr": 4.7586473766990294e-05, "time_sec": 15.491871118545532 }, { "epoch": 130, "train_loss": 0.16159661509513856, "train_acc": 0.94926, "test_loss": 2.0767082111358643, "test_acc": 0.6156, "lyapunov": null, "grad_norm": 0.4695751355550292, "grad_max_sv": 0.24420519769191742, "grad_min_sv": 8.783045789696309e-09, "grad_condition": 2887625517.4136095, "lr": 4.32272711786996e-05, "time_sec": 15.50525712966919 }, { "epoch": 131, "train_loss": 0.16233114049911498, "train_acc": 0.94986, "test_loss": 2.090193899154663, "test_acc": 0.6138, "lyapunov": null, "grad_norm": 0.4718133586500909, "grad_max_sv": 0.23811170123517514, "grad_min_sv": 8.731167988607069e-09, "grad_condition": 171473959.97673047, "lr": 3.906842420574966e-05, "time_sec": 15.489828824996948 }, { "epoch": 132, "train_loss": 0.16304145799160003, "train_acc": 0.9489, "test_loss": 2.0699268299102784, "test_acc": 0.6176, "lyapunov": null, "grad_norm": 0.47181034193305915, "grad_max_sv": 0.24468088522553444, "grad_min_sv": 8.694641913677115e-09, "grad_condition": 3950610050.0669045, "lr": 3.5111757055874305e-05, "time_sec": 15.489463329315186 }, { "epoch": 133, "train_loss": 0.16222090543746948, "train_acc": 0.94862, "test_loss": 2.0846460132598876, "test_acc": 0.6154, "lyapunov": null, "grad_norm": 0.47432514605256276, "grad_max_sv": 0.2351464234292507, "grad_min_sv": 8.508125437679944e-09, "grad_condition": 3262769680.1508665, "lr": 3.1359005254054254e-05, "time_sec": 15.493263721466064 }, { "epoch": 134, "train_loss": 0.1564504327917099, "train_acc": 0.95064, "test_loss": 2.039795367050171, "test_acc": 0.616, "lyapunov": null, "grad_norm": 0.46132567077349346, "grad_max_sv": 0.23477552309632302, "grad_min_sv": 8.499829853240298e-09, "grad_condition": 275652896.5549098, "lr": 2.7811814881259484e-05, "time_sec": 15.501915693283081 }, { "epoch": 135, "train_loss": 0.1633557910346985, "train_acc": 0.94906, "test_loss": 2.1431523998260498, "test_acc": 0.6082, "lyapunov": null, "grad_norm": 0.4725347110912027, "grad_max_sv": 0.2321782097220421, "grad_min_sv": 8.273568699135141e-09, "grad_condition": 719211854.1190578, "lr": 2.4471741852423218e-05, "time_sec": 15.49996304512024 }, { "epoch": 136, "train_loss": 0.1577922046995163, "train_acc": 0.95056, "test_loss": 2.039000785446167, "test_acc": 0.6154, "lyapunov": null, "grad_norm": 0.46347763663429586, "grad_max_sv": 0.23204916007816792, "grad_min_sv": 8.698969911215922e-09, "grad_condition": 2466699319.0239253, "lr": 2.1340251233966362e-05, "time_sec": 15.497424125671387 }, { "epoch": 137, "train_loss": 0.15701312964439393, "train_acc": 0.94962, "test_loss": 2.085305763244629, "test_acc": 0.6149, "lyapunov": null, "grad_norm": 0.46705315608384584, "grad_max_sv": 0.22602895461022854, "grad_min_sv": 8.363478537018877e-09, "grad_condition": 5418883019.032962, "lr": 1.8418716601170932e-05, "time_sec": 15.491859674453735 }, { "epoch": 138, "train_loss": 0.15615028873443604, "train_acc": 0.95128, "test_loss": 2.101923070907593, "test_acc": 0.6133, "lyapunov": null, "grad_norm": 0.46267937397470993, "grad_max_sv": 0.23617675378918648, "grad_min_sv": 8.55792531187071e-09, "grad_condition": 668785672.229811, "lr": 1.570841943568445e-05, "time_sec": 15.490991592407227 }, { "epoch": 139, "train_loss": 0.15497800857305527, "train_acc": 0.95104, "test_loss": 2.131324795150757, "test_acc": 0.6096, "lyapunov": null, "grad_norm": 0.4627316674414162, "grad_max_sv": 0.23336338251829147, "grad_min_sv": 8.54283688542061e-09, "grad_condition": 547232078.4054619, "lr": 1.3210548563419845e-05, "time_sec": 15.493245840072632 }, { "epoch": 140, "train_loss": 0.15815438273906707, "train_acc": 0.95054, "test_loss": 2.0743191734313964, "test_acc": 0.6132, "lyapunov": null, "grad_norm": 0.46525185071118685, "grad_max_sv": 0.23031578138470649, "grad_min_sv": 8.578327668909771e-09, "grad_condition": 1472538153.7679148, "lr": 1.0926199633097203e-05, "time_sec": 15.508398056030273 }, { "epoch": 141, "train_loss": 0.15565036369800567, "train_acc": 0.95156, "test_loss": 2.083190835571289, "test_acc": 0.6143, "lyapunov": null, "grad_norm": 0.4634211187185363, "grad_max_sv": 0.2209864068776369, "grad_min_sv": 8.388305931458784e-09, "grad_condition": 735187313.3407264, "lr": 8.856374635655688e-06, "time_sec": 15.477578163146973 }, { "epoch": 142, "train_loss": 0.1526834367275238, "train_acc": 0.95296, "test_loss": 2.0579229915618895, "test_acc": 0.6125, "lyapunov": null, "grad_norm": 0.45577943773159835, "grad_max_sv": 0.22755092419683934, "grad_min_sv": 8.457177222030362e-09, "grad_condition": 1934756909.5252705, "lr": 7.001981464747503e-06, "time_sec": 15.47980809211731 }, { "epoch": 143, "train_loss": 0.1551715327501297, "train_acc": 0.95138, "test_loss": 2.094068197631836, "test_acc": 0.6117, "lyapunov": null, "grad_norm": 0.46037433954931045, "grad_max_sv": 0.22780660428106786, "grad_min_sv": 8.502836361531321e-09, "grad_condition": 963929271.8099291, "lr": 5.3638335185058295e-06, "time_sec": 15.485134363174438 }, { "epoch": 144, "train_loss": 0.15432416381835937, "train_acc": 0.95178, "test_loss": 2.110651277923584, "test_acc": 0.6145, "lyapunov": null, "grad_norm": 0.4613614148812742, "grad_max_sv": 0.22735756635665894, "grad_min_sv": 8.44454743694368e-09, "grad_condition": 1076939620.5494838, "lr": 3.942649342761114e-06, "time_sec": 15.493315696716309 }, { "epoch": 145, "train_loss": 0.15650244321346282, "train_acc": 0.95044, "test_loss": 2.0880191951751708, "test_acc": 0.6119, "lyapunov": null, "grad_norm": 0.4660268832705423, "grad_max_sv": 0.23027937039732932, "grad_min_sv": 8.513131491633477e-09, "grad_condition": 297143450.17696226, "lr": 2.7390523158633524e-06, "time_sec": 15.480180501937866 }, { "epoch": 146, "train_loss": 0.15448970682621002, "train_acc": 0.952, "test_loss": 2.0194208770751954, "test_acc": 0.621, "lyapunov": null, "grad_norm": 0.4600178145858194, "grad_max_sv": 0.22371375933289528, "grad_min_sv": 8.652061342297613e-09, "grad_condition": 2586380341.3174944, "lr": 1.7535703752478133e-06, "time_sec": 15.502386331558228 }, { "epoch": 147, "train_loss": 0.15414279275417328, "train_acc": 0.95114, "test_loss": 2.1069964057922363, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.4616285885002781, "grad_max_sv": 0.2342820342630148, "grad_min_sv": 8.68108046944878e-09, "grad_condition": 379507449.7225493, "lr": 9.866357858642196e-07, "time_sec": 15.488835096359253 }, { "epoch": 148, "train_loss": 0.15620617700576783, "train_acc": 0.95078, "test_loss": 2.1161761821746827, "test_acc": 0.6085, "lyapunov": null, "grad_norm": 0.46475971700568747, "grad_max_sv": 0.2303019493818283, "grad_min_sv": 8.695906369591763e-09, "grad_condition": 729395813.573787, "lr": 4.38584950570808e-07, "time_sec": 15.500977277755737 }, { "epoch": 149, "train_loss": 0.1530400000667572, "train_acc": 0.95168, "test_loss": 2.0760107112884523, "test_acc": 0.6147, "lyapunov": null, "grad_norm": 0.4585791144767188, "grad_max_sv": 0.23029794916510582, "grad_min_sv": 8.466522902726702e-09, "grad_condition": 540903237.1982462, "lr": 1.096582625772501e-07, "time_sec": 15.49415111541748 }, { "epoch": 150, "train_loss": 0.15208094583511353, "train_acc": 0.95228, "test_loss": 2.0765135959625245, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.45743890734329773, "grad_max_sv": 0.23194126076996327, "grad_min_sv": 8.657490525268864e-09, "grad_condition": 1180436704.3069885, "lr": 0.0, "time_sec": 15.487801790237427 } ], "8": [ { "epoch": 1, "train_loss": 4.642479771652222, "train_acc": 0.0563, "test_loss": 4.471788549804687, "test_acc": 0.0525, "lyapunov": null, "grad_norm": 6.299700683423435, "grad_max_sv": 5.376748514175415, "grad_min_sv": 1.0876815811078355e-07, "grad_condition": 123806577.64929362, "lr": 0.0009998903417374227, "time_sec": 32.55821919441223 }, { "epoch": 2, "train_loss": 3.921236069869995, "train_acc": 0.1164, "test_loss": 4.031661200714112, "test_acc": 0.0987, "lyapunov": null, "grad_norm": 4.744809408953577, "grad_max_sv": 4.056096857786178, "grad_min_sv": 8.545224932585138e-08, "grad_condition": 432966802.88566554, "lr": 0.0009995614150494292, "time_sec": 32.52909827232361 }, { "epoch": 3, "train_loss": 3.563258330001831, "train_acc": 0.16394, "test_loss": 3.665959655380249, "test_acc": 0.1478, "lyapunov": null, "grad_norm": 3.968544793489477, "grad_max_sv": 3.2656030714511872, "grad_min_sv": 7.328074659307404e-08, "grad_condition": 54148101.24592471, "lr": 0.0009990133642141358, "time_sec": 32.514859199523926 }, { "epoch": 4, "train_loss": 3.30762485168457, "train_acc": 0.20282, "test_loss": 3.602442971038818, "test_acc": 0.1715, "lyapunov": null, "grad_norm": 3.360539325527588, "grad_max_sv": 2.5611240684986116, "grad_min_sv": 6.275024531099404e-08, "grad_condition": 48558402.55237199, "lr": 0.0009982464296247522, "time_sec": 32.511942863464355 }, { "epoch": 5, "train_loss": 3.070727022857666, "train_acc": 0.2431, "test_loss": 3.0896433425903322, "test_acc": 0.2428, "lyapunov": null, "grad_norm": 2.8612981669887914, "grad_max_sv": 2.039329302310944, "grad_min_sv": 5.3213209671998385e-08, "grad_condition": 45899387.46141158, "lr": 0.0009972609476841367, "time_sec": 32.535019874572754 }, { "epoch": 6, "train_loss": 2.873271194458008, "train_acc": 0.2795, "test_loss": 3.0904090099334716, "test_acc": 0.2488, "lyapunov": null, "grad_norm": 2.4953735022476837, "grad_max_sv": 1.6734129816293717, "grad_min_sv": 4.6456209978895655e-08, "grad_condition": 55631562.29872565, "lr": 0.000996057350657239, "time_sec": 32.5289192199707 }, { "epoch": 7, "train_loss": 2.698648819732666, "train_acc": 0.31066, "test_loss": 2.9098104148864747, "test_acc": 0.2799, "lyapunov": null, "grad_norm": 2.1963953249289316, "grad_max_sv": 1.3662363350391389, "grad_min_sv": 4.123726340746203e-08, "grad_condition": 175183802.14149565, "lr": 0.000994636166481494, "time_sec": 32.53304076194763 }, { "epoch": 8, "train_loss": 2.5489939933776857, "train_acc": 0.3414, "test_loss": 2.918805715942383, "test_acc": 0.2796, "lyapunov": null, "grad_norm": 1.9702205989411337, "grad_max_sv": 1.1486580684781074, "grad_min_sv": 3.6719605156498857e-08, "grad_condition": 45078452.49282994, "lr": 0.0009929980185352525, "time_sec": 32.52384686470032 }, { "epoch": 9, "train_loss": 2.429889005661011, "train_acc": 0.36856, "test_loss": 2.617208067703247, "test_acc": 0.3352, "lyapunov": null, "grad_norm": 1.7958642065413024, "grad_max_sv": 0.976833887398243, "grad_min_sv": 3.4111676243397945e-08, "grad_condition": 88392837.95669074, "lr": 0.0009911436253643444, "time_sec": 32.52341938018799 }, { "epoch": 10, "train_loss": 2.312202433395386, "train_acc": 0.39006, "test_loss": 2.6336415348052977, "test_acc": 0.3376, "lyapunov": null, "grad_norm": 1.6688154279715788, "grad_max_sv": 0.8335120677947998, "grad_min_sv": 3.1057890326202656e-08, "grad_condition": 43581868.8179111, "lr": 0.0009890738003669028, "time_sec": 32.53657627105713 }, { "epoch": 11, "train_loss": 2.2113982202911378, "train_acc": 0.41394, "test_loss": 2.4651415496826172, "test_acc": 0.3668, "lyapunov": null, "grad_norm": 1.5852177586967415, "grad_max_sv": 0.7658713042736054, "grad_min_sv": 2.981889714037678e-08, "grad_condition": 33093574.792371016, "lr": 0.00098678945143658, "time_sec": 32.52194833755493 }, { "epoch": 12, "train_loss": 2.1308777001190187, "train_acc": 0.432, "test_loss": 2.5040061386108396, "test_acc": 0.3654, "lyapunov": null, "grad_norm": 1.5129835225343262, "grad_max_sv": 0.6879909574985504, "grad_min_sv": 2.8309841176854533e-08, "grad_condition": 30209408.624890875, "lr": 0.0009842915805643154, "time_sec": 32.519477128982544 }, { "epoch": 13, "train_loss": 2.051232373428345, "train_acc": 0.4496, "test_loss": 2.3721223037719725, "test_acc": 0.3951, "lyapunov": null, "grad_norm": 1.4527042328822815, "grad_max_sv": 0.6657147958874703, "grad_min_sv": 2.7529119311919813e-08, "grad_condition": 32877524.0735294, "lr": 0.000981581283398829, "time_sec": 32.51488184928894 }, { "epoch": 14, "train_loss": 1.9786859475326537, "train_acc": 0.46372, "test_loss": 2.4099101028442385, "test_acc": 0.3885, "lyapunov": null, "grad_norm": 1.3903946049407439, "grad_max_sv": 0.619149561971426, "grad_min_sv": 2.6381883344583912e-08, "grad_condition": 32158488.579634093, "lr": 0.0009786597487660333, "time_sec": 32.53034734725952 }, { "epoch": 15, "train_loss": 1.9087054037857056, "train_acc": 0.48146, "test_loss": 2.356669859313965, "test_acc": 0.4054, "lyapunov": null, "grad_norm": 1.3401497982688246, "grad_max_sv": 0.5884689308702946, "grad_min_sv": 2.5261919572860948e-08, "grad_condition": 27243493.57243519, "lr": 0.0009755282581475766, "time_sec": 32.53805232048035 }, { "epoch": 16, "train_loss": 1.8580862741851807, "train_acc": 0.4903, "test_loss": 2.3727874526977537, "test_acc": 0.3978, "lyapunov": null, "grad_norm": 1.2980660063098806, "grad_max_sv": 0.5687403865158558, "grad_min_sv": 2.4705210138753485e-08, "grad_condition": 36506916.881677285, "lr": 0.0009721881851187403, "time_sec": 32.529054403305054 }, { "epoch": 17, "train_loss": 1.7838218069458007, "train_acc": 0.50946, "test_loss": 2.411915710067749, "test_acc": 0.4013, "lyapunov": null, "grad_norm": 1.2536082066251264, "grad_max_sv": 0.5238922812044621, "grad_min_sv": 2.3606322296920722e-08, "grad_condition": 36849925.4309851, "lr": 0.0009686409947459456, "time_sec": 32.526257038116455 }, { "epoch": 18, "train_loss": 1.7371992016983033, "train_acc": 0.51958, "test_loss": 2.2599031024932863, "test_acc": 0.4264, "lyapunov": null, "grad_norm": 1.229284180873741, "grad_max_sv": 0.5230717524886132, "grad_min_sv": 2.312521401454104e-08, "grad_condition": 49053511.209702894, "lr": 0.0009648882429441254, "time_sec": 32.5399911403656 }, { "epoch": 19, "train_loss": 1.6830381874847413, "train_acc": 0.53178, "test_loss": 2.1889729766845702, "test_acc": 0.4447, "lyapunov": null, "grad_norm": 1.1785390649791196, "grad_max_sv": 0.4872257113456726, "grad_min_sv": 2.2137700339541766e-08, "grad_condition": 138866163.95418012, "lr": 0.00096093157579425, "time_sec": 32.52653670310974 }, { "epoch": 20, "train_loss": 1.6344180388641358, "train_acc": 0.54714, "test_loss": 2.227257891082764, "test_acc": 0.4375, "lyapunov": null, "grad_norm": 1.1489035121891145, "grad_max_sv": 0.47284500747919084, "grad_min_sv": 2.1496744417870418e-08, "grad_condition": 29593450.061258078, "lr": 0.0009567727288213001, "time_sec": 32.52734684944153 }, { "epoch": 21, "train_loss": 1.5880603087615968, "train_acc": 0.55388, "test_loss": 2.109391535949707, "test_acc": 0.4605, "lyapunov": null, "grad_norm": 1.1350345214433142, "grad_max_sv": 0.47259567975997924, "grad_min_sv": 2.13382750108293e-08, "grad_condition": 39203948.276769534, "lr": 0.0009524135262330095, "time_sec": 32.51701855659485 }, { "epoch": 22, "train_loss": 1.5451898790740968, "train_acc": 0.56776, "test_loss": 2.1289856529235838, "test_acc": 0.4622, "lyapunov": null, "grad_norm": 1.1083032352595108, "grad_max_sv": 0.44387331902980803, "grad_min_sv": 2.0636199499213248e-08, "grad_condition": 31425874.99589374, "lr": 0.0009478558801197061, "time_sec": 32.51593995094299 }, { "epoch": 23, "train_loss": 1.4903677392959596, "train_acc": 0.57754, "test_loss": 2.133696251296997, "test_acc": 0.4671, "lyapunov": null, "grad_norm": 1.0825668306165386, "grad_max_sv": 0.4390222616493702, "grad_min_sv": 2.047547279677986e-08, "grad_condition": 129993822.14571199, "lr": 0.000943101789615607, "time_sec": 32.51069974899292 }, { "epoch": 24, "train_loss": 1.4748817832183838, "train_acc": 0.58158, "test_loss": 2.1626602745056154, "test_acc": 0.4632, "lyapunov": null, "grad_norm": 1.0751338305034317, "grad_max_sv": 0.43956650570034983, "grad_min_sv": 2.0244324640261713e-08, "grad_condition": 41342301.85017798, "lr": 0.0009381533400219313, "time_sec": 32.533777952194214 }, { "epoch": 25, "train_loss": 1.4211272861099242, "train_acc": 0.5951, "test_loss": 2.096311450576782, "test_acc": 0.481, "lyapunov": null, "grad_norm": 1.0399638076679998, "grad_max_sv": 0.42748609334230425, "grad_min_sv": 1.9937479189824357e-08, "grad_condition": 38871491.7985058, "lr": 0.0009330127018922189, "time_sec": 32.53145217895508 }, { "epoch": 26, "train_loss": 1.396544298095703, "train_acc": 0.6008, "test_loss": 2.1271941719055176, "test_acc": 0.4714, "lyapunov": null, "grad_norm": 1.028506322176559, "grad_max_sv": 0.4079991213977337, "grad_min_sv": 1.9165852835345554e-08, "grad_condition": 39309871.185656376, "lr": 0.000927682130080253, "time_sec": 32.53234934806824 }, { "epoch": 27, "train_loss": 1.361050274734497, "train_acc": 0.60774, "test_loss": 2.0897907325744627, "test_acc": 0.4811, "lyapunov": null, "grad_norm": 1.009655904655981, "grad_max_sv": 0.39270137771964075, "grad_min_sv": 1.8564359835493426e-08, "grad_condition": 28517922.90367631, "lr": 0.0009221639627510072, "time_sec": 32.54458284378052 }, { "epoch": 28, "train_loss": 1.3167539808654785, "train_acc": 0.62254, "test_loss": 2.2306322479248046, "test_acc": 0.4663, "lyapunov": null, "grad_norm": 0.9884512545787755, "grad_max_sv": 0.393748565018177, "grad_min_sv": 1.8592529393846036e-08, "grad_condition": 34171303.89028352, "lr": 0.0009164606203550494, "time_sec": 32.525365352630615 }, { "epoch": 29, "train_loss": 1.2844751734542847, "train_acc": 0.62692, "test_loss": 2.19309764251709, "test_acc": 0.4751, "lyapunov": null, "grad_norm": 0.9700062599103884, "grad_max_sv": 0.387305423617363, "grad_min_sv": 1.7872535887364373e-08, "grad_condition": 26903062.552241027, "lr": 0.0009105746045668516, "time_sec": 32.526561975479126 }, { "epoch": 30, "train_loss": 1.2640808475494385, "train_acc": 0.63334, "test_loss": 2.2757652931213377, "test_acc": 0.4536, "lyapunov": null, "grad_norm": 0.9608534659761124, "grad_max_sv": 0.39087340533733367, "grad_min_sv": 1.800268759344359e-08, "grad_condition": 33161981.652286977, "lr": 0.0009045084971874733, "time_sec": 32.51922965049744 }, { "epoch": 31, "train_loss": 1.2303438648223877, "train_acc": 0.64076, "test_loss": 2.1164483276367188, "test_acc": 0.4864, "lyapunov": null, "grad_norm": 0.9467438832197973, "grad_max_sv": 0.3729639552533627, "grad_min_sv": 1.7477179434233213e-08, "grad_condition": 28618454.375976466, "lr": 0.0008982649590120977, "time_sec": 32.51436138153076 }, { "epoch": 32, "train_loss": 1.2104430978012084, "train_acc": 0.6455, "test_loss": 2.2232689281463625, "test_acc": 0.481, "lyapunov": null, "grad_norm": 0.9361931150490757, "grad_max_sv": 0.37210237309336663, "grad_min_sv": 1.7445883718214537e-08, "grad_condition": 29250266.68112684, "lr": 0.0008918467286629196, "time_sec": 32.532060861587524 }, { "epoch": 33, "train_loss": 1.1789497135162355, "train_acc": 0.65278, "test_loss": 2.143947396850586, "test_acc": 0.4907, "lyapunov": null, "grad_norm": 0.9196344126113596, "grad_max_sv": 0.367071446031332, "grad_min_sv": 1.6865934492071855e-08, "grad_condition": 40056883.7628016, "lr": 0.0008852566213878943, "time_sec": 32.526479959487915 }, { "epoch": 34, "train_loss": 1.1554690090179442, "train_acc": 0.65844, "test_loss": 2.1499678684234618, "test_acc": 0.4922, "lyapunov": null, "grad_norm": 0.9057802742532243, "grad_max_sv": 0.3550798542797565, "grad_min_sv": 1.6556807021315262e-08, "grad_condition": 255610578.57101497, "lr": 0.000878497527825878, "time_sec": 32.53326392173767 }, { "epoch": 35, "train_loss": 1.1325925022506713, "train_acc": 0.66696, "test_loss": 2.187357851409912, "test_acc": 0.498, "lyapunov": null, "grad_norm": 0.8980481880537616, "grad_max_sv": 0.35023384541273117, "grad_min_sv": 1.653067620913107e-08, "grad_condition": 47664672.04568529, "lr": 0.000871572412738697, "time_sec": 32.529192209243774 }, { "epoch": 36, "train_loss": 1.1162108192062379, "train_acc": 0.67076, "test_loss": 2.078928050994873, "test_acc": 0.5062, "lyapunov": null, "grad_norm": 0.8887291214894226, "grad_max_sv": 0.34587462246418, "grad_min_sv": 1.598691768550653e-08, "grad_condition": 47253750.309311725, "lr": 0.0008644843137107055, "time_sec": 32.53391623497009 }, { "epoch": 37, "train_loss": 1.088490778541565, "train_acc": 0.67814, "test_loss": 2.117596751022339, "test_acc": 0.5079, "lyapunov": null, "grad_norm": 0.8827902897341499, "grad_max_sv": 0.3460941031575203, "grad_min_sv": 1.613751039689776e-08, "grad_condition": 120430106.41639173, "lr": 0.0008572363398164014, "time_sec": 32.52939796447754 }, { "epoch": 38, "train_loss": 1.0622543322944642, "train_acc": 0.68324, "test_loss": 2.2524201555252077, "test_acc": 0.4904, "lyapunov": null, "grad_norm": 0.8643928358196139, "grad_max_sv": 0.3311579547822475, "grad_min_sv": 1.5921391385842476e-08, "grad_condition": 28147641.32749777, "lr": 0.0008498316702566826, "time_sec": 32.51650023460388 }, { "epoch": 39, "train_loss": 1.0258385097503662, "train_acc": 0.6921, "test_loss": 2.215389312553406, "test_acc": 0.4912, "lyapunov": null, "grad_norm": 0.8507960671612714, "grad_max_sv": 0.3430253557860851, "grad_min_sv": 1.6041156275514722e-08, "grad_condition": 41417221.90444088, "lr": 0.0008422735529643442, "time_sec": 32.51078248023987 }, { "epoch": 40, "train_loss": 1.008150099067688, "train_acc": 0.69894, "test_loss": 2.285165777206421, "test_acc": 0.4887, "lyapunov": null, "grad_norm": 0.8500378683317822, "grad_max_sv": 0.33013429269194605, "grad_min_sv": 1.547893761040184e-08, "grad_condition": 735713799.268648, "lr": 0.0008345653031794289, "time_sec": 32.51578617095947 }, { "epoch": 41, "train_loss": 0.9898018364715576, "train_acc": 0.70114, "test_loss": 2.1710759185791018, "test_acc": 0.5054, "lyapunov": null, "grad_norm": 0.845636323093009, "grad_max_sv": 0.334617256373167, "grad_min_sv": 1.552002822438614e-08, "grad_condition": 178790285.2774743, "lr": 0.0008267103019950526, "time_sec": 32.55498909950256 }, { "epoch": 42, "train_loss": 0.9689999252319336, "train_acc": 0.70992, "test_loss": 2.1532568422317504, "test_acc": 0.5088, "lyapunov": null, "grad_norm": 0.8290515928528267, "grad_max_sv": 0.32156808376312257, "grad_min_sv": 1.513711112358096e-08, "grad_condition": 63393159.17157264, "lr": 0.0008187119948743447, "time_sec": 32.5278046131134 }, { "epoch": 43, "train_loss": 0.9382334645080567, "train_acc": 0.7173, "test_loss": 2.1617983654022215, "test_acc": 0.5099, "lyapunov": null, "grad_norm": 0.8199573726083517, "grad_max_sv": 0.3176788903772831, "grad_min_sv": 1.4969858624924724e-08, "grad_condition": 39337083.20882653, "lr": 0.000810573890139155, "time_sec": 32.54653334617615 }, { "epoch": 44, "train_loss": 0.9182830782318115, "train_acc": 0.7211, "test_loss": 2.2938510860443113, "test_acc": 0.5032, "lyapunov": null, "grad_norm": 0.8158010406023241, "grad_max_sv": 0.32802748009562493, "grad_min_sv": 1.5100565674969203e-08, "grad_condition": 67700595.0906401, "lr": 0.0008022995574311873, "time_sec": 32.530778884887695 }, { "epoch": 45, "train_loss": 0.89899619556427, "train_acc": 0.72596, "test_loss": 2.3243038515090944, "test_acc": 0.4978, "lyapunov": null, "grad_norm": 0.8106149860815325, "grad_max_sv": 0.31970001086592675, "grad_min_sv": 1.444995242211311e-08, "grad_condition": 61707891.58292439, "lr": 0.0007938926261462363, "time_sec": 32.53210163116455 }, { "epoch": 46, "train_loss": 0.8833617488861084, "train_acc": 0.72982, "test_loss": 2.3542774658203127, "test_acc": 0.4957, "lyapunov": null, "grad_norm": 0.8034668926314622, "grad_max_sv": 0.3169444307684898, "grad_min_sv": 1.4620525734955046e-08, "grad_condition": 2306938949.5105658, "lr": 0.0007853567838422158, "time_sec": 32.52321457862854 }, { "epoch": 47, "train_loss": 0.8611621459960938, "train_acc": 0.73636, "test_loss": 2.3614687870025635, "test_acc": 0.5019, "lyapunov": null, "grad_norm": 0.7952702534581538, "grad_max_sv": 0.3213916938751936, "grad_min_sv": 1.4360261544471564e-08, "grad_condition": 98833361.99001758, "lr": 0.0007766957746216719, "time_sec": 32.551071643829346 }, { "epoch": 48, "train_loss": 0.8414902052116394, "train_acc": 0.74232, "test_loss": 2.3029669830322264, "test_acc": 0.5085, "lyapunov": null, "grad_norm": 0.784297561095192, "grad_max_sv": 0.3114811100065708, "grad_min_sv": 1.4304356266148232e-08, "grad_condition": 35252220.65254038, "lr": 0.0007679133974894982, "time_sec": 32.53156328201294 }, { "epoch": 49, "train_loss": 0.8309669767951965, "train_acc": 0.74656, "test_loss": 2.286893635559082, "test_acc": 0.5045, "lyapunov": null, "grad_norm": 0.7866799445354931, "grad_max_sv": 0.31325423568487165, "grad_min_sv": 1.420554635719537e-08, "grad_condition": 245828981.88515216, "lr": 0.000759013504686565, "time_sec": 32.530038595199585 }, { "epoch": 50, "train_loss": 0.7998139995956421, "train_acc": 0.75392, "test_loss": 2.3185002082824706, "test_acc": 0.5087, "lyapunov": null, "grad_norm": 0.7702444904048175, "grad_max_sv": 0.3126057405024767, "grad_min_sv": 1.4057572236413247e-08, "grad_condition": 895759530.8359982, "lr": 0.0007499999999999998, "time_sec": 32.539623498916626 }, { "epoch": 51, "train_loss": 0.7901191444015503, "train_acc": 0.75788, "test_loss": 2.337850633239746, "test_acc": 0.509, "lyapunov": null, "grad_norm": 0.7647274965495858, "grad_max_sv": 0.3004269126802683, "grad_min_sv": 1.4008410850752107e-08, "grad_condition": 176379975.2857924, "lr": 0.0007408768370508575, "time_sec": 32.52524662017822 }, { "epoch": 52, "train_loss": 0.7781133801651001, "train_acc": 0.76004, "test_loss": 2.3018055530548094, "test_acc": 0.5142, "lyapunov": null, "grad_norm": 0.7628575677364715, "grad_max_sv": 0.3077410638332367, "grad_min_sv": 1.3944687078052547e-08, "grad_condition": 476227675.55278826, "lr": 0.0007316480175599307, "time_sec": 32.53758096694946 }, { "epoch": 53, "train_loss": 0.7562806001663208, "train_acc": 0.7648, "test_loss": 2.379827104949951, "test_acc": 0.5063, "lyapunov": null, "grad_norm": 0.7526764366291289, "grad_max_sv": 0.30248577073216437, "grad_min_sv": 1.3496081205355803e-08, "grad_condition": 1089676260.2113607, "lr": 0.0007223175895924635, "time_sec": 32.54466271400452 }, { "epoch": 54, "train_loss": 0.7475943574333191, "train_acc": 0.76786, "test_loss": 2.377075054550171, "test_acc": 0.512, "lyapunov": null, "grad_norm": 0.750215382398683, "grad_max_sv": 0.3043755616992712, "grad_min_sv": 1.3518679307933379e-08, "grad_condition": 37379268.11133198, "lr": 0.0007128896457825361, "time_sec": 32.53366780281067 }, { "epoch": 55, "train_loss": 0.7366778998947143, "train_acc": 0.77304, "test_loss": 2.4013710193634035, "test_acc": 0.5052, "lyapunov": null, "grad_norm": 0.7465343546140976, "grad_max_sv": 0.30028381906449797, "grad_min_sv": 1.382671875327368e-08, "grad_condition": 28698720.96166121, "lr": 0.0007033683215378998, "time_sec": 32.53609323501587 }, { "epoch": 56, "train_loss": 0.7091366660690308, "train_acc": 0.77762, "test_loss": 2.33411563911438, "test_acc": 0.5126, "lyapunov": null, "grad_norm": 0.7380136003829837, "grad_max_sv": 0.2953734669834375, "grad_min_sv": 1.303365445352823e-08, "grad_condition": 1175915690.269457, "lr": 0.0006937577932260512, "time_sec": 32.5473690032959 }, { "epoch": 57, "train_loss": 0.6999513886070251, "train_acc": 0.78266, "test_loss": 2.43815316696167, "test_acc": 0.5107, "lyapunov": null, "grad_norm": 0.7328699359209336, "grad_max_sv": 0.2920531783252954, "grad_min_sv": 1.2993845399135451e-08, "grad_condition": 152587828.403437, "lr": 0.0006840622763423388, "time_sec": 32.55185127258301 }, { "epoch": 58, "train_loss": 0.6799741724395751, "train_acc": 0.78742, "test_loss": 2.381142023277283, "test_acc": 0.5177, "lyapunov": null, "grad_norm": 0.7278793670004745, "grad_max_sv": 0.2917668532580137, "grad_min_sv": 1.304645755725517e-08, "grad_condition": 169810706.32481682, "lr": 0.0006742860236609073, "time_sec": 32.537921667099 }, { "epoch": 59, "train_loss": 0.6622171486473083, "train_acc": 0.79306, "test_loss": 2.350548614120483, "test_acc": 0.5197, "lyapunov": null, "grad_norm": 0.7160794966099063, "grad_max_sv": 0.28989222049713137, "grad_min_sv": 1.3154668510517373e-08, "grad_condition": 518100543.52278435, "lr": 0.0006644333233692913, "time_sec": 32.556652784347534 }, { "epoch": 60, "train_loss": 0.6548414518356324, "train_acc": 0.79498, "test_loss": 2.558105725860596, "test_acc": 0.5026, "lyapunov": null, "grad_norm": 0.7139601066120349, "grad_max_sv": 0.2839757200330496, "grad_min_sv": 1.2719528911207812e-08, "grad_condition": 106598497.36127238, "lr": 0.0006545084971874734, "time_sec": 32.54617619514465 }, { "epoch": 61, "train_loss": 0.6367912077522278, "train_acc": 0.79956, "test_loss": 2.549720768737793, "test_acc": 0.503, "lyapunov": null, "grad_norm": 0.7072938119035849, "grad_max_sv": 0.2815666403621435, "grad_min_sv": 1.2655917643131925e-08, "grad_condition": 351545390.3878931, "lr": 0.0006445158984722354, "time_sec": 32.52895545959473 }, { "epoch": 62, "train_loss": 0.6108809622764587, "train_acc": 0.80962, "test_loss": 2.4582517892837523, "test_acc": 0.5155, "lyapunov": null, "grad_norm": 0.6871779503013541, "grad_max_sv": 0.27853575013577936, "grad_min_sv": 1.2499909360016991e-08, "grad_condition": 84323115.24066128, "lr": 0.0006344599103076324, "time_sec": 32.53638219833374 }, { "epoch": 63, "train_loss": 0.6110955193519593, "train_acc": 0.8082, "test_loss": 2.421668832015991, "test_acc": 0.5218, "lyapunov": null, "grad_norm": 0.6974575785480693, "grad_max_sv": 0.29437441378831863, "grad_min_sv": 1.2760532111023327e-08, "grad_condition": 1141074655.802474, "lr": 0.0006243449435824269, "time_sec": 32.5341739654541 }, { "epoch": 64, "train_loss": 0.5902745287513733, "train_acc": 0.81326, "test_loss": 2.525721709823608, "test_acc": 0.5137, "lyapunov": null, "grad_norm": 0.6819775061327956, "grad_max_sv": 0.2760129250586033, "grad_min_sv": 1.2472146640636617e-08, "grad_condition": 153380994.2741132, "lr": 0.0006141754350553275, "time_sec": 32.54224371910095 }, { "epoch": 65, "train_loss": 0.5767888858222961, "train_acc": 0.81892, "test_loss": 2.5681256893157958, "test_acc": 0.5109, "lyapunov": null, "grad_norm": 0.6842883453940269, "grad_max_sv": 0.27693442031741144, "grad_min_sv": 1.214616162405202e-08, "grad_condition": 180936373.24743983, "lr": 0.0006039558454088793, "time_sec": 32.535571575164795 }, { "epoch": 66, "train_loss": 0.5719620153427124, "train_acc": 0.81766, "test_loss": 2.4380872802734377, "test_acc": 0.5187, "lyapunov": null, "grad_norm": 0.6845868887152398, "grad_max_sv": 0.2806558083742857, "grad_min_sv": 1.2417019015428798e-08, "grad_condition": 91981311.14124386, "lr": 0.000593690657292862, "time_sec": 32.537678956985474 }, { "epoch": 67, "train_loss": 0.5476583632850647, "train_acc": 0.8273, "test_loss": 2.4955981588363647, "test_acc": 0.5183, "lyapunov": null, "grad_norm": 0.6627927561159936, "grad_max_sv": 0.27053381204605104, "grad_min_sv": 1.1682474739156678e-08, "grad_condition": 119357334.07208268, "lr": 0.0005833843733580507, "time_sec": 32.53704595565796 }, { "epoch": 68, "train_loss": 0.5349030065536499, "train_acc": 0.82988, "test_loss": 2.576411254119873, "test_acc": 0.5106, "lyapunov": null, "grad_norm": 0.6582392321316073, "grad_max_sv": 0.27176710218191147, "grad_min_sv": 1.180562275559377e-08, "grad_condition": 846305950.6996868, "lr": 0.0005730415142812054, "time_sec": 32.54088878631592 }, { "epoch": 69, "train_loss": 0.5356097626113892, "train_acc": 0.82918, "test_loss": 2.5702699626922607, "test_acc": 0.5154, "lyapunov": null, "grad_norm": 0.6641979366792015, "grad_max_sv": 0.27518576607108114, "grad_min_sv": 1.2052892484938627e-08, "grad_condition": 130030350.74337718, "lr": 0.0005626666167821517, "time_sec": 32.54138922691345 }, { "epoch": 70, "train_loss": 0.513014861240387, "train_acc": 0.8363, "test_loss": 2.6079680850982667, "test_acc": 0.5106, "lyapunov": null, "grad_norm": 0.6500943565960319, "grad_max_sv": 0.2724282074719667, "grad_min_sv": 1.178367022645465e-08, "grad_condition": 673776556.319051, "lr": 0.0005522642316338265, "time_sec": 32.5693633556366 }, { "epoch": 71, "train_loss": 0.49603789474487303, "train_acc": 0.84198, "test_loss": 2.5577601636886595, "test_acc": 0.5169, "lyapunov": null, "grad_norm": 0.6430240258167331, "grad_max_sv": 0.27023660503327845, "grad_min_sv": 1.1744692686443959e-08, "grad_condition": 80314537.0435541, "lr": 0.0005418389216661573, "time_sec": 32.54641532897949 }, { "epoch": 72, "train_loss": 0.49025250810623167, "train_acc": 0.8432, "test_loss": 2.5663631786346435, "test_acc": 0.5234, "lyapunov": null, "grad_norm": 0.643279476058677, "grad_max_sv": 0.27230227626860143, "grad_min_sv": 1.1624652314357053e-08, "grad_condition": 62786442.37501116, "lr": 0.0005313952597646563, "time_sec": 32.54123497009277 }, { "epoch": 73, "train_loss": 0.48772711526870727, "train_acc": 0.84528, "test_loss": 2.648895852470398, "test_acc": 0.5168, "lyapunov": null, "grad_norm": 0.6405905214601311, "grad_max_sv": 0.2699441872537136, "grad_min_sv": 1.1482883187884097e-08, "grad_condition": 111834993.35897943, "lr": 0.0005209378268645994, "time_sec": 32.56350803375244 }, { "epoch": 74, "train_loss": 0.467068857088089, "train_acc": 0.84904, "test_loss": 2.6479972763061523, "test_acc": 0.5139, "lyapunov": null, "grad_norm": 0.6363491242612465, "grad_max_sv": 0.2783078793436289, "grad_min_sv": 1.1536390146556913e-08, "grad_condition": 219390233.59819812, "lr": 0.0005104712099416781, "time_sec": 32.546509981155396 }, { "epoch": 75, "train_loss": 0.4711385968875885, "train_acc": 0.84816, "test_loss": 2.608884352874756, "test_acc": 0.5195, "lyapunov": null, "grad_norm": 0.6374082155755629, "grad_max_sv": 0.26901070438325403, "grad_min_sv": 1.1190769711073856e-08, "grad_condition": 334559678.03980315, "lr": 0.0004999999999999996, "time_sec": 32.54527187347412 }, { "epoch": 76, "train_loss": 0.45760808762550353, "train_acc": 0.85254, "test_loss": 2.6803735092163086, "test_acc": 0.5135, "lyapunov": null, "grad_norm": 0.6239727106157842, "grad_max_sv": 0.2669793125241995, "grad_min_sv": 1.1426927580722445e-08, "grad_condition": 760532191.4933506, "lr": 0.0004895287900583212, "time_sec": 32.556286096572876 }, { "epoch": 77, "train_loss": 0.4403402804660797, "train_acc": 0.85888, "test_loss": 2.6952022495269774, "test_acc": 0.5153, "lyapunov": null, "grad_norm": 0.6180261512024202, "grad_max_sv": 0.2674210451543331, "grad_min_sv": 1.1284923026578207e-08, "grad_condition": 800342890.6120255, "lr": 0.0004790621731353997, "time_sec": 32.570063829422 }, { "epoch": 78, "train_loss": 0.43386900725364685, "train_acc": 0.8609, "test_loss": 2.6530003887176514, "test_acc": 0.5232, "lyapunov": null, "grad_norm": 0.6088851948477753, "grad_max_sv": 0.2547843284904957, "grad_min_sv": 1.0926095429623917e-08, "grad_condition": 95464128.01992908, "lr": 0.000468604740235343, "time_sec": 32.54688787460327 }, { "epoch": 79, "train_loss": 0.4240487690734863, "train_acc": 0.8654, "test_loss": 2.7931711376190185, "test_acc": 0.5088, "lyapunov": null, "grad_norm": 0.5993382897461283, "grad_max_sv": 0.24774248749017716, "grad_min_sv": 1.07508628526291e-08, "grad_condition": 623384828.9212538, "lr": 0.00045816107833384175, "time_sec": 32.54505252838135 }, { "epoch": 80, "train_loss": 0.4058323986816406, "train_acc": 0.86904, "test_loss": 2.6775668907165526, "test_acc": 0.5171, "lyapunov": null, "grad_norm": 0.5885819627420461, "grad_max_sv": 0.24584074690937996, "grad_min_sv": 1.022559682466867e-08, "grad_condition": 156757634.53668588, "lr": 0.0004477357683661729, "time_sec": 32.55807185173035 }, { "epoch": 81, "train_loss": 0.3943421869087219, "train_acc": 0.87248, "test_loss": 2.596042275619507, "test_acc": 0.5241, "lyapunov": null, "grad_norm": 0.5915570736864834, "grad_max_sv": 0.252938449382782, "grad_min_sv": 1.0551333432320953e-08, "grad_condition": 290621793.5733338, "lr": 0.00043733338321784746, "time_sec": 32.56740355491638 }, { "epoch": 82, "train_loss": 0.39024432485580446, "train_acc": 0.87492, "test_loss": 2.715544410324097, "test_acc": 0.5245, "lyapunov": null, "grad_norm": 0.5825377843109248, "grad_max_sv": 0.2532011177390814, "grad_min_sv": 1.0358391808878986e-08, "grad_condition": 412597611.83888507, "lr": 0.0004269584857187939, "time_sec": 32.55344319343567 }, { "epoch": 83, "train_loss": 0.3715799244689941, "train_acc": 0.88012, "test_loss": 2.6901692249298095, "test_acc": 0.5264, "lyapunov": null, "grad_norm": 0.5717041976150569, "grad_max_sv": 0.24421822614967822, "grad_min_sv": 1.0306600353336345e-08, "grad_condition": 329985889.12779623, "lr": 0.0004166156266419484, "time_sec": 32.559467792510986 }, { "epoch": 84, "train_loss": 0.3671589259147644, "train_acc": 0.882, "test_loss": 2.6448453563690184, "test_acc": 0.5345, "lyapunov": null, "grad_norm": 0.5691852194449533, "grad_max_sv": 0.24019994884729384, "grad_min_sv": 9.989625743278551e-09, "grad_condition": 122734290.43687347, "lr": 0.0004063093427071373, "time_sec": 32.583213567733765 }, { "epoch": 85, "train_loss": 0.35963713159561156, "train_acc": 0.8824, "test_loss": 2.718573891067505, "test_acc": 0.5235, "lyapunov": null, "grad_norm": 0.5695765343654775, "grad_max_sv": 0.24239672683179378, "grad_min_sv": 1.0202618674231591e-08, "grad_condition": 1852046324.0623333, "lr": 0.0003960441545911199, "time_sec": 32.562474727630615 }, { "epoch": 86, "train_loss": 0.35900317364692685, "train_acc": 0.88314, "test_loss": 2.690758750152588, "test_acc": 0.5281, "lyapunov": null, "grad_norm": 0.5695226754489282, "grad_max_sv": 0.2359969958662987, "grad_min_sv": 9.85500920487603e-09, "grad_condition": 394077563.11466306, "lr": 0.0003858245649446718, "time_sec": 32.56024169921875 }, { "epoch": 87, "train_loss": 0.34593051030158994, "train_acc": 0.88774, "test_loss": 2.6911534130096437, "test_acc": 0.5276, "lyapunov": null, "grad_norm": 0.5605319049257929, "grad_max_sv": 0.24156057350337506, "grad_min_sv": 9.944241273420092e-09, "grad_condition": 944172650.8084786, "lr": 0.00037565505641757235, "time_sec": 32.55394530296326 }, { "epoch": 88, "train_loss": 0.3350362122821808, "train_acc": 0.89292, "test_loss": 2.761347038269043, "test_acc": 0.5248, "lyapunov": null, "grad_norm": 0.5537857918957506, "grad_max_sv": 0.24467103444039823, "grad_min_sv": 9.84480716557587e-09, "grad_condition": 557423472.2448919, "lr": 0.00036554008969236695, "time_sec": 32.565001487731934 }, { "epoch": 89, "train_loss": 0.32590197957992556, "train_acc": 0.89466, "test_loss": 2.873864278793335, "test_acc": 0.5155, "lyapunov": null, "grad_norm": 0.5519161551510952, "grad_max_sv": 0.2400045834481716, "grad_min_sv": 9.881915213807297e-09, "grad_condition": 248477788.07047543, "lr": 0.0003554841015277638, "time_sec": 32.55529260635376 }, { "epoch": 90, "train_loss": 0.31863860460281374, "train_acc": 0.89664, "test_loss": 2.8045926555633547, "test_acc": 0.5231, "lyapunov": null, "grad_norm": 0.5479641587602809, "grad_max_sv": 0.24628719314932823, "grad_min_sv": 1.0033076104122573e-08, "grad_condition": 105371945.52289103, "lr": 0.000345491502812526, "time_sec": 32.55959415435791 }, { "epoch": 91, "train_loss": 0.31169461310863494, "train_acc": 0.89832, "test_loss": 2.764314810180664, "test_acc": 0.5242, "lyapunov": null, "grad_norm": 0.5454170376093662, "grad_max_sv": 0.24890379793941975, "grad_min_sv": 9.700326364034394e-09, "grad_condition": 77171376.4128032, "lr": 0.0003355666766307081, "time_sec": 32.56360149383545 }, { "epoch": 92, "train_loss": 0.3113831770801544, "train_acc": 0.90008, "test_loss": 2.778244842529297, "test_acc": 0.5291, "lyapunov": null, "grad_norm": 0.5407137447043685, "grad_max_sv": 0.23328636735677719, "grad_min_sv": 9.360961983687077e-09, "grad_condition": 128397939.07976246, "lr": 0.00032571397633909225, "time_sec": 32.571138858795166 }, { "epoch": 93, "train_loss": 0.30188457230567933, "train_acc": 0.903, "test_loss": 2.7606024471282957, "test_acc": 0.5339, "lyapunov": null, "grad_norm": 0.5330386559824729, "grad_max_sv": 0.24647361300885678, "grad_min_sv": 9.782626700523788e-09, "grad_condition": 930794659.3385656, "lr": 0.00031593772365766094, "time_sec": 32.56698513031006 }, { "epoch": 94, "train_loss": 0.2888755958557129, "train_acc": 0.90584, "test_loss": 2.8303293384552, "test_acc": 0.5252, "lyapunov": null, "grad_norm": 0.5239071385040424, "grad_max_sv": 0.24134295992553234, "grad_min_sv": 9.665177403035685e-09, "grad_condition": 341790086.36703265, "lr": 0.0003062422067739483, "time_sec": 32.560898303985596 }, { "epoch": 95, "train_loss": 0.2843299233055115, "train_acc": 0.90856, "test_loss": 2.878970125961304, "test_acc": 0.5228, "lyapunov": null, "grad_norm": 0.5173032628331714, "grad_max_sv": 0.22986819855868817, "grad_min_sv": 9.369064224050081e-09, "grad_condition": 493164980.6666913, "lr": 0.00029663167846209965, "time_sec": 32.586976528167725 }, { "epoch": 96, "train_loss": 0.280480184469223, "train_acc": 0.9093, "test_loss": 2.9630297519683837, "test_acc": 0.5184, "lyapunov": null, "grad_norm": 0.5133233008116458, "grad_max_sv": 0.22380913645029069, "grad_min_sv": 9.095019559701712e-09, "grad_condition": 693584615.2355412, "lr": 0.00028711035421746345, "time_sec": 32.56851410865784 }, { "epoch": 97, "train_loss": 0.2670245563793182, "train_acc": 0.9139, "test_loss": 2.9036443214416505, "test_acc": 0.5232, "lyapunov": null, "grad_norm": 0.5060688229901619, "grad_max_sv": 0.23383041098713875, "grad_min_sv": 9.393182952245269e-09, "grad_condition": 365456172.90854704, "lr": 0.00027768241040753615, "time_sec": 32.560548305511475 }, { "epoch": 98, "train_loss": 0.2613537116527557, "train_acc": 0.91552, "test_loss": 2.93895020904541, "test_acc": 0.5186, "lyapunov": null, "grad_norm": 0.5033096276176704, "grad_max_sv": 0.22504370659589767, "grad_min_sv": 9.149747783043782e-09, "grad_condition": 181789237.51414594, "lr": 0.00026835198244006903, "time_sec": 32.57581615447998 }, { "epoch": 99, "train_loss": 0.25923142310142516, "train_acc": 0.91662, "test_loss": 2.9681204444885254, "test_acc": 0.519, "lyapunov": null, "grad_norm": 0.5005047043499057, "grad_max_sv": 0.23424391224980354, "grad_min_sv": 9.202334173646042e-09, "grad_condition": 1390486041.6800082, "lr": 0.0002591231629491421, "time_sec": 32.568488359451294 }, { "epoch": 100, "train_loss": 0.2552828652858734, "train_acc": 0.91668, "test_loss": 2.9585084489822386, "test_acc": 0.5195, "lyapunov": null, "grad_norm": 0.5000052829086656, "grad_max_sv": 0.23269009366631507, "grad_min_sv": 9.008429451874688e-09, "grad_condition": 118235741.33881798, "lr": 0.0002499999999999997, "time_sec": 32.64319896697998 }, { "epoch": 101, "train_loss": 0.2504552359342575, "train_acc": 0.92034, "test_loss": 2.881327504348755, "test_acc": 0.527, "lyapunov": null, "grad_norm": 0.4976095445457081, "grad_max_sv": 0.23710807636380196, "grad_min_sv": 8.987613531706572e-09, "grad_condition": 188175820.91636205, "lr": 0.00024098649531343477, "time_sec": 32.56459856033325 }, { "epoch": 102, "train_loss": 0.24319207516670227, "train_acc": 0.9211, "test_loss": 2.8339650466918944, "test_acc": 0.5304, "lyapunov": null, "grad_norm": 0.49020316429940586, "grad_max_sv": 0.22668980285525323, "grad_min_sv": 8.876688220674786e-09, "grad_condition": 3067014755.4611425, "lr": 0.0002320866025105016, "time_sec": 32.56655430793762 }, { "epoch": 103, "train_loss": 0.23643713227272034, "train_acc": 0.92328, "test_loss": 2.8374974479675292, "test_acc": 0.5312, "lyapunov": null, "grad_norm": 0.48382300142218854, "grad_max_sv": 0.22789723835885525, "grad_min_sv": 8.629146283113676e-09, "grad_condition": 335837582.58375555, "lr": 0.0002233042253783278, "time_sec": 32.56167936325073 }, { "epoch": 104, "train_loss": 0.23221797705173491, "train_acc": 0.92652, "test_loss": 2.8848680614471434, "test_acc": 0.5292, "lyapunov": null, "grad_norm": 0.47687316634744686, "grad_max_sv": 0.21569081246852875, "grad_min_sv": 8.62663665758762e-09, "grad_condition": 1157675505.971954, "lr": 0.000214643216157784, "time_sec": 32.563629150390625 }, { "epoch": 105, "train_loss": 0.2289664591026306, "train_acc": 0.9265, "test_loss": 2.9271271530151366, "test_acc": 0.5268, "lyapunov": null, "grad_norm": 0.47818041348027984, "grad_max_sv": 0.21913939844816924, "grad_min_sv": 8.707405810184226e-09, "grad_condition": 207155237.78245467, "lr": 0.00020610737385376332, "time_sec": 32.56299424171448 }, { "epoch": 106, "train_loss": 0.22260613627433776, "train_acc": 0.92814, "test_loss": 2.8978806022644044, "test_acc": 0.5295, "lyapunov": null, "grad_norm": 0.4722385726091627, "grad_max_sv": 0.2149375133216381, "grad_min_sv": 8.579168120879944e-09, "grad_condition": 165117262.170354, "lr": 0.00019770044256881242, "time_sec": 32.58579874038696 }, { "epoch": 107, "train_loss": 0.21763298731803893, "train_acc": 0.93018, "test_loss": 2.908183602523804, "test_acc": 0.5286, "lyapunov": null, "grad_norm": 0.4652522989647011, "grad_max_sv": 0.22290415540337563, "grad_min_sv": 8.928726000223541e-09, "grad_condition": 479064684.028664, "lr": 0.0001894261098608447, "time_sec": 32.594443798065186 }, { "epoch": 108, "train_loss": 0.2121983386325836, "train_acc": 0.9317, "test_loss": 2.8597964405059813, "test_acc": 0.5362, "lyapunov": null, "grad_norm": 0.45763107412030085, "grad_max_sv": 0.21216899007558823, "grad_min_sv": 8.420200893585924e-09, "grad_condition": 688259775.9446552, "lr": 0.000181288005125655, "time_sec": 32.56038689613342 }, { "epoch": 109, "train_loss": 0.20583704056739807, "train_acc": 0.93444, "test_loss": 2.9211787143707277, "test_acc": 0.5282, "lyapunov": null, "grad_norm": 0.4568920236456778, "grad_max_sv": 0.22295879386365414, "grad_min_sv": 8.673458856169048e-09, "grad_condition": 89075535.84085791, "lr": 0.0001732896980049473, "time_sec": 32.575947761535645 }, { "epoch": 110, "train_loss": 0.21038897478103638, "train_acc": 0.93206, "test_loss": 2.9601449073791506, "test_acc": 0.5279, "lyapunov": null, "grad_norm": 0.45979845223683363, "grad_max_sv": 0.22593539729714393, "grad_min_sv": 8.6531671937215e-09, "grad_condition": 89403715.48231289, "lr": 0.00016543469682057076, "time_sec": 32.607563495635986 }, { "epoch": 111, "train_loss": 0.19834216837882995, "train_acc": 0.93586, "test_loss": 2.9055423223495485, "test_acc": 0.5353, "lyapunov": null, "grad_norm": 0.44710603724659786, "grad_max_sv": 0.2183500427752733, "grad_min_sv": 8.1763572969476e-09, "grad_condition": 161545447.91228038, "lr": 0.00015772644703565552, "time_sec": 32.57204461097717 }, { "epoch": 112, "train_loss": 0.19908358410835267, "train_acc": 0.93552, "test_loss": 2.994161311531067, "test_acc": 0.5244, "lyapunov": null, "grad_norm": 0.4546597416131923, "grad_max_sv": 0.21809808388352395, "grad_min_sv": 8.425444494170043e-09, "grad_condition": 140538020.508261, "lr": 0.00015016832974331713, "time_sec": 32.601916790008545 }, { "epoch": 113, "train_loss": 0.191571541864872, "train_acc": 0.93866, "test_loss": 2.986764238739014, "test_acc": 0.5296, "lyapunov": null, "grad_norm": 0.4450596671055528, "grad_max_sv": 0.21210374720394612, "grad_min_sv": 8.032377695355725e-09, "grad_condition": 1444127435.9832203, "lr": 0.00014276366018359834, "time_sec": 32.559205770492554 }, { "epoch": 114, "train_loss": 0.1893005026912689, "train_acc": 0.93862, "test_loss": 3.0139925247192383, "test_acc": 0.5255, "lyapunov": null, "grad_norm": 0.4424054116910155, "grad_max_sv": 0.21594099812209605, "grad_min_sv": 8.292241756094332e-09, "grad_condition": 1221030181.2962646, "lr": 0.00013551568628929425, "time_sec": 32.54303812980652 }, { "epoch": 115, "train_loss": 0.1869383985710144, "train_acc": 0.94032, "test_loss": 2.9447794439315795, "test_acc": 0.5338, "lyapunov": null, "grad_norm": 0.44046789562845245, "grad_max_sv": 0.22429420053958893, "grad_min_sv": 8.562988351723532e-09, "grad_condition": 109188406.44486985, "lr": 0.00012842758726130276, "time_sec": 32.57725954055786 }, { "epoch": 116, "train_loss": 0.18216380766868592, "train_acc": 0.94282, "test_loss": 2.9761684719085695, "test_acc": 0.533, "lyapunov": null, "grad_norm": 0.43380483120573066, "grad_max_sv": 0.21227659583091735, "grad_min_sv": 8.084414394003703e-09, "grad_condition": 442388430.74640197, "lr": 0.0001215024721741218, "time_sec": 32.56703448295593 }, { "epoch": 117, "train_loss": 0.18284838955402374, "train_acc": 0.94104, "test_loss": 2.988401131248474, "test_acc": 0.5304, "lyapunov": null, "grad_norm": 0.43518014689479523, "grad_max_sv": 0.20529667772352694, "grad_min_sv": 8.008318215188027e-09, "grad_condition": 525224592.1224529, "lr": 0.00011474337861210538, "time_sec": 32.56633758544922 }, { "epoch": 118, "train_loss": 0.17929271565437316, "train_acc": 0.94202, "test_loss": 2.969692068481445, "test_acc": 0.531, "lyapunov": null, "grad_norm": 0.43166468988319484, "grad_max_sv": 0.20995365753769873, "grad_min_sv": 7.949281083993037e-09, "grad_condition": 206686551.43998715, "lr": 0.00010815327133708009, "time_sec": 32.58298921585083 }, { "epoch": 119, "train_loss": 0.1746947413468361, "train_acc": 0.94538, "test_loss": 2.9470513034820556, "test_acc": 0.5265, "lyapunov": null, "grad_norm": 0.4240479391496432, "grad_max_sv": 0.21465191170573233, "grad_min_sv": 8.01244074109808e-09, "grad_condition": 266673927.46960324, "lr": 0.00010173504098790182, "time_sec": 32.58079934120178 }, { "epoch": 120, "train_loss": 0.17056026011943817, "train_acc": 0.94666, "test_loss": 2.9715382446289063, "test_acc": 0.5374, "lyapunov": null, "grad_norm": 0.4216192661535551, "grad_max_sv": 0.21133692860603331, "grad_min_sv": 8.155698732288316e-09, "grad_condition": 310751065.89462894, "lr": 9.549150281252629e-05, "time_sec": 32.567041635513306 }, { "epoch": 121, "train_loss": 0.16829824639320373, "train_acc": 0.94648, "test_loss": 3.087546385574341, "test_acc": 0.5255, "lyapunov": null, "grad_norm": 0.4183748049917772, "grad_max_sv": 0.20680695101618768, "grad_min_sv": 7.995454154665922e-09, "grad_condition": 1023933342.3354034, "lr": 8.942539543314794e-05, "time_sec": 32.589598178863525 }, { "epoch": 122, "train_loss": 0.16800043944358825, "train_acc": 0.94632, "test_loss": 2.9318422325134277, "test_acc": 0.5338, "lyapunov": null, "grad_norm": 0.42099752391898676, "grad_max_sv": 0.21042499877512455, "grad_min_sv": 7.547093950439551e-09, "grad_condition": 900826897.3857119, "lr": 8.353937964495024e-05, "time_sec": 32.595381021499634 }, { "epoch": 123, "train_loss": 0.16323296820640565, "train_acc": 0.94816, "test_loss": 3.0529399940490722, "test_acc": 0.5285, "lyapunov": null, "grad_norm": 0.41313116824251195, "grad_max_sv": 0.19900580085814, "grad_min_sv": 7.892230206862915e-09, "grad_condition": 209614816.18259263, "lr": 7.783603724899243e-05, "time_sec": 32.5691282749176 }, { "epoch": 124, "train_loss": 0.16248614077568055, "train_acc": 0.94808, "test_loss": 2.968647869491577, "test_acc": 0.5376, "lyapunov": null, "grad_norm": 0.4109739294498664, "grad_max_sv": 0.2045503228902817, "grad_min_sv": 7.709402672934767e-09, "grad_condition": 204317712.1943869, "lr": 7.231786991974666e-05, "time_sec": 32.56873893737793 }, { "epoch": 125, "train_loss": 0.16562083917617798, "train_acc": 0.94652, "test_loss": 2.990608223724365, "test_acc": 0.5324, "lyapunov": null, "grad_norm": 0.41726227575170305, "grad_max_sv": 0.21484395451843738, "grad_min_sv": 8.067420890524312e-09, "grad_condition": 451509267.6606773, "lr": 6.698729810778072e-05, "time_sec": 32.563942432403564 }, { "epoch": 126, "train_loss": 0.16248787566184997, "train_acc": 0.94908, "test_loss": 3.0610411296844484, "test_acc": 0.5248, "lyapunov": null, "grad_norm": 0.41265591679124974, "grad_max_sv": 0.20524860061705114, "grad_min_sv": 7.563831366450003e-09, "grad_condition": 115790817.80184206, "lr": 6.184665997806817e-05, "time_sec": 32.568299770355225 }, { "epoch": 127, "train_loss": 0.15771708325862885, "train_acc": 0.95078, "test_loss": 2.962667014122009, "test_acc": 0.5409, "lyapunov": null, "grad_norm": 0.4075071230249109, "grad_max_sv": 0.20769537538290023, "grad_min_sv": 8.188405986597757e-09, "grad_condition": 380886928.1801485, "lr": 5.6898210384392595e-05, "time_sec": 32.57155394554138 }, { "epoch": 128, "train_loss": 0.15537331622004508, "train_acc": 0.95126, "test_loss": 2.9610030857086183, "test_acc": 0.5357, "lyapunov": null, "grad_norm": 0.4021889013709537, "grad_max_sv": 0.19925076719373463, "grad_min_sv": 7.527878987789033e-09, "grad_condition": 171791225.70681745, "lr": 5.214411988029363e-05, "time_sec": 32.58445978164673 }, { "epoch": 129, "train_loss": 0.15362726456165313, "train_acc": 0.9504, "test_loss": 3.0267199047088624, "test_acc": 0.5318, "lyapunov": null, "grad_norm": 0.40304342978976343, "grad_max_sv": 0.2073110181838274, "grad_min_sv": 7.651128650391566e-09, "grad_condition": 655223821.7012879, "lr": 4.7586473766990294e-05, "time_sec": 32.58788251876831 }, { "epoch": 130, "train_loss": 0.15159179414272309, "train_acc": 0.95296, "test_loss": 3.075101675415039, "test_acc": 0.5263, "lyapunov": null, "grad_norm": 0.3974054527380892, "grad_max_sv": 0.20575362853705884, "grad_min_sv": 7.740591648555672e-09, "grad_condition": 144759180.06870463, "lr": 4.32272711786996e-05, "time_sec": 32.578858613967896 }, { "epoch": 131, "train_loss": 0.1488430485343933, "train_acc": 0.95292, "test_loss": 2.9862019886016844, "test_acc": 0.5315, "lyapunov": null, "grad_norm": 0.3954060106149679, "grad_max_sv": 0.20766182690858842, "grad_min_sv": 7.58607175857344e-09, "grad_condition": 425579805.0794872, "lr": 3.906842420574966e-05, "time_sec": 32.586265325546265 }, { "epoch": 132, "train_loss": 0.14661406512260436, "train_acc": 0.95324, "test_loss": 3.057056298828125, "test_acc": 0.5262, "lyapunov": null, "grad_norm": 0.39095745142548216, "grad_max_sv": 0.19490535818040372, "grad_min_sv": 7.49121251628342e-09, "grad_condition": 3507301112.9708757, "lr": 3.5111757055874305e-05, "time_sec": 32.574090003967285 }, { "epoch": 133, "train_loss": 0.1463806065893173, "train_acc": 0.95318, "test_loss": 3.0613175567626953, "test_acc": 0.527, "lyapunov": null, "grad_norm": 0.3949318760097119, "grad_max_sv": 0.2000393845140934, "grad_min_sv": 7.511325199847929e-09, "grad_condition": 264016430.37942663, "lr": 3.1359005254054254e-05, "time_sec": 32.57793402671814 }, { "epoch": 134, "train_loss": 0.14586117388010025, "train_acc": 0.95352, "test_loss": 3.0277784969329833, "test_acc": 0.5333, "lyapunov": null, "grad_norm": 0.3915443650869973, "grad_max_sv": 0.20002376139163972, "grad_min_sv": 7.407051562673041e-09, "grad_condition": 1569872714.1138968, "lr": 2.7811814881259484e-05, "time_sec": 32.58327078819275 }, { "epoch": 135, "train_loss": 0.14679538232803344, "train_acc": 0.9531, "test_loss": 3.02330316696167, "test_acc": 0.5325, "lyapunov": null, "grad_norm": 0.39654447314663155, "grad_max_sv": 0.2064110331237316, "grad_min_sv": 8.009200439971707e-09, "grad_condition": 408075856.5604743, "lr": 2.4471741852423218e-05, "time_sec": 32.57164478302002 }, { "epoch": 136, "train_loss": 0.14213005175113677, "train_acc": 0.95606, "test_loss": 3.066131346511841, "test_acc": 0.5326, "lyapunov": null, "grad_norm": 0.386859099144263, "grad_max_sv": 0.20008183866739274, "grad_min_sv": 7.493826075335216e-09, "grad_condition": 1294487907.3292127, "lr": 2.1340251233966362e-05, "time_sec": 32.59002447128296 }, { "epoch": 137, "train_loss": 0.14528326896190644, "train_acc": 0.95314, "test_loss": 2.9820048439025877, "test_acc": 0.5384, "lyapunov": null, "grad_norm": 0.3940518150499405, "grad_max_sv": 0.20172332599759102, "grad_min_sv": 7.518978299708582e-09, "grad_condition": 2050951064.0374703, "lr": 1.8418716601170932e-05, "time_sec": 32.582863569259644 }, { "epoch": 138, "train_loss": 0.14290555841445923, "train_acc": 0.954, "test_loss": 2.9484275436401366, "test_acc": 0.5392, "lyapunov": null, "grad_norm": 0.3885095445150157, "grad_max_sv": 0.1956668719649315, "grad_min_sv": 7.481351363262425e-09, "grad_condition": 817168787.737042, "lr": 1.570841943568445e-05, "time_sec": 32.56788969039917 }, { "epoch": 139, "train_loss": 0.1455221847629547, "train_acc": 0.95376, "test_loss": 2.9918841510772705, "test_acc": 0.539, "lyapunov": null, "grad_norm": 0.39394584988421966, "grad_max_sv": 0.1982663732022047, "grad_min_sv": 7.502347731524073e-09, "grad_condition": 1796580822.5410652, "lr": 1.3210548563419845e-05, "time_sec": 32.57190442085266 }, { "epoch": 140, "train_loss": 0.1442144584083557, "train_acc": 0.95352, "test_loss": 2.970733211517334, "test_acc": 0.5376, "lyapunov": null, "grad_norm": 0.39260771988813964, "grad_max_sv": 0.19792755618691443, "grad_min_sv": 7.351794456978561e-09, "grad_condition": 208762115.79842368, "lr": 1.0926199633097203e-05, "time_sec": 32.58234429359436 }, { "epoch": 141, "train_loss": 0.1421483956861496, "train_acc": 0.95486, "test_loss": 2.9954518421173097, "test_acc": 0.5376, "lyapunov": null, "grad_norm": 0.3895044607831209, "grad_max_sv": 0.19535492211580277, "grad_min_sv": 7.2159212467261255e-09, "grad_condition": 226711442.0952455, "lr": 8.856374635655688e-06, "time_sec": 32.580827951431274 }, { "epoch": 142, "train_loss": 0.14344135119915008, "train_acc": 0.95412, "test_loss": 3.0175164573669435, "test_acc": 0.5347, "lyapunov": null, "grad_norm": 0.3912699552240718, "grad_max_sv": 0.20520108379423618, "grad_min_sv": 7.762914990688819e-09, "grad_condition": 387803307.69275963, "lr": 7.001981464747503e-06, "time_sec": 32.58955121040344 }, { "epoch": 143, "train_loss": 0.145557352809906, "train_acc": 0.95334, "test_loss": 2.9905672885894776, "test_acc": 0.5351, "lyapunov": null, "grad_norm": 0.3937145534468507, "grad_max_sv": 0.19824392758309842, "grad_min_sv": 7.470967854170812e-09, "grad_condition": 615993628.5132923, "lr": 5.3638335185058295e-06, "time_sec": 32.584557056427 }, { "epoch": 144, "train_loss": 0.13792892556190492, "train_acc": 0.9568, "test_loss": 3.0243384300231932, "test_acc": 0.5351, "lyapunov": null, "grad_norm": 0.38137874618156004, "grad_max_sv": 0.20396318212151526, "grad_min_sv": 7.759564610645975e-09, "grad_condition": 401781652.79968464, "lr": 3.942649342761114e-06, "time_sec": 32.58082866668701 }, { "epoch": 145, "train_loss": 0.14240989098906517, "train_acc": 0.95506, "test_loss": 3.008878281021118, "test_acc": 0.5332, "lyapunov": null, "grad_norm": 0.38824198485970274, "grad_max_sv": 0.1965224850922823, "grad_min_sv": 7.475432478099615e-09, "grad_condition": 547980005.9847585, "lr": 2.7390523158633524e-06, "time_sec": 32.580146074295044 }, { "epoch": 146, "train_loss": 0.14141309247016906, "train_acc": 0.95526, "test_loss": 2.9967607612609863, "test_acc": 0.5355, "lyapunov": null, "grad_norm": 0.3897738666220961, "grad_max_sv": 0.20576116181910037, "grad_min_sv": 7.723471491180578e-09, "grad_condition": 174968319.88759154, "lr": 1.7535703752478133e-06, "time_sec": 32.57999658584595 }, { "epoch": 147, "train_loss": 0.14116668840408325, "train_acc": 0.95622, "test_loss": 3.015700612258911, "test_acc": 0.5356, "lyapunov": null, "grad_norm": 0.38647682331651556, "grad_max_sv": 0.20005690585821867, "grad_min_sv": 7.458373789469112e-09, "grad_condition": 559134109.3457831, "lr": 9.866357858642196e-07, "time_sec": 32.57423949241638 }, { "epoch": 148, "train_loss": 0.13872075388908386, "train_acc": 0.95694, "test_loss": 3.02675003452301, "test_acc": 0.5311, "lyapunov": null, "grad_norm": 0.3834516001697345, "grad_max_sv": 0.20063496865332126, "grad_min_sv": 7.280352303873708e-09, "grad_condition": 342935155.3336584, "lr": 4.38584950570808e-07, "time_sec": 32.59147930145264 }, { "epoch": 149, "train_loss": 0.14044044229030608, "train_acc": 0.9558, "test_loss": 3.0015827127456665, "test_acc": 0.537, "lyapunov": null, "grad_norm": 0.38662537604202735, "grad_max_sv": 0.1903643485158682, "grad_min_sv": 7.2725075060480446e-09, "grad_condition": 1114748941.7660475, "lr": 1.096582625772501e-07, "time_sec": 32.56627154350281 }, { "epoch": 150, "train_loss": 0.14047483313083647, "train_acc": 0.95586, "test_loss": 3.1137742416381835, "test_acc": 0.5222, "lyapunov": null, "grad_norm": 0.38553295960146916, "grad_max_sv": 0.2001470748335123, "grad_min_sv": 7.337464655082695e-09, "grad_condition": 1377858482.3116786, "lr": 0.0, "time_sec": 32.586660385131836 } ], "12": [ { "epoch": 1, "train_loss": 4.87748296585083, "train_acc": 0.0306, "test_loss": 4.82872876663208, "test_acc": 0.0165, "lyapunov": null, "grad_norm": 5.932964620640208, "grad_max_sv": 5.34441111087799, "grad_min_sv": 9.95076935739192e-08, "grad_condition": 162613846.39082906, "lr": 0.0009998903417374227, "time_sec": 49.64781618118286 }, { "epoch": 2, "train_loss": 4.325910377655029, "train_acc": 0.05894, "test_loss": 4.736625276947022, "test_acc": 0.0233, "lyapunov": null, "grad_norm": 4.434671975936239, "grad_max_sv": 3.9236845791339876, "grad_min_sv": 7.506598741907622e-08, "grad_condition": 326618949.3555427, "lr": 0.0009995614150494292, "time_sec": 49.66104316711426 }, { "epoch": 3, "train_loss": 4.033521332244873, "train_acc": 0.08816, "test_loss": 4.546054625701904, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 3.5972867305140204, "grad_max_sv": 3.0456687450408935, "grad_min_sv": 6.285284603370356e-08, "grad_condition": 641155242.0675491, "lr": 0.0009990133642141358, "time_sec": 49.67153525352478 }, { "epoch": 4, "train_loss": 3.8378815770721437, "train_acc": 0.11312, "test_loss": 4.485385893249512, "test_acc": 0.0421, "lyapunov": null, "grad_norm": 3.005868245561951, "grad_max_sv": 2.4899374902248383, "grad_min_sv": 5.274935636068179e-08, "grad_condition": 56291013.628438115, "lr": 0.0009982464296247522, "time_sec": 49.65495419502258 }, { "epoch": 5, "train_loss": 3.6790373979949953, "train_acc": 0.1354, "test_loss": 4.809463809204102, "test_acc": 0.0483, "lyapunov": null, "grad_norm": 2.481791347519261, "grad_max_sv": 1.911762249469757, "grad_min_sv": 4.251578253344768e-08, "grad_condition": 59447447.39549043, "lr": 0.0009972609476841367, "time_sec": 49.609050989151 }, { "epoch": 6, "train_loss": 3.5471466955566404, "train_acc": 0.1563, "test_loss": 4.763859475708008, "test_acc": 0.0562, "lyapunov": null, "grad_norm": 2.0531107778434636, "grad_max_sv": 1.4932055324316025, "grad_min_sv": 3.614347272584695e-08, "grad_condition": 45442606.51570525, "lr": 0.000996057350657239, "time_sec": 49.593199491500854 }, { "epoch": 7, "train_loss": 3.4418113514709474, "train_acc": 0.17478, "test_loss": 4.615470837402344, "test_acc": 0.061, "lyapunov": null, "grad_norm": 1.7367000738812381, "grad_max_sv": 1.1847797572612762, "grad_min_sv": 3.088092909442341e-08, "grad_condition": 65255140.867708586, "lr": 0.000994636166481494, "time_sec": 49.60785531997681 }, { "epoch": 8, "train_loss": 3.354895782546997, "train_acc": 0.18784, "test_loss": 5.2386075889587405, "test_acc": 0.0585, "lyapunov": null, "grad_norm": 1.5335851977180728, "grad_max_sv": 0.9428193107247352, "grad_min_sv": 2.6885542893373415e-08, "grad_condition": 75909476.50814043, "lr": 0.0009929980185352525, "time_sec": 49.60816526412964 }, { "epoch": 9, "train_loss": 3.2788688597869875, "train_acc": 0.20466, "test_loss": 5.2327860107421875, "test_acc": 0.0714, "lyapunov": null, "grad_norm": 1.374914600034168, "grad_max_sv": 0.7664340496063232, "grad_min_sv": 2.4066519885290737e-08, "grad_condition": 51969313.05697616, "lr": 0.0009911436253643444, "time_sec": 49.62115836143494 }, { "epoch": 10, "train_loss": 3.214320725250244, "train_acc": 0.21478, "test_loss": 5.367890010070801, "test_acc": 0.0635, "lyapunov": null, "grad_norm": 1.2723756047607861, "grad_max_sv": 0.6678376257419586, "grad_min_sv": 2.3140357913176147e-08, "grad_condition": 33781734.36143675, "lr": 0.0009890738003669028, "time_sec": 49.653478384017944 }, { "epoch": 11, "train_loss": 3.157560857696533, "train_acc": 0.22716, "test_loss": 4.9893413871765135, "test_acc": 0.0793, "lyapunov": null, "grad_norm": 1.1804196554033854, "grad_max_sv": 0.5599115259945393, "grad_min_sv": 2.0999575375824088e-08, "grad_condition": 40003653.553005375, "lr": 0.00098678945143658, "time_sec": 49.64659833908081 }, { "epoch": 12, "train_loss": 3.10919125541687, "train_acc": 0.23374, "test_loss": 5.922018681335449, "test_acc": 0.0572, "lyapunov": null, "grad_norm": 1.1127516543729237, "grad_max_sv": 0.5103657670319081, "grad_min_sv": 2.0326233945988648e-08, "grad_condition": 31959597.02886455, "lr": 0.0009842915805643154, "time_sec": 49.6422758102417 }, { "epoch": 13, "train_loss": 3.0661709033203124, "train_acc": 0.24498, "test_loss": 5.5857378784179685, "test_acc": 0.0641, "lyapunov": null, "grad_norm": 1.0572945850355566, "grad_max_sv": 0.468644580245018, "grad_min_sv": 1.9489185115739716e-08, "grad_condition": 28974309.240684826, "lr": 0.000981581283398829, "time_sec": 49.644200801849365 }, { "epoch": 14, "train_loss": 3.031631886138916, "train_acc": 0.2494, "test_loss": 6.1126462295532225, "test_acc": 0.0622, "lyapunov": null, "grad_norm": 1.0078886975437553, "grad_max_sv": 0.4199274107813835, "grad_min_sv": 1.78886194669714e-08, "grad_condition": 58726821.90857921, "lr": 0.0009786597487660333, "time_sec": 49.64050054550171 }, { "epoch": 15, "train_loss": 2.9854307820892334, "train_acc": 0.25912, "test_loss": 6.682256416320801, "test_acc": 0.0577, "lyapunov": null, "grad_norm": 0.9661185163428607, "grad_max_sv": 0.4044369950890541, "grad_min_sv": 1.7625257230091673e-08, "grad_condition": 47054066.77256496, "lr": 0.0009755282581475766, "time_sec": 49.64783048629761 }, { "epoch": 16, "train_loss": 2.950966311187744, "train_acc": 0.26442, "test_loss": 6.452827975463867, "test_acc": 0.0549, "lyapunov": null, "grad_norm": 0.9327205202160699, "grad_max_sv": 0.38560108840465546, "grad_min_sv": 1.7282875616189337e-08, "grad_condition": 314726395.9437877, "lr": 0.0009721881851187403, "time_sec": 49.64088153839111 }, { "epoch": 17, "train_loss": 2.916735321044922, "train_acc": 0.27246, "test_loss": 6.896680711364746, "test_acc": 0.0438, "lyapunov": null, "grad_norm": 0.8945744514519771, "grad_max_sv": 0.354119461029768, "grad_min_sv": 1.643565590847551e-08, "grad_condition": 26255983.39074681, "lr": 0.0009686409947459456, "time_sec": 49.627718448638916 }, { "epoch": 18, "train_loss": 2.8857511570739747, "train_acc": 0.27974, "test_loss": 5.6459962882995605, "test_acc": 0.0503, "lyapunov": null, "grad_norm": 0.8793484279442325, "grad_max_sv": 0.35779951736330984, "grad_min_sv": 1.628617940785393e-08, "grad_condition": 111551423.90357837, "lr": 0.0009648882429441254, "time_sec": 49.611419677734375 }, { "epoch": 19, "train_loss": 2.850851222381592, "train_acc": 0.28394, "test_loss": 6.184397215270996, "test_acc": 0.0477, "lyapunov": null, "grad_norm": 0.8560875588234809, "grad_max_sv": 0.3290360912680626, "grad_min_sv": 1.5741092075638452e-08, "grad_condition": 33852379.436212204, "lr": 0.00096093157579425, "time_sec": 49.60723423957825 }, { "epoch": 20, "train_loss": 2.8297593169403075, "train_acc": 0.2865, "test_loss": 6.550658810424805, "test_acc": 0.052, "lyapunov": null, "grad_norm": 0.8484343768951315, "grad_max_sv": 0.3310988314449787, "grad_min_sv": 1.579570341747605e-08, "grad_condition": 26630780.62742402, "lr": 0.0009567727288213001, "time_sec": 49.63738775253296 }, { "epoch": 21, "train_loss": 2.8062883308410647, "train_acc": 0.29554, "test_loss": 6.611366340637207, "test_acc": 0.0425, "lyapunov": null, "grad_norm": 0.8271444897566678, "grad_max_sv": 0.31499212570488455, "grad_min_sv": 1.5104316366393312e-08, "grad_condition": 56385885.9009584, "lr": 0.0009524135262330095, "time_sec": 49.624245405197144 }, { "epoch": 22, "train_loss": 2.7797841816711424, "train_acc": 0.29848, "test_loss": 5.2575527236938475, "test_acc": 0.0689, "lyapunov": null, "grad_norm": 0.8192773127159139, "grad_max_sv": 0.3165230479091406, "grad_min_sv": 1.5343957029956278e-08, "grad_condition": 28932546.565699626, "lr": 0.0009478558801197061, "time_sec": 49.6358916759491 }, { "epoch": 23, "train_loss": 2.758929995956421, "train_acc": 0.30298, "test_loss": 5.9057046417236325, "test_acc": 0.0483, "lyapunov": null, "grad_norm": 0.7977853555521689, "grad_max_sv": 0.2981082580983639, "grad_min_sv": 1.4607530535171166e-08, "grad_condition": 23062158.33463922, "lr": 0.000943101789615607, "time_sec": 49.64936828613281 }, { "epoch": 24, "train_loss": 2.7243907251739503, "train_acc": 0.30978, "test_loss": 6.879129153442383, "test_acc": 0.0503, "lyapunov": null, "grad_norm": 0.785562618961601, "grad_max_sv": 0.3072618875652552, "grad_min_sv": 1.4546391063907649e-08, "grad_condition": 26103951.701446574, "lr": 0.0009381533400219313, "time_sec": 49.654170513153076 }, { "epoch": 25, "train_loss": 2.7052862129211426, "train_acc": 0.31438, "test_loss": 7.123418940734863, "test_acc": 0.0498, "lyapunov": null, "grad_norm": 0.7800832079587465, "grad_max_sv": 0.28868941627442835, "grad_min_sv": 1.4423146366127071e-08, "grad_condition": 25468875.32253523, "lr": 0.0009330127018922189, "time_sec": 49.644099712371826 }, { "epoch": 26, "train_loss": 2.6786952052307127, "train_acc": 0.31786, "test_loss": 6.8779948043823245, "test_acc": 0.04, "lyapunov": null, "grad_norm": 0.7660717213990589, "grad_max_sv": 0.28445089757442477, "grad_min_sv": 1.4051416873800404e-08, "grad_condition": 157008558.44244316, "lr": 0.000927682130080253, "time_sec": 49.6546745300293 }, { "epoch": 27, "train_loss": 2.650107885437012, "train_acc": 0.3233, "test_loss": 6.409167988586426, "test_acc": 0.0663, "lyapunov": null, "grad_norm": 0.7553219053413048, "grad_max_sv": 0.2734900705516338, "grad_min_sv": 1.3975185350623143e-08, "grad_condition": 26675374.92153287, "lr": 0.0009221639627510072, "time_sec": 49.651949882507324 }, { "epoch": 28, "train_loss": 2.6323010539245604, "train_acc": 0.32642, "test_loss": 6.348737354278565, "test_acc": 0.0767, "lyapunov": null, "grad_norm": 0.7542460840346141, "grad_max_sv": 0.28178194239735604, "grad_min_sv": 1.4111558673673974e-08, "grad_condition": 153191030.94962814, "lr": 0.0009164606203550494, "time_sec": 49.657703161239624 }, { "epoch": 29, "train_loss": 2.622528738861084, "train_acc": 0.33052, "test_loss": 5.323012785339356, "test_acc": 0.0615, "lyapunov": null, "grad_norm": 0.7434329600183185, "grad_max_sv": 0.28229105696082113, "grad_min_sv": 1.3741382927194567e-08, "grad_condition": 99920561.24148658, "lr": 0.0009105746045668516, "time_sec": 49.640869140625 }, { "epoch": 30, "train_loss": 2.589859499359131, "train_acc": 0.3361, "test_loss": 5.348752153015137, "test_acc": 0.0806, "lyapunov": null, "grad_norm": 0.7401188593705409, "grad_max_sv": 0.2747684422880411, "grad_min_sv": 1.3880728885751203e-08, "grad_condition": 23324413.51449412, "lr": 0.0009045084971874733, "time_sec": 49.62320137023926 }, { "epoch": 31, "train_loss": 2.574071376495361, "train_acc": 0.33836, "test_loss": 4.929797785949707, "test_acc": 0.0696, "lyapunov": null, "grad_norm": 0.7328550694976608, "grad_max_sv": 0.27694769613444803, "grad_min_sv": 1.3843863291840286e-08, "grad_condition": 27250825.622907154, "lr": 0.0008982649590120977, "time_sec": 49.61762976646423 }, { "epoch": 32, "train_loss": 2.5636251927185056, "train_acc": 0.33996, "test_loss": 4.977822930908203, "test_acc": 0.0603, "lyapunov": null, "grad_norm": 0.72578993407064, "grad_max_sv": 0.26916658468544485, "grad_min_sv": 1.3664173616201313e-08, "grad_condition": 37586474.04914663, "lr": 0.0008918467286629196, "time_sec": 49.59874439239502 }, { "epoch": 33, "train_loss": 2.534274593658447, "train_acc": 0.34576, "test_loss": 5.612884985351562, "test_acc": 0.0648, "lyapunov": null, "grad_norm": 0.7195677912828391, "grad_max_sv": 0.2578020472079515, "grad_min_sv": 1.3214893858359833e-08, "grad_condition": 31599310.228798192, "lr": 0.0008852566213878943, "time_sec": 49.60587477684021 }, { "epoch": 34, "train_loss": 2.5204806367492676, "train_acc": 0.34968, "test_loss": 5.823319554901123, "test_acc": 0.0571, "lyapunov": null, "grad_norm": 0.7058229239582122, "grad_max_sv": 0.2517259892076254, "grad_min_sv": 1.3128194935319027e-08, "grad_condition": 38016748.40510639, "lr": 0.000878497527825878, "time_sec": 49.63596320152283 }, { "epoch": 35, "train_loss": 2.4967036684417723, "train_acc": 0.35386, "test_loss": 5.568839009094238, "test_acc": 0.0655, "lyapunov": null, "grad_norm": 0.7071521329332581, "grad_max_sv": 0.2598913241177797, "grad_min_sv": 1.3420283057063997e-08, "grad_condition": 21475756.171551444, "lr": 0.000871572412738697, "time_sec": 49.64343976974487 }, { "epoch": 36, "train_loss": 2.483395898208618, "train_acc": 0.356, "test_loss": 5.925778231811523, "test_acc": 0.0775, "lyapunov": null, "grad_norm": 0.7019030587227678, "grad_max_sv": 0.2620332419872284, "grad_min_sv": 1.330909059973906e-08, "grad_condition": 39143745.76315293, "lr": 0.0008644843137107055, "time_sec": 49.633464097976685 }, { "epoch": 37, "train_loss": 2.455888598480225, "train_acc": 0.3619, "test_loss": 5.800891122436523, "test_acc": 0.0522, "lyapunov": null, "grad_norm": 0.7041203727881495, "grad_max_sv": 0.25247339606285096, "grad_min_sv": 1.317027563119133e-08, "grad_condition": 25971636.862640023, "lr": 0.0008572363398164014, "time_sec": 49.641075134277344 }, { "epoch": 38, "train_loss": 2.444258794937134, "train_acc": 0.3643, "test_loss": 6.3827191253662106, "test_acc": 0.0512, "lyapunov": null, "grad_norm": 0.6991868964165402, "grad_max_sv": 0.2449926756322384, "grad_min_sv": 1.2983126976284787e-08, "grad_condition": 22727640.443126805, "lr": 0.0008498316702566826, "time_sec": 49.6653778553009 }, { "epoch": 39, "train_loss": 2.427623992614746, "train_acc": 0.36718, "test_loss": 5.836345671081543, "test_acc": 0.0532, "lyapunov": null, "grad_norm": 0.6944654131754266, "grad_max_sv": 0.24421218782663345, "grad_min_sv": 1.2779784830385666e-08, "grad_condition": 26159365.26096248, "lr": 0.0008422735529643442, "time_sec": 49.65552568435669 }, { "epoch": 40, "train_loss": 2.4149912483215332, "train_acc": 0.36854, "test_loss": 5.969065676879882, "test_acc": 0.0689, "lyapunov": null, "grad_norm": 0.6869986110904911, "grad_max_sv": 0.23399859815835952, "grad_min_sv": 1.2716373970489415e-08, "grad_condition": 21923336.447286993, "lr": 0.0008345653031794289, "time_sec": 49.66923117637634 }, { "epoch": 41, "train_loss": 2.386474126663208, "train_acc": 0.37558, "test_loss": 6.019966047668457, "test_acc": 0.0579, "lyapunov": null, "grad_norm": 0.68492309888036, "grad_max_sv": 0.2508115164935589, "grad_min_sv": 1.3077304128472633e-08, "grad_condition": 23198341.25841063, "lr": 0.0008267103019950526, "time_sec": 49.620418071746826 }, { "epoch": 42, "train_loss": 2.3729596766662597, "train_acc": 0.38002, "test_loss": 6.315153423309326, "test_acc": 0.0611, "lyapunov": null, "grad_norm": 0.6839063548904902, "grad_max_sv": 0.24613724276423454, "grad_min_sv": 1.2924071682296479e-08, "grad_condition": 24553794.967906404, "lr": 0.0008187119948743447, "time_sec": 49.66134309768677 }, { "epoch": 43, "train_loss": 2.3540061936950685, "train_acc": 0.38038, "test_loss": 6.8890972946166995, "test_acc": 0.052, "lyapunov": null, "grad_norm": 0.6797404469786038, "grad_max_sv": 0.23774098604917526, "grad_min_sv": 1.269067942399893e-08, "grad_condition": 36055931.35688925, "lr": 0.000810573890139155, "time_sec": 49.60659217834473 }, { "epoch": 44, "train_loss": 2.3270812229919433, "train_acc": 0.38584, "test_loss": 6.7161765426635744, "test_acc": 0.0423, "lyapunov": null, "grad_norm": 0.6759173721688353, "grad_max_sv": 0.24107158593833447, "grad_min_sv": 1.2535652725575997e-08, "grad_condition": 27534242.15084389, "lr": 0.0008022995574311873, "time_sec": 49.602726459503174 }, { "epoch": 45, "train_loss": 2.3246476860046386, "train_acc": 0.39008, "test_loss": 6.29091294631958, "test_acc": 0.0518, "lyapunov": null, "grad_norm": 0.6715272373280456, "grad_max_sv": 0.23545034006237983, "grad_min_sv": 1.2545344027503624e-08, "grad_condition": 21225788.36034053, "lr": 0.0007938926261462363, "time_sec": 49.6089346408844 }, { "epoch": 46, "train_loss": 2.302794339752197, "train_acc": 0.3932, "test_loss": 6.331070534515381, "test_acc": 0.0457, "lyapunov": null, "grad_norm": 0.6695288339948315, "grad_max_sv": 0.2387615241110325, "grad_min_sv": 1.267214993216914e-08, "grad_condition": 21439809.063333027, "lr": 0.0007853567838422158, "time_sec": 49.6616952419281 }, { "epoch": 47, "train_loss": 2.2937580155944826, "train_acc": 0.39494, "test_loss": 6.747457525634766, "test_acc": 0.0403, "lyapunov": null, "grad_norm": 0.6703150590025013, "grad_max_sv": 0.23008973710238934, "grad_min_sv": 1.243687924035175e-08, "grad_condition": 21332244.897804268, "lr": 0.0007766957746216719, "time_sec": 49.64005661010742 }, { "epoch": 48, "train_loss": 2.271936141662598, "train_acc": 0.40028, "test_loss": 8.364392227172852, "test_acc": 0.045, "lyapunov": null, "grad_norm": 0.6688819126115724, "grad_max_sv": 0.23257951848208905, "grad_min_sv": 1.2320799760989764e-08, "grad_condition": 43562236.54403031, "lr": 0.0007679133974894982, "time_sec": 49.66763877868652 }, { "epoch": 49, "train_loss": 2.2604706730651856, "train_acc": 0.40228, "test_loss": 6.142012088012695, "test_acc": 0.0648, "lyapunov": null, "grad_norm": 0.6643101794178548, "grad_max_sv": 0.2336978729814291, "grad_min_sv": 1.2540253756243568e-08, "grad_condition": 33614084.08040741, "lr": 0.000759013504686565, "time_sec": 49.65048050880432 }, { "epoch": 50, "train_loss": 2.238395141143799, "train_acc": 0.40952, "test_loss": 7.636728004455566, "test_acc": 0.0642, "lyapunov": null, "grad_norm": 0.6646450225062208, "grad_max_sv": 0.23055841773748398, "grad_min_sv": 1.2360750140105737e-08, "grad_condition": 29243478.728895236, "lr": 0.0007499999999999998, "time_sec": 49.64303922653198 }, { "epoch": 51, "train_loss": 2.22945908203125, "train_acc": 0.40844, "test_loss": 6.013677481079101, "test_acc": 0.0746, "lyapunov": null, "grad_norm": 0.6654733307343168, "grad_max_sv": 0.23596662729978563, "grad_min_sv": 1.2487093845048314e-08, "grad_condition": 24754111.81759522, "lr": 0.0007408768370508575, "time_sec": 49.64409947395325 }, { "epoch": 52, "train_loss": 2.2170784504699705, "train_acc": 0.40908, "test_loss": 6.157418632507325, "test_acc": 0.0702, "lyapunov": null, "grad_norm": 0.6594175681266546, "grad_max_sv": 0.2355981681495905, "grad_min_sv": 1.236185071251672e-08, "grad_condition": 25757058.499904532, "lr": 0.0007316480175599307, "time_sec": 49.636614084243774 }, { "epoch": 53, "train_loss": 2.1939515002059937, "train_acc": 0.41558, "test_loss": 6.859078231048584, "test_acc": 0.0569, "lyapunov": null, "grad_norm": 0.662946169812431, "grad_max_sv": 0.23508151918649672, "grad_min_sv": 1.2330145124361813e-08, "grad_condition": 32594540.125570327, "lr": 0.0007223175895924635, "time_sec": 49.70306444168091 }, { "epoch": 54, "train_loss": 2.1878874357604983, "train_acc": 0.41686, "test_loss": 6.514185330963135, "test_acc": 0.0579, "lyapunov": null, "grad_norm": 0.6592013207620988, "grad_max_sv": 0.23284565843641758, "grad_min_sv": 1.246490098361086e-08, "grad_condition": 21669360.08749289, "lr": 0.0007128896457825361, "time_sec": 49.62425947189331 }, { "epoch": 55, "train_loss": 2.1700433895111084, "train_acc": 0.42082, "test_loss": 7.349776064300537, "test_acc": 0.0557, "lyapunov": null, "grad_norm": 0.6591415320918335, "grad_max_sv": 0.23167332261800766, "grad_min_sv": 1.2205207861396006e-08, "grad_condition": 238494592.31476593, "lr": 0.0007033683215378998, "time_sec": 49.62825536727905 }, { "epoch": 56, "train_loss": 2.153282830657959, "train_acc": 0.4221, "test_loss": 6.606533212280273, "test_acc": 0.0616, "lyapunov": null, "grad_norm": 0.6581126496222481, "grad_max_sv": 0.22157299481332302, "grad_min_sv": 1.218345958564626e-08, "grad_condition": 21160581.40499527, "lr": 0.0006937577932260512, "time_sec": 49.614638328552246 }, { "epoch": 57, "train_loss": 2.1483337621307372, "train_acc": 0.42194, "test_loss": 8.756062689208985, "test_acc": 0.0525, "lyapunov": null, "grad_norm": 0.655149621093074, "grad_max_sv": 0.23063393794000148, "grad_min_sv": 1.2325510248545334e-08, "grad_condition": 32561576.294376243, "lr": 0.0006840622763423388, "time_sec": 49.604514598846436 }, { "epoch": 58, "train_loss": 2.13039572971344, "train_acc": 0.428, "test_loss": 6.102099295043946, "test_acc": 0.077, "lyapunov": null, "grad_norm": 0.6579204722244499, "grad_max_sv": 0.22870929054915906, "grad_min_sv": 1.2437226873385221e-08, "grad_condition": 29029893.441014826, "lr": 0.0006742860236609073, "time_sec": 49.63142991065979 }, { "epoch": 59, "train_loss": 2.1072697998809815, "train_acc": 0.4333, "test_loss": 6.253016600799561, "test_acc": 0.0479, "lyapunov": null, "grad_norm": 0.6541760692934044, "grad_max_sv": 0.22985584288835526, "grad_min_sv": 1.2442094027981244e-08, "grad_condition": 231036397.09788594, "lr": 0.0006644333233692913, "time_sec": 49.64534831047058 }, { "epoch": 60, "train_loss": 2.1020205306243898, "train_acc": 0.43472, "test_loss": 5.772405567932129, "test_acc": 0.0592, "lyapunov": null, "grad_norm": 0.6527505369999154, "grad_max_sv": 0.22004029378294945, "grad_min_sv": 1.217291406285792e-08, "grad_condition": 24874942.26037088, "lr": 0.0006545084971874734, "time_sec": 49.647597312927246 }, { "epoch": 61, "train_loss": 2.0730964871215822, "train_acc": 0.4414, "test_loss": 7.9832359893798825, "test_acc": 0.0641, "lyapunov": null, "grad_norm": 0.6546297418175855, "grad_max_sv": 0.223886064812541, "grad_min_sv": 1.2451116643275028e-08, "grad_condition": 22916995.636865757, "lr": 0.0006445158984722354, "time_sec": 49.65083956718445 }, { "epoch": 62, "train_loss": 2.062996348876953, "train_acc": 0.4436, "test_loss": 7.34946787109375, "test_acc": 0.044, "lyapunov": null, "grad_norm": 0.6483177973397803, "grad_max_sv": 0.22704768665134906, "grad_min_sv": 1.20682398005445e-08, "grad_condition": 38390561.96495845, "lr": 0.0006344599103076324, "time_sec": 49.65266275405884 }, { "epoch": 63, "train_loss": 2.0523825840759278, "train_acc": 0.44564, "test_loss": 8.959309451293946, "test_acc": 0.0413, "lyapunov": null, "grad_norm": 0.6488732278425234, "grad_max_sv": 0.22664117477834225, "grad_min_sv": 1.2159747242446172e-08, "grad_condition": 31006507.26126058, "lr": 0.0006243449435824269, "time_sec": 49.65293788909912 }, { "epoch": 64, "train_loss": 2.0479974696350096, "train_acc": 0.44714, "test_loss": 8.05115908203125, "test_acc": 0.0537, "lyapunov": null, "grad_norm": 0.6455494446410326, "grad_max_sv": 0.2193945564329624, "grad_min_sv": 1.2038907266117942e-08, "grad_condition": 901694346.4545784, "lr": 0.0006141754350553275, "time_sec": 49.64103627204895 }, { "epoch": 65, "train_loss": 2.027272645950317, "train_acc": 0.45036, "test_loss": 8.782285342407226, "test_acc": 0.0554, "lyapunov": null, "grad_norm": 0.6482083158352888, "grad_max_sv": 0.2296803079545498, "grad_min_sv": 1.2045603877547384e-08, "grad_condition": 44744302.33572485, "lr": 0.0006039558454088793, "time_sec": 49.62383842468262 }, { "epoch": 66, "train_loss": 2.012310220794678, "train_acc": 0.4561, "test_loss": 8.360753945922852, "test_acc": 0.0486, "lyapunov": null, "grad_norm": 0.6486341651257033, "grad_max_sv": 0.21999806091189383, "grad_min_sv": 1.2103176813549332e-08, "grad_condition": 25365047.453725625, "lr": 0.000593690657292862, "time_sec": 49.620052099227905 }, { "epoch": 67, "train_loss": 2.2251435960388184, "train_acc": 0.43342, "test_loss": 4.351189101409912, "test_acc": 0.0583, "lyapunov": null, "grad_norm": 0.6822841692183329, "grad_max_sv": 0.23429610803723336, "grad_min_sv": 1.2533971320831828e-08, "grad_condition": 620776564.7686789, "lr": 0.0005833843733580507, "time_sec": 49.6039252281189 }, { "epoch": 68, "train_loss": 3.644752220916748, "train_acc": 0.14882, "test_loss": 4.446993719482422, "test_acc": 0.1036, "lyapunov": null, "grad_norm": 0.5322357731359522, "grad_max_sv": 0.1740941284224391, "grad_min_sv": 9.981525750379916e-09, "grad_condition": 19772886.771588072, "lr": 0.0005730415142812054, "time_sec": 49.6299045085907 }, { "epoch": 69, "train_loss": 3.1906630830383302, "train_acc": 0.22138, "test_loss": 4.447753040695191, "test_acc": 0.1086, "lyapunov": null, "grad_norm": 0.5849582495428348, "grad_max_sv": 0.19428364057093858, "grad_min_sv": 1.0978856412879878e-08, "grad_condition": 20893419.13528825, "lr": 0.0005626666167821517, "time_sec": 49.62305164337158 }, { "epoch": 70, "train_loss": 2.9685875498962404, "train_acc": 0.26182, "test_loss": 5.079945266723633, "test_acc": 0.1082, "lyapunov": null, "grad_norm": 0.5988082474018407, "grad_max_sv": 0.20677474029362203, "grad_min_sv": 1.1152884460408074e-08, "grad_condition": 28125873.10543083, "lr": 0.0005522642316338265, "time_sec": 49.63573360443115 }, { "epoch": 71, "train_loss": 2.8187981507110598, "train_acc": 0.29056, "test_loss": 5.128676221466065, "test_acc": 0.1097, "lyapunov": null, "grad_norm": 0.6073589396586558, "grad_max_sv": 0.19603765942156315, "grad_min_sv": 1.1142021388854673e-08, "grad_condition": 23682104.838631887, "lr": 0.0005418389216661573, "time_sec": 49.65342855453491 }, { "epoch": 72, "train_loss": 2.7264524671173094, "train_acc": 0.30584, "test_loss": 4.905041383361817, "test_acc": 0.1255, "lyapunov": null, "grad_norm": 0.6147190521685049, "grad_max_sv": 0.20450513996183872, "grad_min_sv": 1.1536205649087527e-08, "grad_condition": 28562481.748963058, "lr": 0.0005313952597646563, "time_sec": 49.65431094169617 }, { "epoch": 73, "train_loss": 2.6403448142242434, "train_acc": 0.32094, "test_loss": 5.800853311538696, "test_acc": 0.107, "lyapunov": null, "grad_norm": 0.6247716864218055, "grad_max_sv": 0.21473125889897346, "grad_min_sv": 1.1889953104027295e-08, "grad_condition": 65722876.53475368, "lr": 0.0005209378268645994, "time_sec": 49.64467167854309 }, { "epoch": 74, "train_loss": 2.5647068825531005, "train_acc": 0.33604, "test_loss": 6.016946387481689, "test_acc": 0.1108, "lyapunov": null, "grad_norm": 0.6262187013652493, "grad_max_sv": 0.21014209054410457, "grad_min_sv": 1.1593367979512159e-08, "grad_condition": 23978185.39414488, "lr": 0.0005104712099416781, "time_sec": 49.635523080825806 }, { "epoch": 75, "train_loss": 2.5212148859405517, "train_acc": 0.34632, "test_loss": 6.316108853149414, "test_acc": 0.1027, "lyapunov": null, "grad_norm": 0.6347754908556336, "grad_max_sv": 0.21141788363456726, "grad_min_sv": 1.179611141682857e-08, "grad_condition": 33522616.12577144, "lr": 0.0004999999999999996, "time_sec": 49.63302993774414 }, { "epoch": 76, "train_loss": 2.470890021209717, "train_acc": 0.35636, "test_loss": 6.3965694896698, "test_acc": 0.106, "lyapunov": null, "grad_norm": 0.6330916660078362, "grad_max_sv": 0.21149154454469682, "grad_min_sv": 1.186264902419687e-08, "grad_condition": 78784632.22578731, "lr": 0.0004895287900583212, "time_sec": 49.637208223342896 }, { "epoch": 77, "train_loss": 2.421552244262695, "train_acc": 0.36788, "test_loss": 6.69319435043335, "test_acc": 0.1017, "lyapunov": null, "grad_norm": 0.634293677395214, "grad_max_sv": 0.2066604733467102, "grad_min_sv": 1.1785100880942756e-08, "grad_condition": 59189077.883828625, "lr": 0.0004790621731353997, "time_sec": 49.63215613365173 }, { "epoch": 78, "train_loss": 2.3847443492126463, "train_acc": 0.37546, "test_loss": 7.132302479934692, "test_acc": 0.0943, "lyapunov": null, "grad_norm": 0.6382190364657672, "grad_max_sv": 0.20905729271471502, "grad_min_sv": 1.1757649508170598e-08, "grad_condition": 26167748.83618117, "lr": 0.000468604740235343, "time_sec": 49.61492323875427 }, { "epoch": 79, "train_loss": 2.3435024488830565, "train_acc": 0.38554, "test_loss": 7.740195120239258, "test_acc": 0.0916, "lyapunov": null, "grad_norm": 0.6365390593800095, "grad_max_sv": 0.214980835467577, "grad_min_sv": 1.20849943802126e-08, "grad_condition": 26878255.479230188, "lr": 0.00045816107833384175, "time_sec": 49.625444412231445 }, { "epoch": 80, "train_loss": 2.3083001178741456, "train_acc": 0.39014, "test_loss": 6.61783053894043, "test_acc": 0.1104, "lyapunov": null, "grad_norm": 0.6406625014101909, "grad_max_sv": 0.21362034603953362, "grad_min_sv": 1.2048267306052906e-08, "grad_condition": 20392384.690080393, "lr": 0.0004477357683661729, "time_sec": 49.60279703140259 }, { "epoch": 81, "train_loss": 2.2839368876647947, "train_acc": 0.39676, "test_loss": 6.873206716918945, "test_acc": 0.1118, "lyapunov": null, "grad_norm": 0.640888071388829, "grad_max_sv": 0.21525344289839268, "grad_min_sv": 1.1972712192151457e-08, "grad_condition": 50063258.30804229, "lr": 0.00043733338321784746, "time_sec": 49.61454939842224 }, { "epoch": 82, "train_loss": 2.256084364776611, "train_acc": 0.40168, "test_loss": 8.169263735961914, "test_acc": 0.0948, "lyapunov": null, "grad_norm": 0.6434003244484818, "grad_max_sv": 0.21655187159776687, "grad_min_sv": 1.23490741438248e-08, "grad_condition": 21577781.507507768, "lr": 0.0004269584857187939, "time_sec": 49.62588882446289 }, { "epoch": 83, "train_loss": 2.2249307306671144, "train_acc": 0.40856, "test_loss": 7.893931579589844, "test_acc": 0.1041, "lyapunov": null, "grad_norm": 0.6443153342631529, "grad_max_sv": 0.2138610877096653, "grad_min_sv": 1.1779399097799904e-08, "grad_condition": 37321529.4476779, "lr": 0.0004166156266419484, "time_sec": 49.63660502433777 }, { "epoch": 84, "train_loss": 2.208123627166748, "train_acc": 0.4104, "test_loss": 7.499340794372559, "test_acc": 0.104, "lyapunov": null, "grad_norm": 0.6478863121733859, "grad_max_sv": 0.21281871050596238, "grad_min_sv": 1.2020403913903798e-08, "grad_condition": 28996288.04674848, "lr": 0.0004063093427071373, "time_sec": 49.6533477306366 }, { "epoch": 85, "train_loss": 2.187458460845947, "train_acc": 0.41414, "test_loss": 7.118385442352295, "test_acc": 0.1033, "lyapunov": null, "grad_norm": 0.6504270947812989, "grad_max_sv": 0.22195289880037308, "grad_min_sv": 1.2075933084054746e-08, "grad_condition": 35680632.041642115, "lr": 0.0003960441545911199, "time_sec": 49.64801740646362 }, { "epoch": 86, "train_loss": 2.16914088722229, "train_acc": 0.41866, "test_loss": 8.384735362243653, "test_acc": 0.0929, "lyapunov": null, "grad_norm": 0.6545464063385937, "grad_max_sv": 0.22763431407511234, "grad_min_sv": 1.2551986523431924e-08, "grad_condition": 55796762.73182211, "lr": 0.0003858245649446718, "time_sec": 49.66041612625122 }, { "epoch": 87, "train_loss": 2.1368742782592776, "train_acc": 0.42592, "test_loss": 6.581503366088867, "test_acc": 0.1232, "lyapunov": null, "grad_norm": 0.6536380667194897, "grad_max_sv": 0.2278426967561245, "grad_min_sv": 1.2359256434946175e-08, "grad_condition": 24353654.705191635, "lr": 0.00037565505641757235, "time_sec": 49.66181540489197 }, { "epoch": 88, "train_loss": 2.1224456649780272, "train_acc": 0.4304, "test_loss": 7.7792722061157225, "test_acc": 0.1034, "lyapunov": null, "grad_norm": 0.6522543248368956, "grad_max_sv": 0.21917447336018087, "grad_min_sv": 1.2232303508996622e-08, "grad_condition": 23923683.00683912, "lr": 0.00036554008969236695, "time_sec": 49.64878726005554 }, { "epoch": 89, "train_loss": 2.099866188964844, "train_acc": 0.4329, "test_loss": 7.891568328857422, "test_acc": 0.0965, "lyapunov": null, "grad_norm": 0.6502507826061058, "grad_max_sv": 0.2151956543326378, "grad_min_sv": 1.197734313118648e-08, "grad_condition": 22524026.625488658, "lr": 0.0003554841015277638, "time_sec": 49.636536598205566 }, { "epoch": 90, "train_loss": 2.0865442153167724, "train_acc": 0.43664, "test_loss": 7.531399671936035, "test_acc": 0.106, "lyapunov": null, "grad_norm": 0.6569777082536814, "grad_max_sv": 0.2229558028280735, "grad_min_sv": 1.218858882712226e-08, "grad_condition": 23258750.132011104, "lr": 0.000345491502812526, "time_sec": 49.61567449569702 }, { "epoch": 91, "train_loss": 2.06498106628418, "train_acc": 0.44214, "test_loss": 8.12637159576416, "test_acc": 0.0982, "lyapunov": null, "grad_norm": 0.6551117087544674, "grad_max_sv": 0.2304719265550375, "grad_min_sv": 1.2402068626238271e-08, "grad_condition": 26484691.211153176, "lr": 0.0003355666766307081, "time_sec": 49.61532545089722 }, { "epoch": 92, "train_loss": 2.05007131362915, "train_acc": 0.44468, "test_loss": 8.683588043212891, "test_acc": 0.0875, "lyapunov": null, "grad_norm": 0.6572758654097208, "grad_max_sv": 0.2220118623226881, "grad_min_sv": 1.228345688220056e-08, "grad_condition": 43719860.633667246, "lr": 0.00032571397633909225, "time_sec": 49.61735486984253 }, { "epoch": 93, "train_loss": 2.0329663645935057, "train_acc": 0.44968, "test_loss": 8.036752981567382, "test_acc": 0.0946, "lyapunov": null, "grad_norm": 0.6594762151865757, "grad_max_sv": 0.23468641191720963, "grad_min_sv": 1.2702623283789016e-08, "grad_condition": 22758035.70513925, "lr": 0.00031593772365766094, "time_sec": 49.594003438949585 }, { "epoch": 94, "train_loss": 2.015877328491211, "train_acc": 0.45332, "test_loss": 6.995108350372314, "test_acc": 0.1074, "lyapunov": null, "grad_norm": 0.652167332688343, "grad_max_sv": 0.21848529055714608, "grad_min_sv": 1.2157653033612048e-08, "grad_condition": 31954927.567971922, "lr": 0.0003062422067739483, "time_sec": 49.64247727394104 }, { "epoch": 95, "train_loss": 1.9991163059997559, "train_acc": 0.45638, "test_loss": 7.588622467803955, "test_acc": 0.1142, "lyapunov": null, "grad_norm": 0.6621803475520015, "grad_max_sv": 0.21934038177132606, "grad_min_sv": 1.2358172536697243e-08, "grad_condition": 24385893.04871109, "lr": 0.00029663167846209965, "time_sec": 49.63428497314453 }, { "epoch": 96, "train_loss": 1.9834483330917358, "train_acc": 0.45752, "test_loss": 7.558978903198242, "test_acc": 0.1094, "lyapunov": null, "grad_norm": 0.6668846817868389, "grad_max_sv": 0.21797076910734176, "grad_min_sv": 1.225281484884544e-08, "grad_condition": 22333814.982193254, "lr": 0.00028711035421746345, "time_sec": 49.63755655288696 }, { "epoch": 97, "train_loss": 1.969242282485962, "train_acc": 0.46376, "test_loss": 7.394112825012207, "test_acc": 0.1099, "lyapunov": null, "grad_norm": 0.6554699630149605, "grad_max_sv": 0.2301444172859192, "grad_min_sv": 1.2433391152755214e-08, "grad_condition": 24491819.03636659, "lr": 0.00027768241040753615, "time_sec": 49.655335903167725 }, { "epoch": 98, "train_loss": 1.9529696557617187, "train_acc": 0.46774, "test_loss": 7.055284997558593, "test_acc": 0.1162, "lyapunov": null, "grad_norm": 0.6640537000345971, "grad_max_sv": 0.22325844801962375, "grad_min_sv": 1.2163324900060778e-08, "grad_condition": 52648989.07312742, "lr": 0.00026835198244006903, "time_sec": 49.669140100479126 }, { "epoch": 99, "train_loss": 1.939459365234375, "train_acc": 0.46992, "test_loss": 7.755525547790527, "test_acc": 0.1106, "lyapunov": null, "grad_norm": 0.6598990438805343, "grad_max_sv": 0.23020310550928116, "grad_min_sv": 1.2323512080247845e-08, "grad_condition": 26539045.73575706, "lr": 0.0002591231629491421, "time_sec": 49.658100605010986 }, { "epoch": 100, "train_loss": 1.9241277764892577, "train_acc": 0.47272, "test_loss": 6.962932342529297, "test_acc": 0.1245, "lyapunov": null, "grad_norm": 0.6566318375145326, "grad_max_sv": 0.228052269667387, "grad_min_sv": 1.2546390118495231e-08, "grad_condition": 21651299.709478803, "lr": 0.0002499999999999997, "time_sec": 49.63715100288391 }, { "epoch": 101, "train_loss": 1.9074506490325929, "train_acc": 0.47786, "test_loss": 7.837496071624756, "test_acc": 0.1147, "lyapunov": null, "grad_norm": 0.6602483696560503, "grad_max_sv": 0.2316434532403946, "grad_min_sv": 1.2379145530871938e-08, "grad_condition": 26011010.493026, "lr": 0.00024098649531343477, "time_sec": 49.64603877067566 }, { "epoch": 102, "train_loss": 1.8926145942687989, "train_acc": 0.48072, "test_loss": 8.698235131835938, "test_acc": 0.0935, "lyapunov": null, "grad_norm": 0.6633351574173826, "grad_max_sv": 0.22496680207550526, "grad_min_sv": 1.2393885331918319e-08, "grad_condition": 62142872.25343563, "lr": 0.0002320866025105016, "time_sec": 49.613752126693726 }, { "epoch": 103, "train_loss": 1.8847379415130616, "train_acc": 0.48146, "test_loss": 8.400778024291991, "test_acc": 0.1064, "lyapunov": null, "grad_norm": 0.6628163988108642, "grad_max_sv": 0.2389563336968422, "grad_min_sv": 1.2502011579674024e-08, "grad_condition": 561960509.0407003, "lr": 0.0002233042253783278, "time_sec": 49.64220905303955 }, { "epoch": 104, "train_loss": 1.864337573890686, "train_acc": 0.48388, "test_loss": 7.582353992080688, "test_acc": 0.1105, "lyapunov": null, "grad_norm": 0.6662860681196462, "grad_max_sv": 0.2305597063153982, "grad_min_sv": 1.2549438151154835e-08, "grad_condition": 28749280.670694787, "lr": 0.000214643216157784, "time_sec": 49.59931921958923 }, { "epoch": 105, "train_loss": 1.8436736141586303, "train_acc": 0.49176, "test_loss": 7.296687260437012, "test_acc": 0.1222, "lyapunov": null, "grad_norm": 0.6651015349952935, "grad_max_sv": 0.22770841754972934, "grad_min_sv": 1.2484767888520238e-08, "grad_condition": 223685448.9202466, "lr": 0.00020610737385376332, "time_sec": 49.59563899040222 }, { "epoch": 106, "train_loss": 1.841442982711792, "train_acc": 0.49332, "test_loss": 8.086389836120606, "test_acc": 0.1055, "lyapunov": null, "grad_norm": 0.6642212770974275, "grad_max_sv": 0.23377629406750203, "grad_min_sv": 1.239430658661611e-08, "grad_condition": 25560457.467378292, "lr": 0.00019770044256881242, "time_sec": 49.633612394332886 }, { "epoch": 107, "train_loss": 1.8276642670440675, "train_acc": 0.49872, "test_loss": 8.12283078918457, "test_acc": 0.1035, "lyapunov": null, "grad_norm": 0.6635032674607848, "grad_max_sv": 0.22688985653221608, "grad_min_sv": 1.237523354902237e-08, "grad_condition": 25808230.55779849, "lr": 0.0001894261098608447, "time_sec": 49.63720369338989 }, { "epoch": 108, "train_loss": 1.8169137536621094, "train_acc": 0.49852, "test_loss": 8.409533373260498, "test_acc": 0.0987, "lyapunov": null, "grad_norm": 0.6667541497565868, "grad_max_sv": 0.22939535826444626, "grad_min_sv": 1.2364147994672892e-08, "grad_condition": 124450338.46619192, "lr": 0.000181288005125655, "time_sec": 49.650787591934204 }, { "epoch": 109, "train_loss": 1.7991494818115235, "train_acc": 0.50362, "test_loss": 7.646248370361328, "test_acc": 0.1117, "lyapunov": null, "grad_norm": 0.6718663681176132, "grad_max_sv": 0.22661731615662575, "grad_min_sv": 1.2321765009010166e-08, "grad_condition": 38880987.41150442, "lr": 0.0001732896980049473, "time_sec": 49.649791955947876 }, { "epoch": 110, "train_loss": 1.8055472195053102, "train_acc": 0.5002, "test_loss": 7.981080414581299, "test_acc": 0.1032, "lyapunov": null, "grad_norm": 0.66872350270792, "grad_max_sv": 0.22803995087742807, "grad_min_sv": 1.2362955611371421e-08, "grad_condition": 262033827.92100912, "lr": 0.00016543469682057076, "time_sec": 49.647390365600586 }, { "epoch": 111, "train_loss": 1.7805239984130858, "train_acc": 0.50612, "test_loss": 8.953764317321777, "test_acc": 0.098, "lyapunov": null, "grad_norm": 0.673049303663611, "grad_max_sv": 0.23256770558655263, "grad_min_sv": 1.2522076875409738e-08, "grad_condition": 79448628.08930221, "lr": 0.00015772644703565552, "time_sec": 49.64419651031494 }, { "epoch": 112, "train_loss": 1.7635594388580322, "train_acc": 0.51178, "test_loss": 9.006199928283692, "test_acc": 0.0944, "lyapunov": null, "grad_norm": 0.6690577762179267, "grad_max_sv": 0.231477802246809, "grad_min_sv": 1.2611339457110904e-08, "grad_condition": 74574181.95014855, "lr": 0.00015016832974331713, "time_sec": 49.6623969078064 }, { "epoch": 113, "train_loss": 1.7649991600799562, "train_acc": 0.50992, "test_loss": 8.706898388671876, "test_acc": 0.0957, "lyapunov": null, "grad_norm": 0.6698910233260391, "grad_max_sv": 0.24120958633720874, "grad_min_sv": 1.2578526964457382e-08, "grad_condition": 53483669.38925791, "lr": 0.00014276366018359834, "time_sec": 49.66872000694275 }, { "epoch": 114, "train_loss": 1.7550373428726196, "train_acc": 0.51416, "test_loss": 9.079370852661134, "test_acc": 0.0946, "lyapunov": null, "grad_norm": 0.6663575459996698, "grad_max_sv": 0.22731570713222027, "grad_min_sv": 1.247297455250762e-08, "grad_condition": 42511186.51551006, "lr": 0.00013551568628929425, "time_sec": 49.61651134490967 }, { "epoch": 115, "train_loss": 1.7389271509552002, "train_acc": 0.51604, "test_loss": 8.636061263275147, "test_acc": 0.1024, "lyapunov": null, "grad_norm": 0.6736568214282298, "grad_max_sv": 0.23145201802253723, "grad_min_sv": 1.2523735046232608e-08, "grad_condition": 34281489.67578278, "lr": 0.00012842758726130276, "time_sec": 49.587687492370605 }, { "epoch": 116, "train_loss": 1.73655320854187, "train_acc": 0.51642, "test_loss": 9.354261597442626, "test_acc": 0.0971, "lyapunov": null, "grad_norm": 0.6692761494554511, "grad_max_sv": 0.23360017724335194, "grad_min_sv": 1.2428947707143757e-08, "grad_condition": 42706933.20787396, "lr": 0.0001215024721741218, "time_sec": 49.61284112930298 }, { "epoch": 117, "train_loss": 1.722219416847229, "train_acc": 0.52034, "test_loss": 9.05172070465088, "test_acc": 0.0864, "lyapunov": null, "grad_norm": 0.6709665811373348, "grad_max_sv": 0.23329499438405038, "grad_min_sv": 1.2499731633086597e-08, "grad_condition": 23426718.363504913, "lr": 0.00011474337861210538, "time_sec": 49.612444162368774 }, { "epoch": 118, "train_loss": 1.720088274269104, "train_acc": 0.5212, "test_loss": 8.445899168395997, "test_acc": 0.1071, "lyapunov": null, "grad_norm": 0.6772013084899083, "grad_max_sv": 0.23568132370710373, "grad_min_sv": 1.26266935157604e-08, "grad_condition": 30951096.93160528, "lr": 0.00010815327133708009, "time_sec": 49.616597414016724 }, { "epoch": 119, "train_loss": 1.7100347495269776, "train_acc": 0.52412, "test_loss": 7.941069074249268, "test_acc": 0.116, "lyapunov": null, "grad_norm": 0.6653971862031371, "grad_max_sv": 0.23134685456752777, "grad_min_sv": 1.2402505802922015e-08, "grad_condition": 22810188.64319814, "lr": 0.00010173504098790182, "time_sec": 49.63788056373596 }, { "epoch": 120, "train_loss": 1.700667360534668, "train_acc": 0.52674, "test_loss": 9.192179844665528, "test_acc": 0.0952, "lyapunov": null, "grad_norm": 0.67019495782139, "grad_max_sv": 0.23498024754226207, "grad_min_sv": 1.2522474526766025e-08, "grad_condition": 25575812.55122325, "lr": 9.549150281252629e-05, "time_sec": 49.633721113204956 }, { "epoch": 121, "train_loss": 1.6934022713470458, "train_acc": 0.52622, "test_loss": 8.246514013671876, "test_acc": 0.1052, "lyapunov": null, "grad_norm": 0.67264731502187, "grad_max_sv": 0.23390924520790576, "grad_min_sv": 1.2629734989083596e-08, "grad_condition": 75127709.41882512, "lr": 8.942539543314794e-05, "time_sec": 49.658979177474976 }, { "epoch": 122, "train_loss": 1.6853880523681641, "train_acc": 0.52858, "test_loss": 8.835922454071046, "test_acc": 0.1015, "lyapunov": null, "grad_norm": 0.6681915576498015, "grad_max_sv": 0.22805486135184766, "grad_min_sv": 1.2523601156111397e-08, "grad_condition": 22825184.37456271, "lr": 8.353937964495024e-05, "time_sec": 49.645174980163574 }, { "epoch": 123, "train_loss": 1.6754656018447875, "train_acc": 0.52996, "test_loss": 8.766720679473877, "test_acc": 0.0969, "lyapunov": null, "grad_norm": 0.6635381868278838, "grad_max_sv": 0.23943961299955846, "grad_min_sv": 1.2716584071870152e-08, "grad_condition": 25094494.26316102, "lr": 7.783603724899243e-05, "time_sec": 49.64848589897156 }, { "epoch": 124, "train_loss": 1.6794914197158815, "train_acc": 0.53018, "test_loss": 8.580409744262695, "test_acc": 0.1045, "lyapunov": null, "grad_norm": 0.671245577708117, "grad_max_sv": 0.23060270808637143, "grad_min_sv": 1.234503174199486e-08, "grad_condition": 63345986.58758273, "lr": 7.231786991974666e-05, "time_sec": 49.87266302108765 }, { "epoch": 125, "train_loss": 1.6680570980834961, "train_acc": 0.53182, "test_loss": 8.834838022613525, "test_acc": 0.1023, "lyapunov": null, "grad_norm": 0.6759384740097162, "grad_max_sv": 0.23802748061716555, "grad_min_sv": 1.276443843678532e-08, "grad_condition": 24804650.245445848, "lr": 6.698729810778072e-05, "time_sec": 49.65100860595703 }, { "epoch": 126, "train_loss": 1.6599959258651733, "train_acc": 0.53514, "test_loss": 8.445849030303956, "test_acc": 0.0993, "lyapunov": null, "grad_norm": 0.6683123713335807, "grad_max_sv": 0.23196808211505413, "grad_min_sv": 1.239824619359009e-08, "grad_condition": 24122291.210029412, "lr": 6.184665997806817e-05, "time_sec": 49.60801029205322 }, { "epoch": 127, "train_loss": 1.6581390426254272, "train_acc": 0.53286, "test_loss": 8.180217957305908, "test_acc": 0.1144, "lyapunov": null, "grad_norm": 0.671697720762431, "grad_max_sv": 0.23852520175278186, "grad_min_sv": 1.290384490787444e-08, "grad_condition": 30505273.567765664, "lr": 5.6898210384392595e-05, "time_sec": 49.62530255317688 }, { "epoch": 128, "train_loss": 1.6536951416015624, "train_acc": 0.53944, "test_loss": 9.100402154541015, "test_acc": 0.0967, "lyapunov": null, "grad_norm": 0.667185365414166, "grad_max_sv": 0.2322216048836708, "grad_min_sv": 1.2572321161918864e-08, "grad_condition": 23830602.615603756, "lr": 5.214411988029363e-05, "time_sec": 49.59242367744446 }, { "epoch": 129, "train_loss": 1.6502027558135985, "train_acc": 0.53564, "test_loss": 8.243769989013671, "test_acc": 0.1101, "lyapunov": null, "grad_norm": 0.6719880999378245, "grad_max_sv": 0.23203521333634852, "grad_min_sv": 1.2620684003428195e-08, "grad_condition": 74978797.83799863, "lr": 4.7586473766990294e-05, "time_sec": 49.60294818878174 }, { "epoch": 130, "train_loss": 1.6536482720565795, "train_acc": 0.53586, "test_loss": 8.237010109710694, "test_acc": 0.1067, "lyapunov": null, "grad_norm": 0.6804852067291551, "grad_max_sv": 0.2377860952168703, "grad_min_sv": 1.2762065921406718e-08, "grad_condition": 39212371.63315557, "lr": 4.32272711786996e-05, "time_sec": 49.597888708114624 }, { "epoch": 131, "train_loss": 1.639038058242798, "train_acc": 0.54146, "test_loss": 8.44538454055786, "test_acc": 0.1063, "lyapunov": null, "grad_norm": 0.6724835885199256, "grad_max_sv": 0.2353504840284586, "grad_min_sv": 1.2740010607581453e-08, "grad_condition": 26983674.320896793, "lr": 3.906842420574966e-05, "time_sec": 49.665122509002686 }, { "epoch": 132, "train_loss": 1.6450230081176758, "train_acc": 0.53788, "test_loss": 8.850830727386475, "test_acc": 0.1028, "lyapunov": null, "grad_norm": 0.6728968812754041, "grad_max_sv": 0.2380696687847376, "grad_min_sv": 1.2689633881700357e-08, "grad_condition": 85473852.69328196, "lr": 3.5111757055874305e-05, "time_sec": 49.62814116477966 }, { "epoch": 133, "train_loss": 1.6397483406066895, "train_acc": 0.53942, "test_loss": 8.841438789367675, "test_acc": 0.0951, "lyapunov": null, "grad_norm": 0.6743180544065257, "grad_max_sv": 0.23258159644901752, "grad_min_sv": 1.2391172625816904e-08, "grad_condition": 50130338.96886261, "lr": 3.1359005254054254e-05, "time_sec": 49.650676250457764 }, { "epoch": 134, "train_loss": 1.6300106893539428, "train_acc": 0.54306, "test_loss": 8.161712069702148, "test_acc": 0.0977, "lyapunov": null, "grad_norm": 0.6697898119311428, "grad_max_sv": 0.23791733495891093, "grad_min_sv": 1.2599619581693533e-08, "grad_condition": 33905362.44570724, "lr": 2.7811814881259484e-05, "time_sec": 49.678349018096924 }, { "epoch": 135, "train_loss": 1.6280161280059815, "train_acc": 0.54206, "test_loss": 8.8084473777771, "test_acc": 0.099, "lyapunov": null, "grad_norm": 0.6685419282298722, "grad_max_sv": 0.2294952504336834, "grad_min_sv": 1.2453856032546007e-08, "grad_condition": 28183066.52638216, "lr": 2.4471741852423218e-05, "time_sec": 49.63830757141113 }, { "epoch": 136, "train_loss": 1.6250385632324218, "train_acc": 0.5424, "test_loss": 9.245115556335449, "test_acc": 0.0982, "lyapunov": null, "grad_norm": 0.673719312762165, "grad_max_sv": 0.2436251524835825, "grad_min_sv": 1.2834923374116514e-08, "grad_condition": 22720217.479475908, "lr": 2.1340251233966362e-05, "time_sec": 49.68732476234436 }, { "epoch": 137, "train_loss": 1.6283387484741212, "train_acc": 0.5456, "test_loss": 8.400495840454102, "test_acc": 0.1051, "lyapunov": null, "grad_norm": 0.6729648252425294, "grad_max_sv": 0.228320786729455, "grad_min_sv": 1.2201329287198082e-08, "grad_condition": 29654367.28966447, "lr": 1.8418716601170932e-05, "time_sec": 49.65324902534485 }, { "epoch": 138, "train_loss": 1.6186187603378297, "train_acc": 0.54454, "test_loss": 8.544135133361817, "test_acc": 0.1026, "lyapunov": null, "grad_norm": 0.6767335790557945, "grad_max_sv": 0.24417912773787975, "grad_min_sv": 1.2745562341653915e-08, "grad_condition": 22462589.905390937, "lr": 1.570841943568445e-05, "time_sec": 49.62770223617554 }, { "epoch": 139, "train_loss": 1.614481148033142, "train_acc": 0.54796, "test_loss": 8.814221725463867, "test_acc": 0.0977, "lyapunov": null, "grad_norm": 0.6703542181357327, "grad_max_sv": 0.2325075563043356, "grad_min_sv": 1.2578777475180657e-08, "grad_condition": 21363698.231181078, "lr": 1.3210548563419845e-05, "time_sec": 49.592610120773315 }, { "epoch": 140, "train_loss": 1.6180111114883422, "train_acc": 0.54492, "test_loss": 8.483137963104248, "test_acc": 0.1107, "lyapunov": null, "grad_norm": 0.6809540897117702, "grad_max_sv": 0.2395390760153532, "grad_min_sv": 1.2634957796686664e-08, "grad_condition": 54098275.066982284, "lr": 1.0926199633097203e-05, "time_sec": 49.62364315986633 }, { "epoch": 141, "train_loss": 1.613265188369751, "train_acc": 0.548, "test_loss": 9.025719612884522, "test_acc": 0.0959, "lyapunov": null, "grad_norm": 0.6738933430180942, "grad_max_sv": 0.2385118592530489, "grad_min_sv": 1.2675423211039316e-08, "grad_condition": 24268524.45347375, "lr": 8.856374635655688e-06, "time_sec": 49.6093544960022 }, { "epoch": 142, "train_loss": 1.6109765142822265, "train_acc": 0.54672, "test_loss": 8.501644051361083, "test_acc": 0.1071, "lyapunov": null, "grad_norm": 0.6688401906779454, "grad_max_sv": 0.2420313537120819, "grad_min_sv": 1.2541520851006016e-08, "grad_condition": 34051323.70080558, "lr": 7.001981464747503e-06, "time_sec": 49.626237869262695 }, { "epoch": 143, "train_loss": 1.6083808990859985, "train_acc": 0.5495, "test_loss": 8.410878736114501, "test_acc": 0.1029, "lyapunov": null, "grad_norm": 0.6694620190305317, "grad_max_sv": 0.2360597461462021, "grad_min_sv": 1.2411240957882486e-08, "grad_condition": 256359120.1912489, "lr": 5.3638335185058295e-06, "time_sec": 49.64081525802612 }, { "epoch": 144, "train_loss": 1.6100667620468139, "train_acc": 0.54798, "test_loss": 8.832001342010498, "test_acc": 0.1019, "lyapunov": null, "grad_norm": 0.6707738006928022, "grad_max_sv": 0.23732503540813923, "grad_min_sv": 1.258596476483298e-08, "grad_condition": 24176116.650407396, "lr": 3.942649342761114e-06, "time_sec": 49.650325536727905 }, { "epoch": 145, "train_loss": 1.6037773385238647, "train_acc": 0.54702, "test_loss": 8.7359261428833, "test_acc": 0.0989, "lyapunov": null, "grad_norm": 0.6690176163372957, "grad_max_sv": 0.23970598317682743, "grad_min_sv": 1.2538464763678369e-08, "grad_condition": 33292646.116570044, "lr": 2.7390523158633524e-06, "time_sec": 49.64434027671814 }, { "epoch": 146, "train_loss": 1.6090083113098144, "train_acc": 0.54738, "test_loss": 8.776909831237793, "test_acc": 0.1015, "lyapunov": null, "grad_norm": 0.6706150402911953, "grad_max_sv": 0.2313551239669323, "grad_min_sv": 1.2493580149597339e-08, "grad_condition": 36814707.572352916, "lr": 1.7535703752478133e-06, "time_sec": 49.653162479400635 }, { "epoch": 147, "train_loss": 1.6126505808258056, "train_acc": 0.54692, "test_loss": 9.092076904296874, "test_acc": 0.0975, "lyapunov": null, "grad_norm": 0.6703962324024396, "grad_max_sv": 0.233590966463089, "grad_min_sv": 1.2700339725724153e-08, "grad_condition": 46904603.438913696, "lr": 9.866357858642196e-07, "time_sec": 49.64583897590637 }, { "epoch": 148, "train_loss": 1.6134785464096069, "train_acc": 0.54594, "test_loss": 8.983751535797118, "test_acc": 0.0995, "lyapunov": null, "grad_norm": 0.674578489012928, "grad_max_sv": 0.23970573469996453, "grad_min_sv": 1.272608372571149e-08, "grad_condition": 21842271.84696827, "lr": 4.38584950570808e-07, "time_sec": 49.64808487892151 }, { "epoch": 149, "train_loss": 1.6119013549423218, "train_acc": 0.54862, "test_loss": 8.56843572845459, "test_acc": 0.1054, "lyapunov": null, "grad_norm": 0.6747520334683573, "grad_max_sv": 0.2384514592587948, "grad_min_sv": 1.2600235418935846e-08, "grad_condition": 25340562.620727975, "lr": 1.096582625772501e-07, "time_sec": 49.64168334007263 }, { "epoch": 150, "train_loss": 1.6072704146957397, "train_acc": 0.54742, "test_loss": 8.887614213562012, "test_acc": 0.1015, "lyapunov": null, "grad_norm": 0.6742776904392008, "grad_max_sv": 0.24012672565877438, "grad_min_sv": 1.2860058681840591e-08, "grad_condition": 24539045.015578836, "lr": 0.0, "time_sec": 49.61355018615723 } ], "16": [ { "epoch": 1, "train_loss": 5.088581143493652, "train_acc": 0.01332, "test_loss": 4.951591259765625, "test_acc": 0.01, "lyapunov": null, "grad_norm": 5.595797699274781, "grad_max_sv": 5.059777915477753, "grad_min_sv": 8.380082079928463e-08, "grad_condition": 144739678.32890567, "lr": 0.0009998903417374227, "time_sec": 66.76207876205444 }, { "epoch": 2, "train_loss": 4.727508141174316, "train_acc": 0.0242, "test_loss": 4.891763400268554, "test_acc": 0.0104, "lyapunov": null, "grad_norm": 4.11050155163041, "grad_max_sv": 3.698546850681305, "grad_min_sv": 6.387429426490954e-08, "grad_condition": 67471298.37535235, "lr": 0.0009995614150494292, "time_sec": 66.79832410812378 }, { "epoch": 3, "train_loss": 4.516627143707275, "train_acc": 0.03364, "test_loss": 5.023839845275879, "test_acc": 0.0096, "lyapunov": null, "grad_norm": 3.230804659530269, "grad_max_sv": 2.737754541635513, "grad_min_sv": 4.854583614544161e-08, "grad_condition": 87922174.2345469, "lr": 0.0009990133642141358, "time_sec": 66.76044511795044 }, { "epoch": 4, "train_loss": 4.37137044631958, "train_acc": 0.04084, "test_loss": 5.107725936889649, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 2.5815981982320455, "grad_max_sv": 2.1624936670064927, "grad_min_sv": 3.8690102244220983e-08, "grad_condition": 66775302.44012289, "lr": 0.0009982464296247522, "time_sec": 66.69986486434937 }, { "epoch": 5, "train_loss": 4.2787111569213865, "train_acc": 0.0499, "test_loss": 5.093746864318848, "test_acc": 0.0119, "lyapunov": null, "grad_norm": 2.0501754928637608, "grad_max_sv": 1.6735655426979066, "grad_min_sv": 3.02018420605954e-08, "grad_condition": 83847616.58229446, "lr": 0.0009972609476841367, "time_sec": 66.70642113685608 }, { "epoch": 6, "train_loss": 4.173126724395752, "train_acc": 0.06114, "test_loss": 5.650288801574707, "test_acc": 0.0115, "lyapunov": null, "grad_norm": 1.4461755519297805, "grad_max_sv": 1.029741930961609, "grad_min_sv": 2.1617413775709693e-08, "grad_condition": 53690503.75103078, "lr": 0.000996057350657239, "time_sec": 66.68753027915955 }, { "epoch": 7, "train_loss": 4.093725746765137, "train_acc": 0.07048, "test_loss": 5.236350575256347, "test_acc": 0.0131, "lyapunov": null, "grad_norm": 1.104296817764675, "grad_max_sv": 0.6810471951961518, "grad_min_sv": 1.7525281126307134e-08, "grad_condition": 46908594.94631828, "lr": 0.000994636166481494, "time_sec": 66.73089575767517 }, { "epoch": 8, "train_loss": 4.031361261062622, "train_acc": 0.08184, "test_loss": 5.266020038604736, "test_acc": 0.011, "lyapunov": null, "grad_norm": 0.9907154687339563, "grad_max_sv": 0.5727237299084663, "grad_min_sv": 1.568161453573136e-08, "grad_condition": 205087186.79278168, "lr": 0.0009929980185352525, "time_sec": 66.74000144004822 }, { "epoch": 9, "train_loss": 3.9836690045166017, "train_acc": 0.08876, "test_loss": 5.373385707092285, "test_acc": 0.0145, "lyapunov": null, "grad_norm": 0.9286442561107239, "grad_max_sv": 0.49140588417649267, "grad_min_sv": 1.4355377359054344e-08, "grad_condition": 49567929.749295376, "lr": 0.0009911436253643444, "time_sec": 66.75752806663513 }, { "epoch": 10, "train_loss": 3.9524392292785646, "train_acc": 0.09442, "test_loss": 5.648289218139649, "test_acc": 0.011, "lyapunov": null, "grad_norm": 0.8635186549937055, "grad_max_sv": 0.44110502675175667, "grad_min_sv": 1.380239241649539e-08, "grad_condition": 160205558.71937332, "lr": 0.0009890738003669028, "time_sec": 66.74852681159973 }, { "epoch": 11, "train_loss": 3.9057430783081055, "train_acc": 0.09904, "test_loss": 5.593870043945312, "test_acc": 0.0153, "lyapunov": null, "grad_norm": 0.8313455134497171, "grad_max_sv": 0.4245350927114487, "grad_min_sv": 1.3408236181761123e-08, "grad_condition": 70475775.54279244, "lr": 0.00098678945143658, "time_sec": 66.72569394111633 }, { "epoch": 12, "train_loss": 3.879755588531494, "train_acc": 0.1059, "test_loss": 5.91184571685791, "test_acc": 0.0122, "lyapunov": null, "grad_norm": 0.8098343665002108, "grad_max_sv": 0.3995117902755737, "grad_min_sv": 1.3223197731335352e-08, "grad_condition": 2262455188.632939, "lr": 0.0009842915805643154, "time_sec": 66.74134874343872 }, { "epoch": 13, "train_loss": 3.8387034120178223, "train_acc": 0.11128, "test_loss": 5.55406644744873, "test_acc": 0.0159, "lyapunov": null, "grad_norm": 0.7779364983364899, "grad_max_sv": 0.36580874100327493, "grad_min_sv": 1.2747200656137991e-08, "grad_condition": 31403290.857171714, "lr": 0.000981581283398829, "time_sec": 66.71355533599854 }, { "epoch": 14, "train_loss": 3.8182811224365234, "train_acc": 0.11366, "test_loss": 5.846968073272705, "test_acc": 0.0132, "lyapunov": null, "grad_norm": 0.7545251260271086, "grad_max_sv": 0.34809157326817514, "grad_min_sv": 1.2320788722597342e-08, "grad_condition": 32144212.47563106, "lr": 0.0009786597487660333, "time_sec": 66.72689533233643 }, { "epoch": 15, "train_loss": 3.7967992616271973, "train_acc": 0.11852, "test_loss": 5.68047932510376, "test_acc": 0.0155, "lyapunov": null, "grad_norm": 0.731162073111203, "grad_max_sv": 0.3421657994389534, "grad_min_sv": 1.1936111505433944e-08, "grad_condition": 244312799.4199868, "lr": 0.0009755282581475766, "time_sec": 66.7026903629303 }, { "epoch": 16, "train_loss": 3.7741379774475097, "train_acc": 0.12086, "test_loss": 5.484867942047119, "test_acc": 0.0182, "lyapunov": null, "grad_norm": 0.7090304412758509, "grad_max_sv": 0.3223520040512085, "grad_min_sv": 1.1672073835233832e-08, "grad_condition": 31524319.78711735, "lr": 0.0009721881851187403, "time_sec": 66.739328622818 }, { "epoch": 17, "train_loss": 3.753197032470703, "train_acc": 0.1256, "test_loss": 6.568574522399902, "test_acc": 0.0151, "lyapunov": null, "grad_norm": 0.6935882502734273, "grad_max_sv": 0.3146128565073013, "grad_min_sv": 1.1361096601426174e-08, "grad_condition": 210125774.08050695, "lr": 0.0009686409947459456, "time_sec": 66.74520659446716 }, { "epoch": 18, "train_loss": 3.725816408157349, "train_acc": 0.1287, "test_loss": 6.34478737487793, "test_acc": 0.0159, "lyapunov": null, "grad_norm": 0.6758795184950354, "grad_max_sv": 0.30437840037047864, "grad_min_sv": 1.1510641159673262e-08, "grad_condition": 31558341.74036485, "lr": 0.0009648882429441254, "time_sec": 66.78180265426636 }, { "epoch": 19, "train_loss": 3.714654729003906, "train_acc": 0.13168, "test_loss": 6.368891102600098, "test_acc": 0.016, "lyapunov": null, "grad_norm": 0.6618910868321934, "grad_max_sv": 0.2960255391895771, "grad_min_sv": 1.1117618592404455e-08, "grad_condition": 30205848.660664685, "lr": 0.00096093157579425, "time_sec": 66.74912786483765 }, { "epoch": 20, "train_loss": 3.6946691497802733, "train_acc": 0.13396, "test_loss": 6.4278502319335935, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.6443454538226331, "grad_max_sv": 0.28263592235744, "grad_min_sv": 1.0974601266297567e-08, "grad_condition": 85210724.40585044, "lr": 0.0009567727288213001, "time_sec": 66.75979924201965 }, { "epoch": 21, "train_loss": 3.678538037261963, "train_acc": 0.1389, "test_loss": 5.944661869812012, "test_acc": 0.0147, "lyapunov": null, "grad_norm": 0.6338793846375858, "grad_max_sv": 0.2817647561430931, "grad_min_sv": 1.0979779263564637e-08, "grad_condition": 31384399.636330932, "lr": 0.0009524135262330095, "time_sec": 66.75862097740173 }, { "epoch": 22, "train_loss": 3.6583445849609375, "train_acc": 0.1389, "test_loss": 6.617507224273681, "test_acc": 0.0186, "lyapunov": null, "grad_norm": 0.6270968339485256, "grad_max_sv": 0.2682405423372984, "grad_min_sv": 1.0661627264374474e-08, "grad_condition": 28199289.108431924, "lr": 0.0009478558801197061, "time_sec": 66.70150375366211 }, { "epoch": 23, "train_loss": 3.646308810348511, "train_acc": 0.14268, "test_loss": 6.335385469818116, "test_acc": 0.0149, "lyapunov": null, "grad_norm": 0.6088892694217577, "grad_max_sv": 0.25535150058567524, "grad_min_sv": 1.0300061187296095e-08, "grad_condition": 34795287.59915707, "lr": 0.000943101789615607, "time_sec": 66.70925712585449 }, { "epoch": 24, "train_loss": 3.6351177741241454, "train_acc": 0.1426, "test_loss": 6.3158514701843265, "test_acc": 0.0177, "lyapunov": null, "grad_norm": 0.5964648659799031, "grad_max_sv": 0.24951178021728992, "grad_min_sv": 1.0093550447537458e-08, "grad_condition": 51838350.11107895, "lr": 0.0009381533400219313, "time_sec": 66.70350575447083 }, { "epoch": 25, "train_loss": 3.6183255680847166, "train_acc": 0.14644, "test_loss": 6.721168376159668, "test_acc": 0.0181, "lyapunov": null, "grad_norm": 0.5933387221507487, "grad_max_sv": 0.25210563503205774, "grad_min_sv": 1.0153997685290878e-08, "grad_condition": 247394984.04080305, "lr": 0.0009330127018922189, "time_sec": 66.75347089767456 }, { "epoch": 26, "train_loss": 3.6071299158477785, "train_acc": 0.14866, "test_loss": 6.642034001922608, "test_acc": 0.0181, "lyapunov": null, "grad_norm": 0.5954282647789416, "grad_max_sv": 0.2547519262880087, "grad_min_sv": 1.0135606323680157e-08, "grad_condition": 28483815.51624248, "lr": 0.000927682130080253, "time_sec": 66.75868964195251 }, { "epoch": 27, "train_loss": 3.5931669886779787, "train_acc": 0.1502, "test_loss": 6.223846574401856, "test_acc": 0.0213, "lyapunov": null, "grad_norm": 0.5877941221593797, "grad_max_sv": 0.24717812985181808, "grad_min_sv": 9.855245958201308e-09, "grad_condition": 28193359.09622656, "lr": 0.0009221639627510072, "time_sec": 66.77666926383972 }, { "epoch": 28, "train_loss": 3.5780224719238283, "train_acc": 0.15286, "test_loss": 6.90847115020752, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.5733930952654505, "grad_max_sv": 0.2419151894748211, "grad_min_sv": 9.843924880792442e-09, "grad_condition": 28364870.16247251, "lr": 0.0009164606203550494, "time_sec": 66.74913716316223 }, { "epoch": 29, "train_loss": 3.573341248779297, "train_acc": 0.15312, "test_loss": 6.439982345581055, "test_acc": 0.021, "lyapunov": null, "grad_norm": 0.5679699095868811, "grad_max_sv": 0.2286886375397444, "grad_min_sv": 9.63519248414757e-09, "grad_condition": 29833754.648618333, "lr": 0.0009105746045668516, "time_sec": 66.7665946483612 }, { "epoch": 30, "train_loss": 3.5598143620300293, "train_acc": 0.1562, "test_loss": 6.429332733154297, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.5589691788337113, "grad_max_sv": 0.227083408087492, "grad_min_sv": 9.709436735172439e-09, "grad_condition": 27930931.211393736, "lr": 0.0009045084971874733, "time_sec": 66.75674724578857 }, { "epoch": 31, "train_loss": 3.5470434929656984, "train_acc": 0.16, "test_loss": 6.6052438804626465, "test_acc": 0.0237, "lyapunov": null, "grad_norm": 0.5612591002612681, "grad_max_sv": 0.22930745929479598, "grad_min_sv": 9.687322477525128e-09, "grad_condition": 27425333.623921502, "lr": 0.0008982649590120977, "time_sec": 66.71509528160095 }, { "epoch": 32, "train_loss": 3.537414684448242, "train_acc": 0.16062, "test_loss": 6.011712426757812, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.5564909883403706, "grad_max_sv": 0.22170890271663665, "grad_min_sv": 9.485011626120255e-09, "grad_condition": 25722607.460985243, "lr": 0.0008918467286629196, "time_sec": 66.73007607460022 }, { "epoch": 33, "train_loss": 3.5317853105163572, "train_acc": 0.1603, "test_loss": 6.360434799194336, "test_acc": 0.0189, "lyapunov": null, "grad_norm": 0.550433878030662, "grad_max_sv": 0.2289751097559929, "grad_min_sv": 9.54062134832928e-09, "grad_condition": 381531522.893629, "lr": 0.0008852566213878943, "time_sec": 66.71780228614807 }, { "epoch": 34, "train_loss": 3.5253816675567626, "train_acc": 0.16216, "test_loss": 6.247197938537598, "test_acc": 0.0221, "lyapunov": null, "grad_norm": 0.5426800931973276, "grad_max_sv": 0.21441863812506198, "grad_min_sv": 9.316700774752996e-09, "grad_condition": 26950152.667612456, "lr": 0.000878497527825878, "time_sec": 66.72579026222229 }, { "epoch": 35, "train_loss": 3.502744727020264, "train_acc": 0.16578, "test_loss": 6.571361762237549, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 0.5398257014810475, "grad_max_sv": 0.20931940749287606, "grad_min_sv": 9.403711298539009e-09, "grad_condition": 25780458.398535747, "lr": 0.000871572412738697, "time_sec": 66.74532318115234 }, { "epoch": 36, "train_loss": 3.5064585032653808, "train_acc": 0.1655, "test_loss": 6.218161656951905, "test_acc": 0.0264, "lyapunov": null, "grad_norm": 0.5305975593103218, "grad_max_sv": 0.20301839672029018, "grad_min_sv": 9.261498659651757e-09, "grad_condition": 24222820.24324985, "lr": 0.0008644843137107055, "time_sec": 66.7688057422638 }, { "epoch": 37, "train_loss": 3.4891217603302, "train_acc": 0.16706, "test_loss": 6.142190956115723, "test_acc": 0.0211, "lyapunov": null, "grad_norm": 0.5317318651110877, "grad_max_sv": 0.20387103594839573, "grad_min_sv": 9.19414472749791e-09, "grad_condition": 41748735.80026223, "lr": 0.0008572363398164014, "time_sec": 66.75609850883484 }, { "epoch": 38, "train_loss": 3.4776386444854737, "train_acc": 0.17062, "test_loss": 6.417214579772949, "test_acc": 0.0205, "lyapunov": null, "grad_norm": 0.5236386972874332, "grad_max_sv": 0.20101286694407464, "grad_min_sv": 9.154465988037152e-09, "grad_condition": 37634567.23075999, "lr": 0.0008498316702566826, "time_sec": 66.79052495956421 }, { "epoch": 39, "train_loss": 3.46743884765625, "train_acc": 0.16932, "test_loss": 5.726113172912598, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.5210988175669885, "grad_max_sv": 0.19942357540130615, "grad_min_sv": 8.937806597608677e-09, "grad_condition": 49428217.19173406, "lr": 0.0008422735529643442, "time_sec": 66.74242496490479 }, { "epoch": 40, "train_loss": 3.451697437210083, "train_acc": 0.17372, "test_loss": 6.044572091674804, "test_acc": 0.0225, "lyapunov": null, "grad_norm": 0.5170646983548032, "grad_max_sv": 0.19684507846832275, "grad_min_sv": 9.003056534485909e-09, "grad_condition": 138977031.8076538, "lr": 0.0008345653031794289, "time_sec": 66.70748567581177 }, { "epoch": 41, "train_loss": 3.4474837628173827, "train_acc": 0.17626, "test_loss": 5.9893402641296385, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.5155937638119307, "grad_max_sv": 0.19306579753756523, "grad_min_sv": 8.943595689384076e-09, "grad_condition": 75805302.28035732, "lr": 0.0008267103019950526, "time_sec": 66.69197702407837 }, { "epoch": 42, "train_loss": 3.4423429164123536, "train_acc": 0.17422, "test_loss": 5.739228091430664, "test_acc": 0.0203, "lyapunov": null, "grad_norm": 0.5099978166539899, "grad_max_sv": 0.1884769570082426, "grad_min_sv": 8.939715143152505e-09, "grad_condition": 24445550.576415405, "lr": 0.0008187119948743447, "time_sec": 66.70687818527222 }, { "epoch": 43, "train_loss": 3.4337082667541505, "train_acc": 0.1755, "test_loss": 5.964181529998779, "test_acc": 0.0177, "lyapunov": null, "grad_norm": 0.5104491505466159, "grad_max_sv": 0.19002889432013034, "grad_min_sv": 9.048546927015178e-09, "grad_condition": 102521993.69997685, "lr": 0.000810573890139155, "time_sec": 66.7257513999939 }, { "epoch": 44, "train_loss": 3.420871334762573, "train_acc": 0.17948, "test_loss": 5.929026190948487, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.5050154925488476, "grad_max_sv": 0.18516961708664895, "grad_min_sv": 8.980576357564551e-09, "grad_condition": 24771047.136464976, "lr": 0.0008022995574311873, "time_sec": 66.74575066566467 }, { "epoch": 45, "train_loss": 3.4096126289367676, "train_acc": 0.18164, "test_loss": 5.663789749145508, "test_acc": 0.0195, "lyapunov": null, "grad_norm": 0.5049903163352594, "grad_max_sv": 0.18273597210645676, "grad_min_sv": 8.972159917797207e-09, "grad_condition": 23794424.428349543, "lr": 0.0007938926261462363, "time_sec": 66.7593412399292 }, { "epoch": 46, "train_loss": 3.410715911254883, "train_acc": 0.1807, "test_loss": 5.895871440124512, "test_acc": 0.018, "lyapunov": null, "grad_norm": 0.5025553542851052, "grad_max_sv": 0.1833956018090248, "grad_min_sv": 8.830828140959924e-09, "grad_condition": 30936751.6432406, "lr": 0.0007853567838422158, "time_sec": 66.75630521774292 }, { "epoch": 47, "train_loss": 3.4009066193389894, "train_acc": 0.18276, "test_loss": 6.028702513122559, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.5031283438960251, "grad_max_sv": 0.1799595769494772, "grad_min_sv": 8.917869195879114e-09, "grad_condition": 23059530.36595428, "lr": 0.0007766957746216719, "time_sec": 66.75422596931458 }, { "epoch": 48, "train_loss": 3.390701540603638, "train_acc": 0.18414, "test_loss": 6.1965219741821285, "test_acc": 0.0191, "lyapunov": null, "grad_norm": 0.4978643158932146, "grad_max_sv": 0.1835469003766775, "grad_min_sv": 8.827262552163485e-09, "grad_condition": 51184664.832447655, "lr": 0.0007679133974894982, "time_sec": 66.75912022590637 }, { "epoch": 49, "train_loss": 3.3818662035369873, "train_acc": 0.185, "test_loss": 5.9103582473754885, "test_acc": 0.0216, "lyapunov": null, "grad_norm": 0.49852008894363287, "grad_max_sv": 0.18433105908334255, "grad_min_sv": 8.89238179827001e-09, "grad_condition": 40247674.29131043, "lr": 0.000759013504686565, "time_sec": 66.705406665802 }, { "epoch": 50, "train_loss": 3.3789881330871583, "train_acc": 0.18412, "test_loss": 6.037129666137695, "test_acc": 0.0221, "lyapunov": null, "grad_norm": 0.49658079337268785, "grad_max_sv": 0.179146596416831, "grad_min_sv": 8.88557344369545e-09, "grad_condition": 24117261.20845995, "lr": 0.0007499999999999998, "time_sec": 66.72649240493774 }, { "epoch": 51, "train_loss": 3.368231953201294, "train_acc": 0.18852, "test_loss": 5.9292546646118165, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.4961366760585921, "grad_max_sv": 0.17853211835026742, "grad_min_sv": 8.978999294084744e-09, "grad_condition": 23793132.034851797, "lr": 0.0007408768370508575, "time_sec": 66.72111701965332 }, { "epoch": 52, "train_loss": 3.3652955891418457, "train_acc": 0.18696, "test_loss": 6.321981049346924, "test_acc": 0.0194, "lyapunov": null, "grad_norm": 0.492099764209841, "grad_max_sv": 0.16977054849267006, "grad_min_sv": 8.831625028515866e-09, "grad_condition": 22251962.97293579, "lr": 0.0007316480175599307, "time_sec": 66.76648426055908 }, { "epoch": 53, "train_loss": 3.348167460861206, "train_acc": 0.19116, "test_loss": 6.423485536193848, "test_acc": 0.0194, "lyapunov": null, "grad_norm": 0.49189585228327304, "grad_max_sv": 0.17462090440094472, "grad_min_sv": 8.786478893248183e-09, "grad_condition": 188050773.829039, "lr": 0.0007223175895924635, "time_sec": 66.76346206665039 }, { "epoch": 54, "train_loss": 3.348860473022461, "train_acc": 0.1902, "test_loss": 5.888034158325195, "test_acc": 0.0208, "lyapunov": null, "grad_norm": 0.49279210316788963, "grad_max_sv": 0.17498359829187393, "grad_min_sv": 8.822100200367444e-09, "grad_condition": 28219026.60736394, "lr": 0.0007128896457825361, "time_sec": 66.78646183013916 }, { "epoch": 55, "train_loss": 3.340097451171875, "train_acc": 0.19068, "test_loss": 6.104175454711914, "test_acc": 0.0217, "lyapunov": null, "grad_norm": 0.48880812803196916, "grad_max_sv": 0.16894785091280937, "grad_min_sv": 8.688565139580718e-09, "grad_condition": 29986515.161999334, "lr": 0.0007033683215378998, "time_sec": 66.76022791862488 }, { "epoch": 56, "train_loss": 3.3290103381347658, "train_acc": 0.19526, "test_loss": 6.31472435760498, "test_acc": 0.021, "lyapunov": null, "grad_norm": 0.4920323275084941, "grad_max_sv": 0.16673259809613228, "grad_min_sv": 8.834232892440674e-09, "grad_condition": 22477005.35692047, "lr": 0.0006937577932260512, "time_sec": 66.74644947052002 }, { "epoch": 57, "train_loss": 3.3146336823272704, "train_acc": 0.19646, "test_loss": 5.99189327545166, "test_acc": 0.0226, "lyapunov": null, "grad_norm": 0.48946191063890415, "grad_max_sv": 0.167069473862648, "grad_min_sv": 8.78488659317167e-09, "grad_condition": 21365105.05732888, "lr": 0.0006840622763423388, "time_sec": 66.73155951499939 }, { "epoch": 58, "train_loss": 3.304142900466919, "train_acc": 0.19854, "test_loss": 5.5838108703613285, "test_acc": 0.0256, "lyapunov": null, "grad_norm": 0.4865732671541852, "grad_max_sv": 0.16740650571882726, "grad_min_sv": 8.786859095888389e-09, "grad_condition": 22043022.83729876, "lr": 0.0006742860236609073, "time_sec": 66.7638807296753 }, { "epoch": 59, "train_loss": 3.306339856491089, "train_acc": 0.19832, "test_loss": 6.71665584564209, "test_acc": 0.0226, "lyapunov": null, "grad_norm": 0.4874859882247268, "grad_max_sv": 0.17165971212089062, "grad_min_sv": 8.715364420430748e-09, "grad_condition": 25734869.826652374, "lr": 0.0006644333233692913, "time_sec": 66.69665598869324 }, { "epoch": 60, "train_loss": 3.2998611443328856, "train_acc": 0.19806, "test_loss": 5.851872462463379, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.4884739100521322, "grad_max_sv": 0.16974798031151295, "grad_min_sv": 8.883696248074279e-09, "grad_condition": 21737745.94010177, "lr": 0.0006545084971874734, "time_sec": 66.72846579551697 }, { "epoch": 61, "train_loss": 3.2928254180908203, "train_acc": 0.19828, "test_loss": 5.552249732971191, "test_acc": 0.023, "lyapunov": null, "grad_norm": 0.49016744220935893, "grad_max_sv": 0.16948793716728688, "grad_min_sv": 8.760361631943159e-09, "grad_condition": 27254819.27808509, "lr": 0.0006445158984722354, "time_sec": 66.78463363647461 }, { "epoch": 62, "train_loss": 3.275610556716919, "train_acc": 0.20532, "test_loss": 5.873171199035644, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.4866265828805679, "grad_max_sv": 0.16542929150164126, "grad_min_sv": 8.78843325786971e-09, "grad_condition": 66183687.20952544, "lr": 0.0006344599103076324, "time_sec": 66.76870799064636 }, { "epoch": 63, "train_loss": 3.271966901855469, "train_acc": 0.20438, "test_loss": 5.9298525764465335, "test_acc": 0.024, "lyapunov": null, "grad_norm": 0.4859022585476048, "grad_max_sv": 0.16404966413974761, "grad_min_sv": 8.811849419587681e-09, "grad_condition": 22319350.467063613, "lr": 0.0006243449435824269, "time_sec": 66.73905062675476 }, { "epoch": 64, "train_loss": 3.266578521652222, "train_acc": 0.2042, "test_loss": 5.641555810546875, "test_acc": 0.0272, "lyapunov": null, "grad_norm": 0.48486007197076664, "grad_max_sv": 0.1655890803784132, "grad_min_sv": 8.723941788413291e-09, "grad_condition": 22305108.16299928, "lr": 0.0006141754350553275, "time_sec": 66.7476577758789 }, { "epoch": 65, "train_loss": 3.2511880633544923, "train_acc": 0.2074, "test_loss": 5.8412233901977535, "test_acc": 0.024, "lyapunov": null, "grad_norm": 0.48754428036288966, "grad_max_sv": 0.16739307381212712, "grad_min_sv": 8.817329924526441e-09, "grad_condition": 21968003.756148495, "lr": 0.0006039558454088793, "time_sec": 66.75903058052063 }, { "epoch": 66, "train_loss": 3.249825279388428, "train_acc": 0.2102, "test_loss": 5.375687086486816, "test_acc": 0.0237, "lyapunov": null, "grad_norm": 0.4852656386861206, "grad_max_sv": 0.16313621625304223, "grad_min_sv": 8.705907367234644e-09, "grad_condition": 22679705.957923576, "lr": 0.000593690657292862, "time_sec": 66.70783424377441 }, { "epoch": 67, "train_loss": 3.245251103134155, "train_acc": 0.21036, "test_loss": 6.777110389709472, "test_acc": 0.0168, "lyapunov": null, "grad_norm": 0.4867378238882827, "grad_max_sv": 0.1655280452221632, "grad_min_sv": 8.915351975939679e-09, "grad_condition": 110454092.86004348, "lr": 0.0005833843733580507, "time_sec": 66.69803929328918 }, { "epoch": 68, "train_loss": 3.2381321800231935, "train_acc": 0.20952, "test_loss": 6.102328826904297, "test_acc": 0.0197, "lyapunov": null, "grad_norm": 0.48671688246611916, "grad_max_sv": 0.1659169655293226, "grad_min_sv": 8.76257463186536e-09, "grad_condition": 44812459.07892763, "lr": 0.0005730415142812054, "time_sec": 66.69719409942627 }, { "epoch": 69, "train_loss": 3.2316595709991454, "train_acc": 0.21144, "test_loss": 5.602972175598144, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.4847784835340826, "grad_max_sv": 0.1632793139666319, "grad_min_sv": 8.814856525610204e-09, "grad_condition": 107593372.59174109, "lr": 0.0005626666167821517, "time_sec": 66.68555569648743 }, { "epoch": 70, "train_loss": 3.21884576965332, "train_acc": 0.21162, "test_loss": 6.080870904541015, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.4868075160552665, "grad_max_sv": 0.15996163412928582, "grad_min_sv": 8.820852938351554e-09, "grad_condition": 24906478.982524626, "lr": 0.0005522642316338265, "time_sec": 66.75078678131104 }, { "epoch": 71, "train_loss": 3.2169480547332765, "train_acc": 0.2131, "test_loss": 6.322179025268555, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.48693869340308327, "grad_max_sv": 0.16328724324703217, "grad_min_sv": 8.897740871871563e-09, "grad_condition": 21378151.74249644, "lr": 0.0005418389216661573, "time_sec": 66.82618498802185 }, { "epoch": 72, "train_loss": 3.209583250656128, "train_acc": 0.21452, "test_loss": 5.9164725677490235, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.48710676929190333, "grad_max_sv": 0.1638231087476015, "grad_min_sv": 8.895584530099753e-09, "grad_condition": 26372411.903145302, "lr": 0.0005313952597646563, "time_sec": 66.76002073287964 }, { "epoch": 73, "train_loss": 3.206989998016357, "train_acc": 0.2156, "test_loss": 6.779888274383545, "test_acc": 0.02, "lyapunov": null, "grad_norm": 0.4871385804296449, "grad_max_sv": 0.16540717855095863, "grad_min_sv": 8.919061500467506e-09, "grad_condition": 24713788.997361727, "lr": 0.0005209378268645994, "time_sec": 66.79043841362 }, { "epoch": 74, "train_loss": 3.196985797729492, "train_acc": 0.21718, "test_loss": 6.031893154907227, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.4885299333145373, "grad_max_sv": 0.1637456502765417, "grad_min_sv": 8.884239661999249e-09, "grad_condition": 31643344.54858377, "lr": 0.0005104712099416781, "time_sec": 66.7399845123291 }, { "epoch": 75, "train_loss": 3.1916642933654784, "train_acc": 0.21804, "test_loss": 6.505784149169922, "test_acc": 0.0263, "lyapunov": null, "grad_norm": 0.48738903646108195, "grad_max_sv": 0.16264366619288922, "grad_min_sv": 8.976378307323785e-09, "grad_condition": 23550016.098660976, "lr": 0.0004999999999999996, "time_sec": 66.73288559913635 }, { "epoch": 76, "train_loss": 3.1814585160827638, "train_acc": 0.22052, "test_loss": 6.48178818359375, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.4843426315380276, "grad_max_sv": 0.16138911359012126, "grad_min_sv": 8.912034432650984e-09, "grad_condition": 23286891.30520594, "lr": 0.0004895287900583212, "time_sec": 66.69967555999756 }, { "epoch": 77, "train_loss": 3.1693101245117186, "train_acc": 0.22188, "test_loss": 6.60695295715332, "test_acc": 0.0274, "lyapunov": null, "grad_norm": 0.48473864055458005, "grad_max_sv": 0.16252022571861743, "grad_min_sv": 8.865778075572983e-09, "grad_condition": 20379861.793125592, "lr": 0.0004790621731353997, "time_sec": 66.73058843612671 }, { "epoch": 78, "train_loss": 3.172366504058838, "train_acc": 0.22092, "test_loss": 6.633734432983398, "test_acc": 0.0249, "lyapunov": null, "grad_norm": 0.4834678400720691, "grad_max_sv": 0.1624290570616722, "grad_min_sv": 8.932120706961477e-09, "grad_condition": 23408681.375307254, "lr": 0.000468604740235343, "time_sec": 66.69404172897339 }, { "epoch": 79, "train_loss": 3.1615784413146972, "train_acc": 0.2258, "test_loss": 6.273578634643554, "test_acc": 0.0281, "lyapunov": null, "grad_norm": 0.48944403353102334, "grad_max_sv": 0.16398866586387156, "grad_min_sv": 8.946382384911189e-09, "grad_condition": 22712578.898883633, "lr": 0.00045816107833384175, "time_sec": 66.7472972869873 }, { "epoch": 80, "train_loss": 3.1575608079528807, "train_acc": 0.22382, "test_loss": 6.2906877746582035, "test_acc": 0.0273, "lyapunov": null, "grad_norm": 0.4897084401415468, "grad_max_sv": 0.16338732056319713, "grad_min_sv": 8.928839754715478e-09, "grad_condition": 54043718.99023694, "lr": 0.0004477357683661729, "time_sec": 66.72847270965576 }, { "epoch": 81, "train_loss": 3.1497875170898437, "train_acc": 0.22584, "test_loss": 6.6115754776000975, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.48772100619317266, "grad_max_sv": 0.15775733068585396, "grad_min_sv": 9.009791279712686e-09, "grad_condition": 20818306.202141248, "lr": 0.00043733338321784746, "time_sec": 66.74951100349426 }, { "epoch": 82, "train_loss": 3.150099751586914, "train_acc": 0.22466, "test_loss": 6.489882479858398, "test_acc": 0.0283, "lyapunov": null, "grad_norm": 0.48649716303896257, "grad_max_sv": 0.15712360739707948, "grad_min_sv": 8.928376640099378e-09, "grad_condition": 33122173.6130862, "lr": 0.0004269584857187939, "time_sec": 66.73039722442627 }, { "epoch": 83, "train_loss": 3.1423302052307127, "train_acc": 0.22782, "test_loss": 6.021305515289306, "test_acc": 0.029, "lyapunov": null, "grad_norm": 0.48633742199561775, "grad_max_sv": 0.1581266548484564, "grad_min_sv": 8.888032958058456e-09, "grad_condition": 115025831.2804152, "lr": 0.0004166156266419484, "time_sec": 66.74857115745544 }, { "epoch": 84, "train_loss": 3.128035169677734, "train_acc": 0.22886, "test_loss": 6.798161625671387, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.48802181363511177, "grad_max_sv": 0.1612305197864771, "grad_min_sv": 8.905917459056666e-09, "grad_condition": 24037955.80487976, "lr": 0.0004063093427071373, "time_sec": 66.70986270904541 }, { "epoch": 85, "train_loss": 3.127580302810669, "train_acc": 0.23112, "test_loss": 6.7588252937316895, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.4875306431638057, "grad_max_sv": 0.16091111600399016, "grad_min_sv": 9.01161150146379e-09, "grad_condition": 21073737.755382914, "lr": 0.0003960441545911199, "time_sec": 66.68802571296692 }, { "epoch": 86, "train_loss": 3.114855668182373, "train_acc": 0.2308, "test_loss": 6.564279100036621, "test_acc": 0.0282, "lyapunov": null, "grad_norm": 0.48637730612121255, "grad_max_sv": 0.15542719289660453, "grad_min_sv": 8.93872263707518e-09, "grad_condition": 21703985.404231258, "lr": 0.0003858245649446718, "time_sec": 66.6933023929596 }, { "epoch": 87, "train_loss": 3.1120968659210204, "train_acc": 0.23044, "test_loss": 6.98433928451538, "test_acc": 0.0287, "lyapunov": null, "grad_norm": 0.4900107193499055, "grad_max_sv": 0.16207418888807296, "grad_min_sv": 8.972892097738883e-09, "grad_condition": 47614869.04451983, "lr": 0.00037565505641757235, "time_sec": 66.71200680732727 }, { "epoch": 88, "train_loss": 3.105097593078613, "train_acc": 0.23214, "test_loss": 6.7922447959899905, "test_acc": 0.0302, "lyapunov": null, "grad_norm": 0.4884472360111878, "grad_max_sv": 0.15889082551002504, "grad_min_sv": 8.899033936138335e-09, "grad_condition": 25000729.654329486, "lr": 0.00036554008969236695, "time_sec": 66.7427408695221 }, { "epoch": 89, "train_loss": 3.0926671070098877, "train_acc": 0.23664, "test_loss": 6.916401704406738, "test_acc": 0.0283, "lyapunov": null, "grad_norm": 0.49050493507655857, "grad_max_sv": 0.16100925132632254, "grad_min_sv": 9.010439719348006e-09, "grad_condition": 21207674.720614858, "lr": 0.0003554841015277638, "time_sec": 66.76495027542114 }, { "epoch": 90, "train_loss": 3.090296846160889, "train_acc": 0.23536, "test_loss": 7.012615090179444, "test_acc": 0.0308, "lyapunov": null, "grad_norm": 0.49019979842343425, "grad_max_sv": 0.1572930809110403, "grad_min_sv": 8.949024762796698e-09, "grad_condition": 734920063.8359609, "lr": 0.000345491502812526, "time_sec": 66.73302173614502 }, { "epoch": 91, "train_loss": 3.085657378997803, "train_acc": 0.23746, "test_loss": 6.360618818664551, "test_acc": 0.0363, "lyapunov": null, "grad_norm": 0.4915162849741807, "grad_max_sv": 0.15855198130011558, "grad_min_sv": 8.980356871329809e-09, "grad_condition": 28731902.889844812, "lr": 0.0003355666766307081, "time_sec": 66.74396848678589 }, { "epoch": 92, "train_loss": 3.0831817041778566, "train_acc": 0.2383, "test_loss": 5.9396498611450195, "test_acc": 0.0352, "lyapunov": null, "grad_norm": 0.49047678071806555, "grad_max_sv": 0.15942419767379762, "grad_min_sv": 9.062854348755588e-09, "grad_condition": 57497218.341688454, "lr": 0.00032571397633909225, "time_sec": 66.77806997299194 }, { "epoch": 93, "train_loss": 3.071146830596924, "train_acc": 0.23998, "test_loss": 6.60078558807373, "test_acc": 0.0328, "lyapunov": null, "grad_norm": 0.48952410405337216, "grad_max_sv": 0.1553661532700062, "grad_min_sv": 9.10862152092573e-09, "grad_condition": 20074531.31734441, "lr": 0.00031593772365766094, "time_sec": 66.71407961845398 }, { "epoch": 94, "train_loss": 3.0655629290008544, "train_acc": 0.23992, "test_loss": 6.003435957336426, "test_acc": 0.0378, "lyapunov": null, "grad_norm": 0.49221246193757373, "grad_max_sv": 0.15908809714019298, "grad_min_sv": 9.144222304358074e-09, "grad_condition": 19907441.898985844, "lr": 0.0003062422067739483, "time_sec": 66.693532705307 }, { "epoch": 95, "train_loss": 3.060634704437256, "train_acc": 0.23888, "test_loss": 6.056681440734863, "test_acc": 0.0373, "lyapunov": null, "grad_norm": 0.49339217556104, "grad_max_sv": 0.15901063568890095, "grad_min_sv": 9.065924972545547e-09, "grad_condition": 29502219.759497046, "lr": 0.00029663167846209965, "time_sec": 66.70557427406311 }, { "epoch": 96, "train_loss": 3.061671485443115, "train_acc": 0.24224, "test_loss": 6.776474742126465, "test_acc": 0.0353, "lyapunov": null, "grad_norm": 0.49062641992823525, "grad_max_sv": 0.15993262231349945, "grad_min_sv": 9.044680277306427e-09, "grad_condition": 42484326.952753186, "lr": 0.00028711035421746345, "time_sec": 66.71291422843933 }, { "epoch": 97, "train_loss": 3.0552709561157227, "train_acc": 0.24368, "test_loss": 6.627662403869629, "test_acc": 0.0312, "lyapunov": null, "grad_norm": 0.49312118223102674, "grad_max_sv": 0.1586600374430418, "grad_min_sv": 9.106857379315159e-09, "grad_condition": 19815371.442228314, "lr": 0.00027768241040753615, "time_sec": 66.74342608451843 }, { "epoch": 98, "train_loss": 3.047260310974121, "train_acc": 0.24534, "test_loss": 6.661625199890136, "test_acc": 0.0358, "lyapunov": null, "grad_norm": 0.4920094661808142, "grad_max_sv": 0.1592965368181467, "grad_min_sv": 9.102059620250124e-09, "grad_condition": 78440147.91108674, "lr": 0.00026835198244006903, "time_sec": 66.75223684310913 }, { "epoch": 99, "train_loss": 3.046775559768677, "train_acc": 0.24216, "test_loss": 6.965150428771973, "test_acc": 0.0306, "lyapunov": null, "grad_norm": 0.4926874565507386, "grad_max_sv": 0.16148377656936647, "grad_min_sv": 9.167028746162597e-09, "grad_condition": 82327087.71133485, "lr": 0.0002591231629491421, "time_sec": 66.76156210899353 }, { "epoch": 100, "train_loss": 3.041998874053955, "train_acc": 0.24108, "test_loss": 6.647268369293213, "test_acc": 0.0319, "lyapunov": null, "grad_norm": 0.49732363208650837, "grad_max_sv": 0.15973055586218834, "grad_min_sv": 9.144760823587283e-09, "grad_condition": 19643395.96339509, "lr": 0.0002499999999999997, "time_sec": 66.74560022354126 }, { "epoch": 101, "train_loss": 3.0355277448272706, "train_acc": 0.24656, "test_loss": 6.661636563873291, "test_acc": 0.0352, "lyapunov": null, "grad_norm": 0.4945949712556627, "grad_max_sv": 0.16228868998587132, "grad_min_sv": 9.097275698727314e-09, "grad_condition": 29717156.96899251, "lr": 0.00024098649531343477, "time_sec": 66.74929976463318 }, { "epoch": 102, "train_loss": 3.028595997467041, "train_acc": 0.24942, "test_loss": 7.008212976837158, "test_acc": 0.0297, "lyapunov": null, "grad_norm": 0.4951875945091829, "grad_max_sv": 0.1601081270724535, "grad_min_sv": 9.183049341776606e-09, "grad_condition": 28833554.07107707, "lr": 0.0002320866025105016, "time_sec": 66.70356440544128 }, { "epoch": 103, "train_loss": 3.0245940507507325, "train_acc": 0.24584, "test_loss": 6.46308011932373, "test_acc": 0.0341, "lyapunov": null, "grad_norm": 0.49371498929192353, "grad_max_sv": 0.15619246214628218, "grad_min_sv": 9.060142111202984e-09, "grad_condition": 39182662.24958947, "lr": 0.0002233042253783278, "time_sec": 66.71340656280518 }, { "epoch": 104, "train_loss": 3.021408618774414, "train_acc": 0.2456, "test_loss": 6.825051796722412, "test_acc": 0.0336, "lyapunov": null, "grad_norm": 0.4938389055758033, "grad_max_sv": 0.1602877888828516, "grad_min_sv": 9.021206631709689e-09, "grad_condition": 22621712.521351572, "lr": 0.000214643216157784, "time_sec": 66.69873213768005 }, { "epoch": 105, "train_loss": 3.0085532719421386, "train_acc": 0.25126, "test_loss": 6.49373994140625, "test_acc": 0.0345, "lyapunov": null, "grad_norm": 0.49734202210836465, "grad_max_sv": 0.1637524042278528, "grad_min_sv": 9.15554402847185e-09, "grad_condition": 21636907.97691984, "lr": 0.00020610737385376332, "time_sec": 66.7116219997406 }, { "epoch": 106, "train_loss": 3.0132780470275877, "train_acc": 0.24846, "test_loss": 6.5495201698303225, "test_acc": 0.0336, "lyapunov": null, "grad_norm": 0.4981310757648767, "grad_max_sv": 0.15820327922701835, "grad_min_sv": 9.158961136734866e-09, "grad_condition": 20307530.065489154, "lr": 0.00019770044256881242, "time_sec": 66.74218201637268 }, { "epoch": 107, "train_loss": 3.0039769695281984, "train_acc": 0.24998, "test_loss": 6.218603918457031, "test_acc": 0.0361, "lyapunov": null, "grad_norm": 0.4961392053949623, "grad_max_sv": 0.1600139781832695, "grad_min_sv": 9.131589118194228e-09, "grad_condition": 36979479.48401734, "lr": 0.0001894261098608447, "time_sec": 66.80793809890747 }, { "epoch": 108, "train_loss": 3.001887908782959, "train_acc": 0.2516, "test_loss": 6.588950064086914, "test_acc": 0.0328, "lyapunov": null, "grad_norm": 0.49597326074702125, "grad_max_sv": 0.1588774763047695, "grad_min_sv": 9.17765310692875e-09, "grad_condition": 50896304.22255845, "lr": 0.000181288005125655, "time_sec": 66.76537990570068 }, { "epoch": 109, "train_loss": 2.9904132221221924, "train_acc": 0.25664, "test_loss": 6.382045315551758, "test_acc": 0.0395, "lyapunov": null, "grad_norm": 0.4973619331899814, "grad_max_sv": 0.1614119179546833, "grad_min_sv": 9.145205881466722e-09, "grad_condition": 19754492.90124496, "lr": 0.0001732896980049473, "time_sec": 66.78630447387695 }, { "epoch": 110, "train_loss": 2.989228514251709, "train_acc": 0.25492, "test_loss": 6.322301493072509, "test_acc": 0.0369, "lyapunov": null, "grad_norm": 0.498337161336674, "grad_max_sv": 0.15811876803636551, "grad_min_sv": 9.229779307506902e-09, "grad_condition": 19822899.140848357, "lr": 0.00016543469682057076, "time_sec": 66.75606536865234 }, { "epoch": 111, "train_loss": 2.984906556854248, "train_acc": 0.25606, "test_loss": 6.8701157440185545, "test_acc": 0.0367, "lyapunov": null, "grad_norm": 0.49721550527739367, "grad_max_sv": 0.16228222362697126, "grad_min_sv": 9.23479824502943e-09, "grad_condition": 293614052.48096585, "lr": 0.00015772644703565552, "time_sec": 66.73988127708435 }, { "epoch": 112, "train_loss": 2.9811305560302737, "train_acc": 0.25646, "test_loss": 7.038999290466308, "test_acc": 0.0335, "lyapunov": null, "grad_norm": 0.4941490782513605, "grad_max_sv": 0.15477370359003545, "grad_min_sv": 9.218313174429171e-09, "grad_condition": 164935506.24721447, "lr": 0.00015016832974331713, "time_sec": 66.71515774726868 }, { "epoch": 113, "train_loss": 2.9800968042755125, "train_acc": 0.25398, "test_loss": 6.309658117675781, "test_acc": 0.0389, "lyapunov": null, "grad_norm": 0.49886850458670223, "grad_max_sv": 0.16330830678343772, "grad_min_sv": 9.236376152799153e-09, "grad_condition": 21870251.37413417, "lr": 0.00014276366018359834, "time_sec": 66.71296858787537 }, { "epoch": 114, "train_loss": 2.9754512078094484, "train_acc": 0.25594, "test_loss": 6.60843113861084, "test_acc": 0.0346, "lyapunov": null, "grad_norm": 0.4960627007320755, "grad_max_sv": 0.1573273716494441, "grad_min_sv": 9.209630175144312e-09, "grad_condition": 21208142.4041068, "lr": 0.00013551568628929425, "time_sec": 66.73864150047302 }, { "epoch": 115, "train_loss": 2.973171382446289, "train_acc": 0.25546, "test_loss": 6.1580316360473635, "test_acc": 0.0359, "lyapunov": null, "grad_norm": 0.4975170133978326, "grad_max_sv": 0.16185041181743146, "grad_min_sv": 9.172154036285463e-09, "grad_condition": 23675277.644423716, "lr": 0.00012842758726130276, "time_sec": 66.7741425037384 }, { "epoch": 116, "train_loss": 2.9698315058135987, "train_acc": 0.2585, "test_loss": 6.728188695526123, "test_acc": 0.0352, "lyapunov": null, "grad_norm": 0.49786156791485014, "grad_max_sv": 0.1629601776599884, "grad_min_sv": 9.141069147108882e-09, "grad_condition": 42245446.81835711, "lr": 0.0001215024721741218, "time_sec": 66.85877132415771 }, { "epoch": 117, "train_loss": 2.96759364151001, "train_acc": 0.25688, "test_loss": 6.810253086853027, "test_acc": 0.0317, "lyapunov": null, "grad_norm": 0.5004102922188621, "grad_max_sv": 0.16316126510500908, "grad_min_sv": 9.275286505516789e-09, "grad_condition": 21737711.712548293, "lr": 0.00011474337861210538, "time_sec": 66.78435349464417 }, { "epoch": 118, "train_loss": 2.9639752848815917, "train_acc": 0.25784, "test_loss": 6.6183334121704105, "test_acc": 0.037, "lyapunov": null, "grad_norm": 0.4993536159032588, "grad_max_sv": 0.16331967823207377, "grad_min_sv": 9.30454736036701e-09, "grad_condition": 24980238.64283476, "lr": 0.00010815327133708009, "time_sec": 66.78651332855225 }, { "epoch": 119, "train_loss": 2.955244768218994, "train_acc": 0.26012, "test_loss": 7.170739624023438, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.49772875386211013, "grad_max_sv": 0.15745177641510963, "grad_min_sv": 9.275912776773865e-09, "grad_condition": 20252652.260798354, "lr": 0.00010173504098790182, "time_sec": 66.7590229511261 }, { "epoch": 120, "train_loss": 2.9573191987609864, "train_acc": 0.25902, "test_loss": 6.63704820098877, "test_acc": 0.0341, "lyapunov": null, "grad_norm": 0.4996347696527594, "grad_max_sv": 0.16082486175000668, "grad_min_sv": 9.223728218710203e-09, "grad_condition": 31826325.619799424, "lr": 9.549150281252629e-05, "time_sec": 66.7681827545166 }, { "epoch": 121, "train_loss": 2.9523595883178713, "train_acc": 0.2618, "test_loss": 6.729842405700683, "test_acc": 0.036, "lyapunov": null, "grad_norm": 0.5013710314611776, "grad_max_sv": 0.15908933244645596, "grad_min_sv": 9.356316055253444e-09, "grad_condition": 25691489.85231958, "lr": 8.942539543314794e-05, "time_sec": 66.74568009376526 }, { "epoch": 122, "train_loss": 2.9497915851593017, "train_acc": 0.2617, "test_loss": 6.87424278717041, "test_acc": 0.033, "lyapunov": null, "grad_norm": 0.5005453549657005, "grad_max_sv": 0.16275203377008438, "grad_min_sv": 9.293272996112322e-09, "grad_condition": 83221431.81677945, "lr": 8.353937964495024e-05, "time_sec": 66.74210405349731 }, { "epoch": 123, "train_loss": 2.9416942150115966, "train_acc": 0.2643, "test_loss": 6.686075965118408, "test_acc": 0.0363, "lyapunov": null, "grad_norm": 0.5025049175782571, "grad_max_sv": 0.15961344465613364, "grad_min_sv": 9.371966801230425e-09, "grad_condition": 35132803.96387108, "lr": 7.783603724899243e-05, "time_sec": 66.75957775115967 }, { "epoch": 124, "train_loss": 2.94895947555542, "train_acc": 0.25956, "test_loss": 6.959716784667969, "test_acc": 0.0344, "lyapunov": null, "grad_norm": 0.5043618033931743, "grad_max_sv": 0.16490019261837005, "grad_min_sv": 9.45151938935851e-09, "grad_condition": 20739176.963236075, "lr": 7.231786991974666e-05, "time_sec": 66.76986241340637 }, { "epoch": 125, "train_loss": 2.9465578133392336, "train_acc": 0.2615, "test_loss": 6.6146667854309085, "test_acc": 0.0372, "lyapunov": null, "grad_norm": 0.50165695568463, "grad_max_sv": 0.16004594042897224, "grad_min_sv": 9.333669109823362e-09, "grad_condition": 27696527.631483592, "lr": 6.698729810778072e-05, "time_sec": 66.79878735542297 }, { "epoch": 126, "train_loss": 2.944279951171875, "train_acc": 0.25922, "test_loss": 6.776188401794434, "test_acc": 0.0359, "lyapunov": null, "grad_norm": 0.5004778327715103, "grad_max_sv": 0.1615132074803114, "grad_min_sv": 9.285796417901615e-09, "grad_condition": 20380420.794493236, "lr": 6.184665997806817e-05, "time_sec": 66.81306886672974 }, { "epoch": 127, "train_loss": 2.9345046046447756, "train_acc": 0.26554, "test_loss": 6.409585705566406, "test_acc": 0.0365, "lyapunov": null, "grad_norm": 0.5009056150070453, "grad_max_sv": 0.16262583658099175, "grad_min_sv": 9.41551325135681e-09, "grad_condition": 92271454.95901966, "lr": 5.6898210384392595e-05, "time_sec": 66.77955317497253 }, { "epoch": 128, "train_loss": 2.9406036145782473, "train_acc": 0.26226, "test_loss": 6.883744766235352, "test_acc": 0.0362, "lyapunov": null, "grad_norm": 0.5019103000513857, "grad_max_sv": 0.15915893130004405, "grad_min_sv": 9.27946301465532e-09, "grad_condition": 26892136.241638493, "lr": 5.214411988029363e-05, "time_sec": 66.7971682548523 }, { "epoch": 129, "train_loss": 2.9357696857452393, "train_acc": 0.26482, "test_loss": 6.798914263916016, "test_acc": 0.0371, "lyapunov": null, "grad_norm": 0.502875147430765, "grad_max_sv": 0.16597487404942513, "grad_min_sv": 9.331743605622833e-09, "grad_condition": 21894734.234583445, "lr": 4.7586473766990294e-05, "time_sec": 66.76526641845703 }, { "epoch": 130, "train_loss": 2.931978320159912, "train_acc": 0.2632, "test_loss": 6.588931091308594, "test_acc": 0.0383, "lyapunov": null, "grad_norm": 0.5024988425718886, "grad_max_sv": 0.16058847755193711, "grad_min_sv": 9.346998992854072e-09, "grad_condition": 23689235.71364718, "lr": 4.32272711786996e-05, "time_sec": 66.73650169372559 }, { "epoch": 131, "train_loss": 2.9257036571502684, "train_acc": 0.26346, "test_loss": 6.79047756652832, "test_acc": 0.037, "lyapunov": null, "grad_norm": 0.5025936155191698, "grad_max_sv": 0.1606222338974476, "grad_min_sv": 9.344622825535609e-09, "grad_condition": 19448498.594337363, "lr": 3.906842420574966e-05, "time_sec": 66.72977805137634 }, { "epoch": 132, "train_loss": 2.9238443630981443, "train_acc": 0.26652, "test_loss": 6.582272483825683, "test_acc": 0.0359, "lyapunov": null, "grad_norm": 0.5057115235264575, "grad_max_sv": 0.1622081771492958, "grad_min_sv": 9.322094066382264e-09, "grad_condition": 110706873.75285177, "lr": 3.5111757055874305e-05, "time_sec": 66.74127459526062 }, { "epoch": 133, "train_loss": 2.9275563074493407, "train_acc": 0.26798, "test_loss": 6.701000856018067, "test_acc": 0.0403, "lyapunov": null, "grad_norm": 0.5047358455148018, "grad_max_sv": 0.1596795056015253, "grad_min_sv": 9.385729068944748e-09, "grad_condition": 24899256.961485635, "lr": 3.1359005254054254e-05, "time_sec": 66.78476786613464 }, { "epoch": 134, "train_loss": 2.922698397293091, "train_acc": 0.2656, "test_loss": 6.822336962890625, "test_acc": 0.0348, "lyapunov": null, "grad_norm": 0.5011816329114258, "grad_max_sv": 0.16208452992141248, "grad_min_sv": 9.367489639533489e-09, "grad_condition": 21334456.488015514, "lr": 2.7811814881259484e-05, "time_sec": 66.77467155456543 }, { "epoch": 135, "train_loss": 2.9318275360870363, "train_acc": 0.26446, "test_loss": 6.82299095916748, "test_acc": 0.0375, "lyapunov": null, "grad_norm": 0.5036159796429942, "grad_max_sv": 0.16086461171507835, "grad_min_sv": 9.421430274825227e-09, "grad_condition": 23697065.511433274, "lr": 2.4471741852423218e-05, "time_sec": 66.81163048744202 }, { "epoch": 136, "train_loss": 2.924918181915283, "train_acc": 0.26562, "test_loss": 6.8049731414794925, "test_acc": 0.0379, "lyapunov": null, "grad_norm": 0.5025705246301901, "grad_max_sv": 0.1608381040394306, "grad_min_sv": 9.298360864606891e-09, "grad_condition": 21070247.46761896, "lr": 2.1340251233966362e-05, "time_sec": 66.75751781463623 }, { "epoch": 137, "train_loss": 2.9179174461364745, "train_acc": 0.267, "test_loss": 7.41930817565918, "test_acc": 0.0354, "lyapunov": null, "grad_norm": 0.5020038013732862, "grad_max_sv": 0.16103104539215565, "grad_min_sv": 9.377383154707264e-09, "grad_condition": 25924694.766624488, "lr": 1.8418716601170932e-05, "time_sec": 66.75570106506348 }, { "epoch": 138, "train_loss": 2.923201954345703, "train_acc": 0.26658, "test_loss": 6.757112614440918, "test_acc": 0.0368, "lyapunov": null, "grad_norm": 0.5024810225531171, "grad_max_sv": 0.1589697927236557, "grad_min_sv": 9.370084333437667e-09, "grad_condition": 21088389.845349483, "lr": 1.570841943568445e-05, "time_sec": 66.72540855407715 }, { "epoch": 139, "train_loss": 2.91647822807312, "train_acc": 0.26728, "test_loss": 6.73676093826294, "test_acc": 0.0367, "lyapunov": null, "grad_norm": 0.5029392119297419, "grad_max_sv": 0.16374287530779838, "grad_min_sv": 9.458621610947127e-09, "grad_condition": 21151341.282133214, "lr": 1.3210548563419845e-05, "time_sec": 66.74242377281189 }, { "epoch": 140, "train_loss": 2.9202518330383302, "train_acc": 0.2648, "test_loss": 7.060108929443359, "test_acc": 0.0321, "lyapunov": null, "grad_norm": 0.5033375321825745, "grad_max_sv": 0.1628003478050232, "grad_min_sv": 9.350477757699705e-09, "grad_condition": 42538003.149772, "lr": 1.0926199633097203e-05, "time_sec": 66.72664403915405 }, { "epoch": 141, "train_loss": 2.9214018739318846, "train_acc": 0.26676, "test_loss": 7.03288666305542, "test_acc": 0.0373, "lyapunov": null, "grad_norm": 0.5040934974077137, "grad_max_sv": 0.1631232462823391, "grad_min_sv": 9.429894434753727e-09, "grad_condition": 22205151.285805613, "lr": 8.856374635655688e-06, "time_sec": 66.73880624771118 }, { "epoch": 142, "train_loss": 2.9171245983886718, "train_acc": 0.26776, "test_loss": 7.131447039031983, "test_acc": 0.0347, "lyapunov": null, "grad_norm": 0.502296749693395, "grad_max_sv": 0.16366422846913337, "grad_min_sv": 9.319274187069571e-09, "grad_condition": 23643079.173571, "lr": 7.001981464747503e-06, "time_sec": 66.7779552936554 }, { "epoch": 143, "train_loss": 2.922498332595825, "train_acc": 0.26552, "test_loss": 6.954830606079102, "test_acc": 0.0348, "lyapunov": null, "grad_norm": 0.5043546674267846, "grad_max_sv": 0.1646194864064455, "grad_min_sv": 9.327249025914419e-09, "grad_condition": 20109722.273851108, "lr": 5.3638335185058295e-06, "time_sec": 66.78727650642395 }, { "epoch": 144, "train_loss": 2.9214989219665526, "train_acc": 0.26862, "test_loss": 7.012627954101562, "test_acc": 0.0377, "lyapunov": null, "grad_norm": 0.5036510560585029, "grad_max_sv": 0.1648405112326145, "grad_min_sv": 9.423214848702788e-09, "grad_condition": 39000025.89670716, "lr": 3.942649342761114e-06, "time_sec": 66.78706383705139 }, { "epoch": 145, "train_loss": 2.922225288314819, "train_acc": 0.2672, "test_loss": 6.957889157104492, "test_acc": 0.0364, "lyapunov": null, "grad_norm": 0.503867068026341, "grad_max_sv": 0.16379656754434108, "grad_min_sv": 9.359998385562173e-09, "grad_condition": 77281010.69187385, "lr": 2.7390523158633524e-06, "time_sec": 66.7628915309906 }, { "epoch": 146, "train_loss": 2.9163033376312257, "train_acc": 0.2685, "test_loss": 6.855587731933594, "test_acc": 0.0358, "lyapunov": null, "grad_norm": 0.5029204495133565, "grad_max_sv": 0.16139821223914624, "grad_min_sv": 9.274698062333719e-09, "grad_condition": 20548752.94100132, "lr": 1.7535703752478133e-06, "time_sec": 66.76251316070557 }, { "epoch": 147, "train_loss": 2.9199572286987303, "train_acc": 0.2662, "test_loss": 7.004822827148438, "test_acc": 0.0334, "lyapunov": null, "grad_norm": 0.5038995262415072, "grad_max_sv": 0.15897907465696334, "grad_min_sv": 9.380836815675586e-09, "grad_condition": 19124324.302936584, "lr": 9.866357858642196e-07, "time_sec": 66.77228903770447 }, { "epoch": 148, "train_loss": 2.9100856079101565, "train_acc": 0.26856, "test_loss": 7.008816410064697, "test_acc": 0.0333, "lyapunov": null, "grad_norm": 0.5033801740007838, "grad_max_sv": 0.16318991631269456, "grad_min_sv": 9.304624077298429e-09, "grad_condition": 88163387.15126483, "lr": 4.38584950570808e-07, "time_sec": 66.73154377937317 }, { "epoch": 149, "train_loss": 2.918438820800781, "train_acc": 0.26988, "test_loss": 7.183802980041504, "test_acc": 0.0335, "lyapunov": null, "grad_norm": 0.5034594519443074, "grad_max_sv": 0.16287193521857263, "grad_min_sv": 9.228533171673492e-09, "grad_condition": 31684078.48425772, "lr": 1.096582625772501e-07, "time_sec": 66.71334385871887 }, { "epoch": 150, "train_loss": 2.9179681867980958, "train_acc": 0.26896, "test_loss": 7.132198828887939, "test_acc": 0.0374, "lyapunov": null, "grad_norm": 0.5039379693049055, "grad_max_sv": 0.16534604988992213, "grad_min_sv": 9.358835868777949e-09, "grad_condition": 24483022.85106538, "lr": 0.0, "time_sec": 66.76589560508728 } ], "20": [ { "epoch": 1, "train_loss": 5.21357828704834, "train_acc": 0.00958, "test_loss": 4.717830415344238, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 6.028281164907647, "grad_max_sv": 5.586896324157715, "grad_min_sv": 8.321505736708091e-08, "grad_condition": 126391405.93672016, "lr": 0.0009998903417374227, "time_sec": 83.75971913337708 }, { "epoch": 2, "train_loss": 5.002406215209961, "train_acc": 0.01054, "test_loss": 4.706539186859131, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.942916858382687, "grad_max_sv": 4.443458986282349, "grad_min_sv": 6.176679956948483e-08, "grad_condition": 368514713.27491444, "lr": 0.0009995614150494292, "time_sec": 83.72638368606567 }, { "epoch": 3, "train_loss": 4.941021067657471, "train_acc": 0.0102, "test_loss": 4.685369007110595, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.551335199238429, "grad_max_sv": 4.130530917644501, "grad_min_sv": 5.607447592093085e-08, "grad_condition": 379082253.2858798, "lr": 0.0009990133642141358, "time_sec": 83.7252631187439 }, { "epoch": 4, "train_loss": 4.901978406677246, "train_acc": 0.00948, "test_loss": 4.704164950561523, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.292365216371512, "grad_max_sv": 3.9344047129154207, "grad_min_sv": 5.476369089318922e-08, "grad_condition": 96219244.721114, "lr": 0.0009982464296247522, "time_sec": 83.74504327774048 }, { "epoch": 5, "train_loss": 4.875739136657715, "train_acc": 0.00976, "test_loss": 4.67882677154541, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.102770691913926, "grad_max_sv": 3.7305591464042664, "grad_min_sv": 5.105303844121778e-08, "grad_condition": 114422829.17041938, "lr": 0.0009972609476841367, "time_sec": 83.7535228729248 }, { "epoch": 6, "train_loss": 4.854646638641357, "train_acc": 0.01, "test_loss": 4.6779319816589355, "test_acc": 0.0094, "lyapunov": null, "grad_norm": 3.9533090018879022, "grad_max_sv": 3.569680255651474, "grad_min_sv": 4.9375477451096826e-08, "grad_condition": 120982864.11796215, "lr": 0.000996057350657239, "time_sec": 83.76437997817993 }, { "epoch": 7, "train_loss": 4.843388534240723, "train_acc": 0.0093, "test_loss": 4.688051298522949, "test_acc": 0.01, "lyapunov": null, "grad_norm": 3.808254303294448, "grad_max_sv": 3.401720005273819, "grad_min_sv": 4.769865569742571e-08, "grad_condition": 124322938.54178014, "lr": 0.000994636166481494, "time_sec": 83.73754358291626 }, { "epoch": 8, "train_loss": 4.831099078216552, "train_acc": 0.0098, "test_loss": 4.686168608093261, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 3.638633817460268, "grad_max_sv": 3.29349827170372, "grad_min_sv": 4.562366222038428e-08, "grad_condition": 130991249.85200353, "lr": 0.0009929980185352525, "time_sec": 83.75114607810974 }, { "epoch": 9, "train_loss": 4.8127050201416015, "train_acc": 0.01066, "test_loss": 4.702382767486572, "test_acc": 0.01, "lyapunov": null, "grad_norm": 3.500656504897414, "grad_max_sv": 3.2044365644454955, "grad_min_sv": 4.392227098831691e-08, "grad_condition": 228917141.42878217, "lr": 0.0009911436253643444, "time_sec": 83.75008654594421 }, { "epoch": 10, "train_loss": 4.809432870025635, "train_acc": 0.00958, "test_loss": 4.662561440277099, "test_acc": 0.0105, "lyapunov": null, "grad_norm": 3.3981948131519792, "grad_max_sv": 3.0618119478225707, "grad_min_sv": 4.221159614070658e-08, "grad_condition": 89285987.82360582, "lr": 0.0009890738003669028, "time_sec": 83.75357627868652 }, { "epoch": 11, "train_loss": 4.788434708251953, "train_acc": 0.01052, "test_loss": 4.672326850891113, "test_acc": 0.01, "lyapunov": null, "grad_norm": 3.239567320080417, "grad_max_sv": 2.9396412312984466, "grad_min_sv": 3.992155273024878e-08, "grad_condition": 91783422.62374839, "lr": 0.00098678945143658, "time_sec": 83.73260736465454 }, { "epoch": 12, "train_loss": 4.779874237365723, "train_acc": 0.01008, "test_loss": 4.67001594543457, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 3.103566946411183, "grad_max_sv": 2.861602544784546, "grad_min_sv": 3.936066093057633e-08, "grad_condition": 119851949.4663836, "lr": 0.0009842915805643154, "time_sec": 83.817462682724 }, { "epoch": 13, "train_loss": 4.770841501159668, "train_acc": 0.00992, "test_loss": 4.656426369476319, "test_acc": 0.01, "lyapunov": null, "grad_norm": 3.0009960370081323, "grad_max_sv": 2.656493490934372, "grad_min_sv": 3.707013069217946e-08, "grad_condition": 498107586.22724324, "lr": 0.000981581283398829, "time_sec": 83.74097108840942 }, { "epoch": 14, "train_loss": 4.756785203857422, "train_acc": 0.01042, "test_loss": 4.675232955932617, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 2.8493309861575318, "grad_max_sv": 2.5364737689495085, "grad_min_sv": 3.586032745195311e-08, "grad_condition": 113107959.8123773, "lr": 0.0009786597487660333, "time_sec": 83.73817372322083 }, { "epoch": 15, "train_loss": 4.754773846588135, "train_acc": 0.00998, "test_loss": 4.659816702270508, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 2.754495953066911, "grad_max_sv": 2.477891582250595, "grad_min_sv": 3.409575287799394e-08, "grad_condition": 161602481.60469836, "lr": 0.0009755282581475766, "time_sec": 83.75961685180664 }, { "epoch": 16, "train_loss": 4.743301128997802, "train_acc": 0.0101, "test_loss": 4.649964485168457, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 2.6595920331694725, "grad_max_sv": 2.3447550773620605, "grad_min_sv": 3.222141393699474e-08, "grad_condition": 183792258.0998055, "lr": 0.0009721881851187403, "time_sec": 83.78172135353088 }, { "epoch": 17, "train_loss": 4.733358394927978, "train_acc": 0.01016, "test_loss": 4.642168313598633, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 2.5896272478360634, "grad_max_sv": 2.3136182010173796, "grad_min_sv": 3.172710767995745e-08, "grad_condition": 117247363.48613138, "lr": 0.0009686409947459456, "time_sec": 83.75683784484863 }, { "epoch": 18, "train_loss": 4.729640578918457, "train_acc": 0.0106, "test_loss": 4.654958557128906, "test_acc": 0.01, "lyapunov": null, "grad_norm": 2.5388744373274417, "grad_max_sv": 2.2171274721622467, "grad_min_sv": 3.0159331015910953e-08, "grad_condition": 101838677.71373975, "lr": 0.0009648882429441254, "time_sec": 83.75490856170654 }, { "epoch": 19, "train_loss": 4.723793775634766, "train_acc": 0.0104, "test_loss": 4.653732388305664, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 2.4692592532468662, "grad_max_sv": 2.1681156396865844, "grad_min_sv": 2.978641970435847e-08, "grad_condition": 233798757.5515837, "lr": 0.00096093157579425, "time_sec": 83.76724123954773 }, { "epoch": 20, "train_loss": 4.718724663238525, "train_acc": 0.0102, "test_loss": 4.649697755432129, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 2.427591699320917, "grad_max_sv": 2.1466651976108553, "grad_min_sv": 2.9465831946628997e-08, "grad_condition": 88939856.59831895, "lr": 0.0009567727288213001, "time_sec": 83.74052405357361 }, { "epoch": 21, "train_loss": 4.712672980194092, "train_acc": 0.01012, "test_loss": 4.647871576690674, "test_acc": 0.0094, "lyapunov": null, "grad_norm": 2.357057284901842, "grad_max_sv": 2.1047394454479216, "grad_min_sv": 2.8490478837239763e-08, "grad_condition": 91579762.44536874, "lr": 0.0009524135262330095, "time_sec": 83.75857543945312 }, { "epoch": 22, "train_loss": 4.706978241882324, "train_acc": 0.01024, "test_loss": 4.648735240936279, "test_acc": 0.0085, "lyapunov": null, "grad_norm": 2.2900045512493366, "grad_max_sv": 2.081936264038086, "grad_min_sv": 2.8080869171609457e-08, "grad_condition": 136805304.6805451, "lr": 0.0009478558801197061, "time_sec": 83.75628423690796 }, { "epoch": 23, "train_loss": 4.700225740966797, "train_acc": 0.00964, "test_loss": 4.647530085754394, "test_acc": 0.01, "lyapunov": null, "grad_norm": 2.2107587083430276, "grad_max_sv": 1.988323137164116, "grad_min_sv": 2.6475746447984784e-08, "grad_condition": 164008669.76777038, "lr": 0.000943101789615607, "time_sec": 83.77352237701416 }, { "epoch": 24, "train_loss": 4.692355620117188, "train_acc": 0.0096, "test_loss": 4.637314375305176, "test_acc": 0.01, "lyapunov": null, "grad_norm": 2.058860964349953, "grad_max_sv": 1.8445529341697693, "grad_min_sv": 2.4344878213344857e-08, "grad_condition": 86439388.46384792, "lr": 0.0009381533400219313, "time_sec": 83.79498553276062 }, { "epoch": 25, "train_loss": 4.681464791564942, "train_acc": 0.00928, "test_loss": 4.623963987731933, "test_acc": 0.01, "lyapunov": null, "grad_norm": 1.887935665727307, "grad_max_sv": 1.675812867283821, "grad_min_sv": 2.197329014158589e-08, "grad_condition": 136861974.56893334, "lr": 0.0009330127018922189, "time_sec": 83.75438261032104 }, { "epoch": 26, "train_loss": 4.666114781646728, "train_acc": 0.00968, "test_loss": 4.622957837677002, "test_acc": 0.01, "lyapunov": null, "grad_norm": 1.6987317795206707, "grad_max_sv": 1.5008918464183807, "grad_min_sv": 1.8850404182035874e-08, "grad_condition": 396848763.8507156, "lr": 0.000927682130080253, "time_sec": 83.80677318572998 }, { "epoch": 27, "train_loss": 4.656886034545899, "train_acc": 0.0103, "test_loss": 4.618579483032226, "test_acc": 0.01, "lyapunov": null, "grad_norm": 1.49568981841554, "grad_max_sv": 1.3568953216075896, "grad_min_sv": 1.566217179560514e-08, "grad_condition": 103503015.49660948, "lr": 0.0009221639627510072, "time_sec": 83.78064775466919 }, { "epoch": 28, "train_loss": 4.643399444732666, "train_acc": 0.01056, "test_loss": 4.614220301055909, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 1.3088039077662417, "grad_max_sv": 1.1537246599793434, "grad_min_sv": 1.2267503651797185e-08, "grad_condition": 114843460.24858093, "lr": 0.0009164606203550494, "time_sec": 83.7792694568634 }, { "epoch": 29, "train_loss": 4.633547606048584, "train_acc": 0.00896, "test_loss": 4.611564260101319, "test_acc": 0.01, "lyapunov": null, "grad_norm": 1.0933490764935123, "grad_max_sv": 0.9679391533136368, "grad_min_sv": 7.642074995560522e-09, "grad_condition": 804214751.6294578, "lr": 0.0009105746045668516, "time_sec": 83.83227157592773 }, { "epoch": 30, "train_loss": 4.624774245300293, "train_acc": 0.00964, "test_loss": 4.608921669769287, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.8837855695002744, "grad_max_sv": 0.773915484547615, "grad_min_sv": 2.366957635572509e-11, "grad_condition": 237910863465.00665, "lr": 0.0009045084971874733, "time_sec": 83.80770468711853 }, { "epoch": 31, "train_loss": 4.618612337646485, "train_acc": 0.01032, "test_loss": 4.607751036071777, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.7415257832044893, "grad_max_sv": 0.644972386956215, "grad_min_sv": 3.660935201474329e-12, "grad_condition": 261782379031.45782, "lr": 0.0008982649590120977, "time_sec": 83.79283952713013 }, { "epoch": 32, "train_loss": 4.616099582977295, "train_acc": 0.0089, "test_loss": 4.606554626464844, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.6524091899037507, "grad_max_sv": 0.5655980415642261, "grad_min_sv": 1.3079153537243355e-13, "grad_condition": 507838982675.7344, "lr": 0.0008918467286629196, "time_sec": 83.77927327156067 }, { "epoch": 33, "train_loss": 4.613166402130127, "train_acc": 0.00916, "test_loss": 4.606206927490234, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.5720100552333853, "grad_max_sv": 0.4838749781250954, "grad_min_sv": 7.656531138726084e-14, "grad_condition": 452556546253.1081, "lr": 0.0008852566213878943, "time_sec": 83.7956645488739 }, { "epoch": 34, "train_loss": 4.610275639953613, "train_acc": 0.0096, "test_loss": 4.605738200378418, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.4266452221992571, "grad_max_sv": 0.36331126987934115, "grad_min_sv": 5.44079975167954e-15, "grad_condition": 361256197137.27747, "lr": 0.000878497527825878, "time_sec": 83.78154063224792 }, { "epoch": 35, "train_loss": 4.608961817626954, "train_acc": 0.01014, "test_loss": 4.605575282287598, "test_acc": 0.0104, "lyapunov": null, "grad_norm": 0.32905926875005, "grad_max_sv": 0.2839593421667814, "grad_min_sv": 8.941027107756884e-17, "grad_condition": 283933784815.36444, "lr": 0.000871572412738697, "time_sec": 83.76054668426514 }, { "epoch": 36, "train_loss": 4.608401114196777, "train_acc": 0.00938, "test_loss": 4.605348924255371, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.2743447711162471, "grad_max_sv": 0.2315550185739994, "grad_min_sv": 2.4262184593062427e-31, "grad_condition": 231555018573.99936, "lr": 0.0008644843137107055, "time_sec": 83.76748013496399 }, { "epoch": 37, "train_loss": 4.6074152955627445, "train_acc": 0.01014, "test_loss": 4.605235860443115, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 0.22829204328314687, "grad_max_sv": 0.19001176171004772, "grad_min_sv": 0.0, "grad_condition": 190011761710.0477, "lr": 0.0008572363398164014, "time_sec": 83.82857966423035 }, { "epoch": 38, "train_loss": 4.6074430204772945, "train_acc": 0.00846, "test_loss": 4.605340163421631, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2131689057955099, "grad_max_sv": 0.17414189949631692, "grad_min_sv": 0.0, "grad_condition": 174141899496.3169, "lr": 0.0008498316702566826, "time_sec": 83.7941620349884 }, { "epoch": 39, "train_loss": 4.608160193786621, "train_acc": 0.00878, "test_loss": 4.605639952087403, "test_acc": 0.009, "lyapunov": null, "grad_norm": 0.24317456921386985, "grad_max_sv": 0.2019160557538271, "grad_min_sv": 0.0, "grad_condition": 201916055753.8271, "lr": 0.0008422735529643442, "time_sec": 83.80830645561218 }, { "epoch": 40, "train_loss": 4.606921190032959, "train_acc": 0.00868, "test_loss": 4.605219190216064, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.17887802551259574, "grad_max_sv": 0.14444960467517376, "grad_min_sv": 0.0, "grad_condition": 144449604675.17377, "lr": 0.0008345653031794289, "time_sec": 83.76973342895508 }, { "epoch": 41, "train_loss": 4.606422245941162, "train_acc": 0.00834, "test_loss": 4.605222705078125, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.17289778065418965, "grad_max_sv": 0.13819168899208306, "grad_min_sv": 0.0, "grad_condition": 138191688992.08307, "lr": 0.0008267103019950526, "time_sec": 83.74321436882019 }, { "epoch": 42, "train_loss": 4.606239071655273, "train_acc": 0.01008, "test_loss": 4.605207167053223, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.16994723888320276, "grad_max_sv": 0.13730969540774823, "grad_min_sv": 0.0, "grad_condition": 137309695407.74821, "lr": 0.0008187119948743447, "time_sec": 83.7667281627655 }, { "epoch": 43, "train_loss": 4.606040752410888, "train_acc": 0.00878, "test_loss": 4.605204765319824, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.14038728911483775, "grad_max_sv": 0.10907853152602912, "grad_min_sv": 0.0, "grad_condition": 109078531526.0291, "lr": 0.000810573890139155, "time_sec": 83.71949076652527 }, { "epoch": 44, "train_loss": 4.605822370910644, "train_acc": 0.00892, "test_loss": 4.605195722198486, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.11252097462442588, "grad_max_sv": 0.05359459263272583, "grad_min_sv": 0.0, "grad_condition": 53594592632.72584, "lr": 0.0008022995574311873, "time_sec": 83.74685764312744 }, { "epoch": 45, "train_loss": 4.605744844055176, "train_acc": 0.0091, "test_loss": 4.605188182067871, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.09696133635132191, "grad_max_sv": 0.02572248433716595, "grad_min_sv": 0.0, "grad_condition": 25722484337.16595, "lr": 0.0007938926261462363, "time_sec": 83.688485622406 }, { "epoch": 46, "train_loss": 4.605597140960693, "train_acc": 0.00844, "test_loss": 4.605181010437012, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.09018030151754076, "grad_max_sv": 0.008408381370827556, "grad_min_sv": 0.0, "grad_condition": 8408381370.827555, "lr": 0.0007853567838422158, "time_sec": 83.6915934085846 }, { "epoch": 47, "train_loss": 4.605502964324951, "train_acc": 0.00962, "test_loss": 4.605176095581054, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.08904470683636952, "grad_max_sv": 0.006156692747026682, "grad_min_sv": 0.0, "grad_condition": 6156692747.026682, "lr": 0.0007766957746216719, "time_sec": 83.68823766708374 }, { "epoch": 48, "train_loss": 4.605539189758301, "train_acc": 0.00832, "test_loss": 4.605174793243409, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.08881260926985375, "grad_max_sv": 0.005750873032957316, "grad_min_sv": 0.0, "grad_condition": 5750873032.957315, "lr": 0.0007679133974894982, "time_sec": 83.71515822410583 }, { "epoch": 49, "train_loss": 4.605639272460937, "train_acc": 0.00838, "test_loss": 4.605174536132813, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.09166121492862447, "grad_max_sv": 0.012213990930467844, "grad_min_sv": 0.0, "grad_condition": 12213990930.467844, "lr": 0.000759013504686565, "time_sec": 83.6816132068634 }, { "epoch": 50, "train_loss": 4.605558903808594, "train_acc": 0.00886, "test_loss": 4.605173831939697, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.09052173034897262, "grad_max_sv": 0.015108420280739665, "grad_min_sv": 0.0, "grad_condition": 15108420280.739666, "lr": 0.0007499999999999998, "time_sec": 83.65550971031189 }, { "epoch": 51, "train_loss": 4.606378012390136, "train_acc": 0.00982, "test_loss": 4.605191948699951, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.13316554004595244, "grad_max_sv": 0.08486739061772823, "grad_min_sv": 5.639984459982783e-14, "grad_condition": 78828935747.45195, "lr": 0.0007408768370508575, "time_sec": 83.73471426963806 }, { "epoch": 52, "train_loss": 4.548985960083008, "train_acc": 0.01534, "test_loss": 6.090479849243164, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.31291438549111006, "grad_max_sv": 0.21921597719192504, "grad_min_sv": 1.8728595782364096e-11, "grad_condition": 72581711957.44724, "lr": 0.0007316480175599307, "time_sec": 83.83673882484436 }, { "epoch": 53, "train_loss": 4.517283289031982, "train_acc": 0.01706, "test_loss": 6.098530506896973, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.298946556890386, "grad_max_sv": 0.21190068013966085, "grad_min_sv": 3.1303262042079113e-12, "grad_condition": 83525509037.16917, "lr": 0.0007223175895924635, "time_sec": 83.79953289031982 }, { "epoch": 54, "train_loss": 4.506922316894531, "train_acc": 0.01826, "test_loss": 6.029461811828614, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2872016386861535, "grad_max_sv": 0.2001660715788603, "grad_min_sv": 2.1477832165699736e-12, "grad_condition": 93342369625.0347, "lr": 0.0007128896457825361, "time_sec": 83.83765316009521 }, { "epoch": 55, "train_loss": 4.500352125549316, "train_acc": 0.01822, "test_loss": 6.254561413574219, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2840675312383032, "grad_max_sv": 0.19858233965933322, "grad_min_sv": 2.2369640777182348e-12, "grad_condition": 84452645725.82004, "lr": 0.0007033683215378998, "time_sec": 83.87366318702698 }, { "epoch": 56, "train_loss": 4.494334082946778, "train_acc": 0.01898, "test_loss": 6.176936679077149, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.28473204888904313, "grad_max_sv": 0.20153928063809873, "grad_min_sv": 2.5336075244057393e-12, "grad_condition": 84473652713.76613, "lr": 0.0006937577932260512, "time_sec": 83.85195803642273 }, { "epoch": 57, "train_loss": 4.491042407073975, "train_acc": 0.01962, "test_loss": 6.597558038330078, "test_acc": 0.009, "lyapunov": null, "grad_norm": 0.27666587557698485, "grad_max_sv": 0.19496511965990065, "grad_min_sv": 2.6691194986502985e-12, "grad_condition": 76747509393.5625, "lr": 0.0006840622763423388, "time_sec": 83.8267707824707 }, { "epoch": 58, "train_loss": 4.48429320526123, "train_acc": 0.0202, "test_loss": 6.6381898071289065, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2720732789744726, "grad_max_sv": 0.189533968269825, "grad_min_sv": 2.6686336090421275e-12, "grad_condition": 76958091069.54593, "lr": 0.0006742860236609073, "time_sec": 83.81882667541504 }, { "epoch": 59, "train_loss": 4.479027882080078, "train_acc": 0.02112, "test_loss": 6.593468840026856, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.28013135845208736, "grad_max_sv": 0.1970901783555746, "grad_min_sv": 3.427181970598606e-12, "grad_condition": 77152467146.4727, "lr": 0.0006644333233692913, "time_sec": 83.80582737922668 }, { "epoch": 60, "train_loss": 4.455229897613525, "train_acc": 0.02522, "test_loss": 7.094032968139649, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2984456215457652, "grad_max_sv": 0.20514705888926982, "grad_min_sv": 1.3113472435618547e-11, "grad_condition": 46710044351.44385, "lr": 0.0006545084971874734, "time_sec": 83.83238410949707 }, { "epoch": 61, "train_loss": 4.434012725677491, "train_acc": 0.02664, "test_loss": 7.727159403991699, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.31670091276798196, "grad_max_sv": 0.22147773541510105, "grad_min_sv": 2.0530699328249547e-10, "grad_condition": 23070127911.0107, "lr": 0.0006445158984722354, "time_sec": 83.8679609298706 }, { "epoch": 62, "train_loss": 4.419747852783203, "train_acc": 0.02636, "test_loss": 7.459843544006348, "test_acc": 0.0093, "lyapunov": null, "grad_norm": 0.3192666281191851, "grad_max_sv": 0.22665422596037388, "grad_min_sv": 2.7867287440722047e-10, "grad_condition": 28668691596.510204, "lr": 0.0006344599103076324, "time_sec": 83.7790117263794 }, { "epoch": 63, "train_loss": 4.410167588043213, "train_acc": 0.0297, "test_loss": 6.561855883789063, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.30978499796993897, "grad_max_sv": 0.21358359269797803, "grad_min_sv": 1.0904945902848835e-10, "grad_condition": 28758391079.590137, "lr": 0.0006243449435824269, "time_sec": 83.8552029132843 }, { "epoch": 64, "train_loss": 4.398182756958008, "train_acc": 0.02932, "test_loss": 7.0834544662475585, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.2981823968653719, "grad_max_sv": 0.2038045074790716, "grad_min_sv": 4.896934048336616e-10, "grad_condition": 6480139621.348356, "lr": 0.0006141754350553275, "time_sec": 83.81044340133667 }, { "epoch": 65, "train_loss": 4.39155801651001, "train_acc": 0.0299, "test_loss": 6.743014807128906, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.2915326524043412, "grad_max_sv": 0.19417541958391665, "grad_min_sv": 1.18620941511223e-09, "grad_condition": 1528876877.7676086, "lr": 0.0006039558454088793, "time_sec": 83.8169424533844 }, { "epoch": 66, "train_loss": 4.383871633453369, "train_acc": 0.03122, "test_loss": 6.343855700683593, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2920918221308499, "grad_max_sv": 0.19423219338059425, "grad_min_sv": 1.1915352001942714e-09, "grad_condition": 890331184.9718037, "lr": 0.000593690657292862, "time_sec": 83.8088231086731 }, { "epoch": 67, "train_loss": 4.380996891784668, "train_acc": 0.03214, "test_loss": 6.3810079963684085, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.28877371474045604, "grad_max_sv": 0.193271204829216, "grad_min_sv": 1.6600884500828778e-09, "grad_condition": 372383180.6138096, "lr": 0.0005833843733580507, "time_sec": 83.78432846069336 }, { "epoch": 68, "train_loss": 4.376522983703613, "train_acc": 0.0316, "test_loss": 6.291935075378418, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 0.2862661185936042, "grad_max_sv": 0.18648179918527602, "grad_min_sv": 1.468030542869361e-09, "grad_condition": 2139805441.5710232, "lr": 0.0005730415142812054, "time_sec": 83.7891354560852 }, { "epoch": 69, "train_loss": 4.372224440612793, "train_acc": 0.03352, "test_loss": 6.681443427276611, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2796495478797956, "grad_max_sv": 0.18046599105000496, "grad_min_sv": 1.2168376441450828e-09, "grad_condition": 721985908.0902131, "lr": 0.0005626666167821517, "time_sec": 83.80607604980469 }, { "epoch": 70, "train_loss": 4.369470675811767, "train_acc": 0.03222, "test_loss": 6.483533153533935, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 0.28218706578232045, "grad_max_sv": 0.18038711175322533, "grad_min_sv": 1.6886237430915884e-09, "grad_condition": 284801174.2502399, "lr": 0.0005522642316338265, "time_sec": 83.80915093421936 }, { "epoch": 71, "train_loss": 4.36190840423584, "train_acc": 0.03452, "test_loss": 6.448402415466308, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.27607671132097, "grad_max_sv": 0.17782694809138774, "grad_min_sv": 1.594215062207787e-09, "grad_condition": 2097996064.0572019, "lr": 0.0005418389216661573, "time_sec": 83.82332372665405 }, { "epoch": 72, "train_loss": 4.354908424377442, "train_acc": 0.03596, "test_loss": 6.558257571411133, "test_acc": 0.0115, "lyapunov": null, "grad_norm": 0.2756995722839523, "grad_max_sv": 0.16976643167436123, "grad_min_sv": 1.6113121665065067e-09, "grad_condition": 277986841.7750164, "lr": 0.0005313952597646563, "time_sec": 83.79193758964539 }, { "epoch": 73, "train_loss": 4.354222341156006, "train_acc": 0.03476, "test_loss": 6.309269012451172, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.26842599931569244, "grad_max_sv": 0.1654328290373087, "grad_min_sv": 1.5355291571898453e-09, "grad_condition": 494546718.69761646, "lr": 0.0005209378268645994, "time_sec": 83.83719944953918 }, { "epoch": 74, "train_loss": 4.348915999755859, "train_acc": 0.03656, "test_loss": 6.48945037689209, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.2721751559070442, "grad_max_sv": 0.1733177002519369, "grad_min_sv": 1.6353850840794179e-09, "grad_condition": 4394906218.143788, "lr": 0.0005104712099416781, "time_sec": 83.87231683731079 }, { "epoch": 75, "train_loss": 4.344389753723145, "train_acc": 0.0362, "test_loss": 6.536355171203613, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.2762971427042467, "grad_max_sv": 0.17327322103083134, "grad_min_sv": 1.6745484680748961e-09, "grad_condition": 296861622.65127766, "lr": 0.0004999999999999996, "time_sec": 83.7963707447052 }, { "epoch": 76, "train_loss": 4.336879919433594, "train_acc": 0.0385, "test_loss": 6.207801509094239, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.27617831363540746, "grad_max_sv": 0.17525496631860732, "grad_min_sv": 1.712406004191272e-09, "grad_condition": 355194777.2860588, "lr": 0.0004895287900583212, "time_sec": 83.78706455230713 }, { "epoch": 77, "train_loss": 4.334291800689697, "train_acc": 0.03816, "test_loss": 5.998904524230957, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 0.27646822759404405, "grad_max_sv": 0.17449169531464576, "grad_min_sv": 1.7281031508770487e-09, "grad_condition": 617370975.1793921, "lr": 0.0004790621731353997, "time_sec": 83.79909944534302 }, { "epoch": 78, "train_loss": 4.33249505783081, "train_acc": 0.0375, "test_loss": 6.079836444854736, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.28240731905667205, "grad_max_sv": 0.17906831130385398, "grad_min_sv": 1.832980646302232e-09, "grad_condition": 570608704.9054655, "lr": 0.000468604740235343, "time_sec": 83.78829288482666 }, { "epoch": 79, "train_loss": 4.327211993713379, "train_acc": 0.0372, "test_loss": 6.010349069976806, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.26579955843267283, "grad_max_sv": 0.16206405386328698, "grad_min_sv": 1.8076382385400804e-09, "grad_condition": 680257720.1741323, "lr": 0.00045816107833384175, "time_sec": 83.79378890991211 }, { "epoch": 80, "train_loss": 4.325840251617431, "train_acc": 0.0399, "test_loss": 6.453493260192871, "test_acc": 0.0104, "lyapunov": null, "grad_norm": 0.2678340843927439, "grad_max_sv": 0.16088486537337304, "grad_min_sv": 1.8230197001067525e-09, "grad_condition": 491813566.00292075, "lr": 0.0004477357683661729, "time_sec": 83.77716493606567 }, { "epoch": 81, "train_loss": 4.324064207763672, "train_acc": 0.03872, "test_loss": 6.066691808319092, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.27284601483817317, "grad_max_sv": 0.1656409576535225, "grad_min_sv": 1.966192943528289e-09, "grad_condition": 120565010.54568236, "lr": 0.00043733338321784746, "time_sec": 83.78050255775452 }, { "epoch": 82, "train_loss": 4.3167226469421385, "train_acc": 0.04004, "test_loss": 6.479253450012207, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.266468676835963, "grad_max_sv": 0.16226925253868102, "grad_min_sv": 1.8786357255094232e-09, "grad_condition": 832620477.3818345, "lr": 0.0004269584857187939, "time_sec": 83.77594256401062 }, { "epoch": 83, "train_loss": 4.314026451263428, "train_acc": 0.04066, "test_loss": 6.491674769592285, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2618645063357135, "grad_max_sv": 0.15328656397759916, "grad_min_sv": 1.8954250842473375e-09, "grad_condition": 324046081.6731597, "lr": 0.0004166156266419484, "time_sec": 83.79970407485962 }, { "epoch": 84, "train_loss": 4.307831993713379, "train_acc": 0.04056, "test_loss": 6.641959228515625, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.2686563253168225, "grad_max_sv": 0.16125894524157047, "grad_min_sv": 2.0374150564578254e-09, "grad_condition": 160522665.97837877, "lr": 0.0004063093427071373, "time_sec": 83.82930493354797 }, { "epoch": 85, "train_loss": 4.308941020507812, "train_acc": 0.0418, "test_loss": 6.508579216003418, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.27160717763788633, "grad_max_sv": 0.1655819222331047, "grad_min_sv": 2.023065160186577e-09, "grad_condition": 120462376.21506557, "lr": 0.0003960441545911199, "time_sec": 83.7900025844574 }, { "epoch": 86, "train_loss": 4.304050233764649, "train_acc": 0.03994, "test_loss": 6.396804527282715, "test_acc": 0.0107, "lyapunov": null, "grad_norm": 0.2729810873547816, "grad_max_sv": 0.16440293304622172, "grad_min_sv": 2.151508744253905e-09, "grad_condition": 132130608.9556226, "lr": 0.0003858245649446718, "time_sec": 83.80140709877014 }, { "epoch": 87, "train_loss": 4.299405968475342, "train_acc": 0.04196, "test_loss": 6.600989144897461, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2695479470251096, "grad_max_sv": 0.1591991312801838, "grad_min_sv": 1.9906060319194175e-09, "grad_condition": 119698677.25192289, "lr": 0.00037565505641757235, "time_sec": 83.82861065864563 }, { "epoch": 88, "train_loss": 4.301599495544433, "train_acc": 0.04232, "test_loss": 6.554762725830078, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2647703969850391, "grad_max_sv": 0.15560886412858962, "grad_min_sv": 1.9747980002995937e-09, "grad_condition": 122983202.1326602, "lr": 0.00036554008969236695, "time_sec": 83.82960343360901 }, { "epoch": 89, "train_loss": 4.297747989654541, "train_acc": 0.04348, "test_loss": 6.357062748718262, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.26734470016505596, "grad_max_sv": 0.15722180251032114, "grad_min_sv": 1.981925610086699e-09, "grad_condition": 100233762.481437, "lr": 0.0003554841015277638, "time_sec": 83.85219097137451 }, { "epoch": 90, "train_loss": 4.294689517669678, "train_acc": 0.04346, "test_loss": 6.4904538467407225, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.26448991829060364, "grad_max_sv": 0.1514646142721176, "grad_min_sv": 2.0380848893969404e-09, "grad_condition": 115297831.8608543, "lr": 0.000345491502812526, "time_sec": 83.78560423851013 }, { "epoch": 91, "train_loss": 4.288459105834961, "train_acc": 0.04228, "test_loss": 6.363833187866211, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2716021382283501, "grad_max_sv": 0.16101026125252246, "grad_min_sv": 2.0529807125135857e-09, "grad_condition": 111422037.25124231, "lr": 0.0003355666766307081, "time_sec": 83.80491185188293 }, { "epoch": 92, "train_loss": 4.2877139868164065, "train_acc": 0.04416, "test_loss": 6.387586988067627, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2675364217657968, "grad_max_sv": 0.1556147363036871, "grad_min_sv": 2.072003611047757e-09, "grad_condition": 100163844.77093126, "lr": 0.00032571397633909225, "time_sec": 83.80176591873169 }, { "epoch": 93, "train_loss": 4.286743914489746, "train_acc": 0.04442, "test_loss": 6.614454327392578, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.2696169338715711, "grad_max_sv": 0.1587842211127281, "grad_min_sv": 2.1451849420948964e-09, "grad_condition": 175440678.68888003, "lr": 0.00031593772365766094, "time_sec": 83.81897950172424 }, { "epoch": 94, "train_loss": 4.281456643066406, "train_acc": 0.04426, "test_loss": 6.365528283691407, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.27294877944821766, "grad_max_sv": 0.16244313083589076, "grad_min_sv": 2.1448280498881368e-09, "grad_condition": 93958550.86214396, "lr": 0.0003062422067739483, "time_sec": 83.78250980377197 }, { "epoch": 95, "train_loss": 4.280488971710205, "train_acc": 0.04608, "test_loss": 6.470796231842041, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.273056993639001, "grad_max_sv": 0.16184688359498978, "grad_min_sv": 2.2206805599250813e-09, "grad_condition": 185414259.9896317, "lr": 0.00029663167846209965, "time_sec": 83.82439541816711 }, { "epoch": 96, "train_loss": 4.279716082458496, "train_acc": 0.04314, "test_loss": 6.52447133026123, "test_acc": 0.0093, "lyapunov": null, "grad_norm": 0.27442923945512043, "grad_max_sv": 0.1630928661674261, "grad_min_sv": 2.3233001415073897e-09, "grad_condition": 103462231.52886583, "lr": 0.00028711035421746345, "time_sec": 83.83807969093323 }, { "epoch": 97, "train_loss": 4.274856643218994, "train_acc": 0.04572, "test_loss": 6.772166311645508, "test_acc": 0.0109, "lyapunov": null, "grad_norm": 0.2771278283509764, "grad_max_sv": 0.17104111909866332, "grad_min_sv": 2.4184343061159352e-09, "grad_condition": 271014828.3038153, "lr": 0.00027768241040753615, "time_sec": 83.85514092445374 }, { "epoch": 98, "train_loss": 4.2779387315368655, "train_acc": 0.04608, "test_loss": 6.668636999511719, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.27463112819076785, "grad_max_sv": 0.16144732832908631, "grad_min_sv": 2.2677979229649758e-09, "grad_condition": 4419130655.463402, "lr": 0.00026835198244006903, "time_sec": 83.83084058761597 }, { "epoch": 99, "train_loss": 4.276140930480957, "train_acc": 0.04544, "test_loss": 6.88837735748291, "test_acc": 0.0107, "lyapunov": null, "grad_norm": 0.26886350994697167, "grad_max_sv": 0.15219354666769505, "grad_min_sv": 2.2166218230715296e-09, "grad_condition": 103754705.283932, "lr": 0.0002591231629491421, "time_sec": 83.79713916778564 }, { "epoch": 100, "train_loss": 4.273054361877441, "train_acc": 0.04564, "test_loss": 6.783898326873779, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 0.26691489320326656, "grad_max_sv": 0.14936545640230178, "grad_min_sv": 2.2781338981925358e-09, "grad_condition": 87358992.35708968, "lr": 0.0002499999999999997, "time_sec": 83.80319023132324 }, { "epoch": 101, "train_loss": 4.26914766998291, "train_acc": 0.04564, "test_loss": 6.513159948730468, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.26611169562468134, "grad_max_sv": 0.15025373138487338, "grad_min_sv": 2.2174503035848892e-09, "grad_condition": 96439723.92469814, "lr": 0.00024098649531343477, "time_sec": 83.83437013626099 }, { "epoch": 102, "train_loss": 4.26979032119751, "train_acc": 0.04642, "test_loss": 6.493202007293701, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.26813810856759995, "grad_max_sv": 0.1489817149937153, "grad_min_sv": 2.380725915018811e-09, "grad_condition": 76215277.93021134, "lr": 0.0002320866025105016, "time_sec": 83.80248379707336 }, { "epoch": 103, "train_loss": 4.260873723297119, "train_acc": 0.04782, "test_loss": 6.493594526672363, "test_acc": 0.0111, "lyapunov": null, "grad_norm": 0.2688305350715821, "grad_max_sv": 0.1512874387204647, "grad_min_sv": 2.453062892919522e-09, "grad_condition": 134347199.1051014, "lr": 0.0002233042253783278, "time_sec": 83.81874346733093 }, { "epoch": 104, "train_loss": 4.262198150939941, "train_acc": 0.04738, "test_loss": 6.605858857727051, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 0.27225916391154686, "grad_max_sv": 0.15373125690966843, "grad_min_sv": 2.44866176035783e-09, "grad_condition": 419013949.5031613, "lr": 0.000214643216157784, "time_sec": 84.03694415092468 }, { "epoch": 105, "train_loss": 4.262576495056153, "train_acc": 0.04672, "test_loss": 6.746639459991455, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.2762952402363064, "grad_max_sv": 0.15909811817109584, "grad_min_sv": 2.4671919398103204e-09, "grad_condition": 139499125.202051, "lr": 0.00020610737385376332, "time_sec": 83.83756351470947 }, { "epoch": 106, "train_loss": 4.256981732330322, "train_acc": 0.04834, "test_loss": 6.714322766113281, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 0.27463124817104645, "grad_max_sv": 0.15689255371689798, "grad_min_sv": 2.5142482939360944e-09, "grad_condition": 118433721.44138017, "lr": 0.00019770044256881242, "time_sec": 83.83591985702515 }, { "epoch": 107, "train_loss": 4.2602463818359375, "train_acc": 0.04698, "test_loss": 6.657286577606201, "test_acc": 0.0109, "lyapunov": null, "grad_norm": 0.2689041932222791, "grad_max_sv": 0.15177576132118703, "grad_min_sv": 2.4187723310364893e-09, "grad_condition": 94992794.34351222, "lr": 0.0001894261098608447, "time_sec": 83.80453681945801 }, { "epoch": 108, "train_loss": 4.2544874598693845, "train_acc": 0.04844, "test_loss": 6.59372087097168, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.2710712522794079, "grad_max_sv": 0.15038638189435005, "grad_min_sv": 2.514627481589593e-09, "grad_condition": 93107492.33691652, "lr": 0.000181288005125655, "time_sec": 83.77546954154968 }, { "epoch": 109, "train_loss": 4.253146978759766, "train_acc": 0.04824, "test_loss": 6.575524732208252, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.2727669683249611, "grad_max_sv": 0.15002147294580936, "grad_min_sv": 2.4739045799762604e-09, "grad_condition": 125566166.74099617, "lr": 0.0001732896980049473, "time_sec": 83.82711911201477 }, { "epoch": 110, "train_loss": 4.250933767089844, "train_acc": 0.04966, "test_loss": 6.632392105102539, "test_acc": 0.011, "lyapunov": null, "grad_norm": 0.27898350710296843, "grad_max_sv": 0.15593392103910447, "grad_min_sv": 2.5894539202545724e-09, "grad_condition": 625752503.9437258, "lr": 0.00016543469682057076, "time_sec": 83.74293255805969 }, { "epoch": 111, "train_loss": 4.24997673614502, "train_acc": 0.04972, "test_loss": 6.568419965362549, "test_acc": 0.0109, "lyapunov": null, "grad_norm": 0.27772763472261885, "grad_max_sv": 0.15495621263980866, "grad_min_sv": 2.661621495425592e-09, "grad_condition": 70119073.46937823, "lr": 0.00015772644703565552, "time_sec": 83.79197788238525 }, { "epoch": 112, "train_loss": 4.249247148590088, "train_acc": 0.0507, "test_loss": 6.707973278045654, "test_acc": 0.0093, "lyapunov": null, "grad_norm": 0.27686969610418316, "grad_max_sv": 0.15229813233017922, "grad_min_sv": 2.662702908856618e-09, "grad_condition": 153958977.83635777, "lr": 0.00015016832974331713, "time_sec": 83.80273818969727 }, { "epoch": 113, "train_loss": 4.250667928771973, "train_acc": 0.0492, "test_loss": 6.8461118530273435, "test_acc": 0.0096, "lyapunov": null, "grad_norm": 0.28055092675814575, "grad_max_sv": 0.1576558079570532, "grad_min_sv": 2.742332778221668e-09, "grad_condition": 137456876.77179033, "lr": 0.00014276366018359834, "time_sec": 83.80364871025085 }, { "epoch": 114, "train_loss": 4.2449106436157225, "train_acc": 0.05016, "test_loss": 6.787322373962402, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.27979119322019597, "grad_max_sv": 0.15479157418012618, "grad_min_sv": 2.6695785599467614e-09, "grad_condition": 81382647.58523288, "lr": 0.00013551568628929425, "time_sec": 83.82229542732239 }, { "epoch": 115, "train_loss": 4.244952727355957, "train_acc": 0.05002, "test_loss": 6.741559551239014, "test_acc": 0.0092, "lyapunov": null, "grad_norm": 0.2773863197316903, "grad_max_sv": 0.15171751268208028, "grad_min_sv": 2.682797061023465e-09, "grad_condition": 212074169.4590431, "lr": 0.00012842758726130276, "time_sec": 83.82812428474426 }, { "epoch": 116, "train_loss": 4.242339648132324, "train_acc": 0.04982, "test_loss": 6.755374185180664, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2805527611657844, "grad_max_sv": 0.1574402242898941, "grad_min_sv": 2.8019030511548804e-09, "grad_condition": 238625880.71394747, "lr": 0.0001215024721741218, "time_sec": 83.79120373725891 }, { "epoch": 117, "train_loss": 4.240206247253418, "train_acc": 0.04966, "test_loss": 6.836046894073486, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.2758039178422697, "grad_max_sv": 0.1517912581562996, "grad_min_sv": 2.68810798897956e-09, "grad_condition": 72825643.14736441, "lr": 0.00011474337861210538, "time_sec": 83.7668628692627 }, { "epoch": 118, "train_loss": 4.2366791255187985, "train_acc": 0.05162, "test_loss": 6.8930122108459475, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.28097411795628907, "grad_max_sv": 0.15138982199132442, "grad_min_sv": 2.6724390362123373e-09, "grad_condition": 105031519.49257562, "lr": 0.00010815327133708009, "time_sec": 83.7777681350708 }, { "epoch": 119, "train_loss": 4.239317052307129, "train_acc": 0.05098, "test_loss": 6.895288885498047, "test_acc": 0.0107, "lyapunov": null, "grad_norm": 0.28557653268704064, "grad_max_sv": 0.15877793319523334, "grad_min_sv": 2.852896488665657e-09, "grad_condition": 130124221.77470978, "lr": 0.00010173504098790182, "time_sec": 83.770183801651 }, { "epoch": 120, "train_loss": 4.238326491088867, "train_acc": 0.04944, "test_loss": 6.971952970123291, "test_acc": 0.0116, "lyapunov": null, "grad_norm": 0.28330987147198217, "grad_max_sv": 0.15257025621831416, "grad_min_sv": 2.890761002100062e-09, "grad_condition": 92481164.9877267, "lr": 9.549150281252629e-05, "time_sec": 83.78682947158813 }, { "epoch": 121, "train_loss": 4.238821759033203, "train_acc": 0.05118, "test_loss": 6.903655708312988, "test_acc": 0.0107, "lyapunov": null, "grad_norm": 0.2844816880687477, "grad_max_sv": 0.15047130659222602, "grad_min_sv": 2.9364908977515257e-09, "grad_condition": 155468550.15943855, "lr": 8.942539543314794e-05, "time_sec": 83.74171853065491 }, { "epoch": 122, "train_loss": 4.231929050292969, "train_acc": 0.05106, "test_loss": 6.9859304649353025, "test_acc": 0.011, "lyapunov": null, "grad_norm": 0.28661742540946805, "grad_max_sv": 0.15440320819616318, "grad_min_sv": 3.0144829410438945e-09, "grad_condition": 58782400.13901849, "lr": 8.353937964495024e-05, "time_sec": 83.77999758720398 }, { "epoch": 123, "train_loss": 4.234138116607666, "train_acc": 0.05334, "test_loss": 6.891355895996094, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.28893265325047696, "grad_max_sv": 0.15679317489266395, "grad_min_sv": 3.0731328568706083e-09, "grad_condition": 83816649.99544896, "lr": 7.783603724899243e-05, "time_sec": 83.76851487159729 }, { "epoch": 124, "train_loss": 4.229343013763428, "train_acc": 0.05258, "test_loss": 7.009951159667969, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.2863743887145036, "grad_max_sv": 0.15191952474415302, "grad_min_sv": 3.0230644397499785e-09, "grad_condition": 211100331.6657278, "lr": 7.231786991974666e-05, "time_sec": 83.76139807701111 }, { "epoch": 125, "train_loss": 4.232501866760254, "train_acc": 0.05186, "test_loss": 6.96674277420044, "test_acc": 0.0111, "lyapunov": null, "grad_norm": 0.2858550264764349, "grad_max_sv": 0.15213587880134583, "grad_min_sv": 3.046650505489357e-09, "grad_condition": 63383717.426429704, "lr": 6.698729810778072e-05, "time_sec": 83.78086757659912 }, { "epoch": 126, "train_loss": 4.229700404968262, "train_acc": 0.0524, "test_loss": 7.008199283599853, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.2850115287876514, "grad_max_sv": 0.14953349605202676, "grad_min_sv": 2.9821331362644977e-09, "grad_condition": 76613514.19037959, "lr": 6.184665997806817e-05, "time_sec": 83.765873670578 }, { "epoch": 127, "train_loss": 4.226065429992675, "train_acc": 0.05148, "test_loss": 6.9513890808105465, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.28929346428701186, "grad_max_sv": 0.15673540011048318, "grad_min_sv": 3.046475822998662e-09, "grad_condition": 68840265.65077923, "lr": 5.6898210384392595e-05, "time_sec": 83.76980423927307 }, { "epoch": 128, "train_loss": 4.223751395874023, "train_acc": 0.05446, "test_loss": 6.981657604980469, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.2886516286895676, "grad_max_sv": 0.15273929238319398, "grad_min_sv": 3.0959206469283186e-09, "grad_condition": 61503758.19812535, "lr": 5.214411988029363e-05, "time_sec": 83.77617073059082 }, { "epoch": 129, "train_loss": 4.223811264648438, "train_acc": 0.05404, "test_loss": 6.9342261474609375, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.2869141420134922, "grad_max_sv": 0.15136036798357963, "grad_min_sv": 3.047223613023009e-09, "grad_condition": 97351366.2154063, "lr": 4.7586473766990294e-05, "time_sec": 83.78148245811462 }, { "epoch": 130, "train_loss": 4.224827704467773, "train_acc": 0.0532, "test_loss": 7.028645568084717, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.2903989310802725, "grad_max_sv": 0.15144419111311436, "grad_min_sv": 3.1437888660390544e-09, "grad_condition": 118830904.24527971, "lr": 4.32272711786996e-05, "time_sec": 83.79948663711548 }, { "epoch": 131, "train_loss": 4.221605782775879, "train_acc": 0.05298, "test_loss": 6.999451491546631, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.29092754210208693, "grad_max_sv": 0.15410602577030658, "grad_min_sv": 3.2033975992662445e-09, "grad_condition": 57038304.52076046, "lr": 3.906842420574966e-05, "time_sec": 83.77110433578491 }, { "epoch": 132, "train_loss": 4.218992453613281, "train_acc": 0.05284, "test_loss": 7.0255691505432125, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.2914825249386215, "grad_max_sv": 0.15589108187705278, "grad_min_sv": 3.206146753816086e-09, "grad_condition": 122587816.51957992, "lr": 3.5111757055874305e-05, "time_sec": 83.75379085540771 }, { "epoch": 133, "train_loss": 4.220229903869629, "train_acc": 0.05394, "test_loss": 6.9970667213439945, "test_acc": 0.0106, "lyapunov": null, "grad_norm": 0.293170941298062, "grad_max_sv": 0.15195444263517857, "grad_min_sv": 3.1603012576666978e-09, "grad_condition": 99833022.93899234, "lr": 3.1359005254054254e-05, "time_sec": 83.83364748954773 }, { "epoch": 134, "train_loss": 4.221537724761963, "train_acc": 0.05412, "test_loss": 7.081800342559815, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.29192289713649316, "grad_max_sv": 0.1527898743748665, "grad_min_sv": 3.242900753486211e-09, "grad_condition": 53839731.29661299, "lr": 2.7811814881259484e-05, "time_sec": 83.77570366859436 }, { "epoch": 135, "train_loss": 4.224225687103272, "train_acc": 0.0536, "test_loss": 7.031653879547119, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.2928013245487039, "grad_max_sv": 0.15023601055145264, "grad_min_sv": 3.1499084042485583e-09, "grad_condition": 56443800.83675871, "lr": 2.4471741852423218e-05, "time_sec": 83.79031038284302 }, { "epoch": 136, "train_loss": 4.2209420147705075, "train_acc": 0.05542, "test_loss": 7.0730202087402345, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.29383612459846997, "grad_max_sv": 0.1526225544512272, "grad_min_sv": 3.216327003211297e-09, "grad_condition": 488112741.3165139, "lr": 2.1340251233966362e-05, "time_sec": 83.78721952438354 }, { "epoch": 137, "train_loss": 4.217904202728271, "train_acc": 0.0547, "test_loss": 7.029183413696289, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.29146081115101274, "grad_max_sv": 0.14856699295341969, "grad_min_sv": 3.193107374344084e-09, "grad_condition": 54362425.00069554, "lr": 1.8418716601170932e-05, "time_sec": 83.76650714874268 }, { "epoch": 138, "train_loss": 4.222578598480225, "train_acc": 0.05248, "test_loss": 7.08011364440918, "test_acc": 0.01, "lyapunov": null, "grad_norm": 0.29305556036271213, "grad_max_sv": 0.1505037024617195, "grad_min_sv": 3.2047648587836542e-09, "grad_condition": 326741808.1820611, "lr": 1.570841943568445e-05, "time_sec": 83.7816994190216 }, { "epoch": 139, "train_loss": 4.218749967193603, "train_acc": 0.05366, "test_loss": 7.0575081214904785, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.29397952766323676, "grad_max_sv": 0.148932196572423, "grad_min_sv": 3.2381111236823303e-09, "grad_condition": 52412171.837261274, "lr": 1.3210548563419845e-05, "time_sec": 83.8086462020874 }, { "epoch": 140, "train_loss": 4.217845681304931, "train_acc": 0.05502, "test_loss": 7.102373625946045, "test_acc": 0.0104, "lyapunov": null, "grad_norm": 0.2935367604869691, "grad_max_sv": 0.14902403093874456, "grad_min_sv": 3.2832004351335264e-09, "grad_condition": 52749321.36829077, "lr": 1.0926199633097203e-05, "time_sec": 83.79147672653198 }, { "epoch": 141, "train_loss": 4.214903557434082, "train_acc": 0.05414, "test_loss": 7.033845091247558, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.29612387661640516, "grad_max_sv": 0.15556762106716632, "grad_min_sv": 3.2642252397602213e-09, "grad_condition": 123272892.75406721, "lr": 8.856374635655688e-06, "time_sec": 83.81054306030273 }, { "epoch": 142, "train_loss": 4.215419233093262, "train_acc": 0.05478, "test_loss": 7.08431992111206, "test_acc": 0.0097, "lyapunov": null, "grad_norm": 0.29494037543034185, "grad_max_sv": 0.15155189596116542, "grad_min_sv": 3.2587884789964106e-09, "grad_condition": 76214087.81495127, "lr": 7.001981464747503e-06, "time_sec": 83.78057074546814 }, { "epoch": 143, "train_loss": 4.217841682281494, "train_acc": 0.05398, "test_loss": 7.037088000488281, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.2932160255751842, "grad_max_sv": 0.14940347485244274, "grad_min_sv": 3.258327102573233e-09, "grad_condition": 73149202.84067681, "lr": 5.3638335185058295e-06, "time_sec": 83.79549980163574 }, { "epoch": 144, "train_loss": 4.215883382873535, "train_acc": 0.0537, "test_loss": 7.091348276519775, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.2950445450440956, "grad_max_sv": 0.153789921104908, "grad_min_sv": 3.312160905266648e-09, "grad_condition": 52811849.90694652, "lr": 3.942649342761114e-06, "time_sec": 83.8086678981781 }, { "epoch": 145, "train_loss": 4.2175880349731445, "train_acc": 0.05522, "test_loss": 7.115469957733154, "test_acc": 0.0098, "lyapunov": null, "grad_norm": 0.29403172002116806, "grad_max_sv": 0.15080158710479735, "grad_min_sv": 3.237252350907216e-09, "grad_condition": 52283776.27412096, "lr": 2.7390523158633524e-06, "time_sec": 83.78764986991882 }, { "epoch": 146, "train_loss": 4.211100564270019, "train_acc": 0.05546, "test_loss": 7.0454746505737305, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.2953687426258213, "grad_max_sv": 0.1488959614187479, "grad_min_sv": 3.3052532932842382e-09, "grad_condition": 57195017.16791941, "lr": 1.7535703752478133e-06, "time_sec": 83.81411933898926 }, { "epoch": 147, "train_loss": 4.215898538208008, "train_acc": 0.0547, "test_loss": 7.0791287528991695, "test_acc": 0.0099, "lyapunov": null, "grad_norm": 0.29507184047055474, "grad_max_sv": 0.1496420454233885, "grad_min_sv": 3.2882809359756003e-09, "grad_condition": 440797367.90569246, "lr": 9.866357858642196e-07, "time_sec": 83.83466935157776 }, { "epoch": 148, "train_loss": 4.21191631515503, "train_acc": 0.05502, "test_loss": 6.993793771362305, "test_acc": 0.0102, "lyapunov": null, "grad_norm": 0.29572223257711466, "grad_max_sv": 0.1509379804134369, "grad_min_sv": 3.2624034737582796e-09, "grad_condition": 53696330.15699832, "lr": 4.38584950570808e-07, "time_sec": 83.83085513114929 }, { "epoch": 149, "train_loss": 4.214856278686524, "train_acc": 0.05504, "test_loss": 7.080280429077148, "test_acc": 0.0103, "lyapunov": null, "grad_norm": 0.29551682436364557, "grad_max_sv": 0.1497094627469778, "grad_min_sv": 3.273750590060409e-09, "grad_condition": 73934031.32038581, "lr": 1.096582625772501e-07, "time_sec": 83.84602665901184 }, { "epoch": 150, "train_loss": 4.2193192990112305, "train_acc": 0.0535, "test_loss": 7.083986274719238, "test_acc": 0.0101, "lyapunov": null, "grad_norm": 0.2957722763250381, "grad_max_sv": 0.15103124249726535, "grad_min_sv": 3.2879624276699325e-09, "grad_condition": 65137818.05484857, "lr": 0.0, "time_sec": 83.81010937690735 } ] }, "lyapunov": { "4": [ { "epoch": 1, "train_loss": 8.745512613220216, "train_acc": 0.02574, "test_loss": 4.55846024017334, "test_acc": 0.0339, "lyapunov": 3.2288631459941035, "grad_norm": 7.160399518281865, "grad_max_sv": 5.050605493783951, "grad_min_sv": 1.0948114780862107e-07, "grad_condition": 174574426.40620375, "lr": 0.0009998903417374227, "time_sec": 38.78080153465271 }, { "epoch": 2, "train_loss": 6.857188781433106, "train_acc": 0.03116, "test_loss": 4.409567827606201, "test_acc": 0.0498, "lyapunov": 2.566672464160968, "grad_norm": 4.581532406245075, "grad_max_sv": 3.4727421343326568, "grad_min_sv": 6.695858347782747e-08, "grad_condition": 100510712.5879864, "lr": 0.0009995614150494292, "time_sec": 38.758466482162476 }, { "epoch": 3, "train_loss": 6.406850777893067, "train_acc": 0.03836, "test_loss": 4.3329737182617185, "test_acc": 0.0541, "lyapunov": 2.4151331805207237, "grad_norm": 2.8463282070399885, "grad_max_sv": 2.2940395712852477, "grad_min_sv": 3.7823234264044994e-08, "grad_condition": 106198851.94331202, "lr": 0.0009990133642141358, "time_sec": 38.77664065361023 }, { "epoch": 4, "train_loss": 6.1679999932861325, "train_acc": 0.04216, "test_loss": 4.314407443237305, "test_acc": 0.0539, "lyapunov": 2.324155716030189, "grad_norm": 1.4958218707983646, "grad_max_sv": 1.126097397506237, "grad_min_sv": 1.8212272229894964e-08, "grad_condition": 178099339.46093446, "lr": 0.0009982464296247522, "time_sec": 38.772703409194946 }, { "epoch": 5, "train_loss": 6.023621784973145, "train_acc": 0.04472, "test_loss": 4.327248037719727, "test_acc": 0.0523, "lyapunov": 2.24559463046091, "grad_norm": 0.8361636453752828, "grad_max_sv": 0.5582518823444843, "grad_min_sv": 9.160982232525595e-09, "grad_condition": 218277432.54054898, "lr": 0.0009972609476841367, "time_sec": 38.792168855667114 }, { "epoch": 6, "train_loss": 5.923550573730469, "train_acc": 0.03788, "test_loss": 4.373689149475098, "test_acc": 0.0448, "lyapunov": 2.143530731615813, "grad_norm": 0.6125747823801606, "grad_max_sv": 0.3806876644492149, "grad_min_sv": 4.764090941352089e-09, "grad_condition": 2115444033.3075993, "lr": 0.000996057350657239, "time_sec": 38.80649399757385 }, { "epoch": 7, "train_loss": 5.819468310699463, "train_acc": 0.03402, "test_loss": 4.396667736816406, "test_acc": 0.0409, "lyapunov": 2.047879105028899, "grad_norm": 0.5012166631957408, "grad_max_sv": 0.29988972246646883, "grad_min_sv": 2.6462318619344118e-09, "grad_condition": 1674717584.2678788, "lr": 0.000994636166481494, "time_sec": 38.8136990070343 }, { "epoch": 8, "train_loss": 5.776593683929443, "train_acc": 0.02754, "test_loss": 4.459617399597168, "test_acc": 0.0288, "lyapunov": 1.982207260168422, "grad_norm": 0.48582047366784137, "grad_max_sv": 0.2761614330112934, "grad_min_sv": 2.1785290433868222e-10, "grad_condition": 40862120030.312584, "lr": 0.0009929980185352525, "time_sec": 38.845232248306274 }, { "epoch": 9, "train_loss": 5.781761088104248, "train_acc": 0.0231, "test_loss": 4.675199285888672, "test_acc": 0.0029, "lyapunov": 1.954250096360131, "grad_norm": 0.46266769063149876, "grad_max_sv": 0.2622381761670113, "grad_min_sv": 5.480658221434448e-10, "grad_condition": 100986477853.47366, "lr": 0.0009911436253643444, "time_sec": 38.80020809173584 }, { "epoch": 10, "train_loss": 5.8479565664672855, "train_acc": 0.01186, "test_loss": 4.6061001365661625, "test_acc": 0.01, "lyapunov": 1.9396185356637705, "grad_norm": 0.261511927042467, "grad_max_sv": 0.09869588532019406, "grad_min_sv": 2.728127020095826e-13, "grad_condition": 88878548722.67065, "lr": 0.0009890738003669028, "time_sec": 38.743908405303955 }, { "epoch": 11, "train_loss": 5.8408165109252925, "train_acc": 0.01034, "test_loss": 4.6082617340087895, "test_acc": 0.01, "lyapunov": 1.9296608300465148, "grad_norm": 0.2344195135575755, "grad_max_sv": 0.08715516603551805, "grad_min_sv": 2.4710747756651273e-15, "grad_condition": 86872648368.75877, "lr": 0.00098678945143658, "time_sec": 38.751142263412476 }, { "epoch": 12, "train_loss": 5.84793187210083, "train_acc": 0.00954, "test_loss": 4.6062534797668455, "test_acc": 0.01, "lyapunov": 1.932467032881344, "grad_norm": 0.24986425241000795, "grad_max_sv": 0.07697397316806018, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 76973973168.06018, "lr": 0.0009842915805643154, "time_sec": 38.75897789001465 }, { "epoch": 13, "train_loss": 5.845315325927734, "train_acc": 0.01, "test_loss": 4.606490065002442, "test_acc": 0.01, "lyapunov": 1.9308954513896153, "grad_norm": 0.2234501732158856, "grad_max_sv": 0.07171829692088068, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 71718296920.88069, "lr": 0.000981581283398829, "time_sec": 38.77409482002258 }, { "epoch": 14, "train_loss": 5.844472907714843, "train_acc": 0.00932, "test_loss": 4.611052139282227, "test_acc": 0.01, "lyapunov": 1.9302553133586484, "grad_norm": 0.2546366793913816, "grad_max_sv": 0.0627493538428098, "grad_min_sv": 5.442503105591157e-42, "grad_condition": 62749353842.80979, "lr": 0.0009786597487660333, "time_sec": 38.75410294532776 }, { "epoch": 15, "train_loss": 5.839373329620361, "train_acc": 0.01012, "test_loss": 4.605493424987793, "test_acc": 0.01, "lyapunov": 1.9264278128323957, "grad_norm": 0.33195464165742516, "grad_max_sv": 0.0596250070258975, "grad_min_sv": 1.1532839803575087e-39, "grad_condition": 59625007025.89751, "lr": 0.0009755282581475766, "time_sec": 38.737260818481445 }, { "epoch": 16, "train_loss": 5.840845001983642, "train_acc": 0.01006, "test_loss": 4.606367964935303, "test_acc": 0.01, "lyapunov": 1.9284262577895923, "grad_norm": 0.41972925674223915, "grad_max_sv": 0.04947211216203869, "grad_min_sv": 0.0, "grad_condition": 49472112162.03868, "lr": 0.0009721881851187403, "time_sec": 38.72240591049194 }, { "epoch": 17, "train_loss": 5.838009662322998, "train_acc": 0.01014, "test_loss": 4.607442309570312, "test_acc": 0.01, "lyapunov": 1.927741524203659, "grad_norm": 0.41171422252176765, "grad_max_sv": 0.06055757296271622, "grad_min_sv": 6.063498673792123e-17, "grad_condition": 60551208649.85646, "lr": 0.0009686409947459456, "time_sec": 38.7178897857666 }, { "epoch": 18, "train_loss": 5.8419268412780765, "train_acc": 0.00974, "test_loss": 4.605891960144043, "test_acc": 0.01, "lyapunov": 1.9291500267775163, "grad_norm": 0.3483236145113203, "grad_max_sv": 0.03731603529304266, "grad_min_sv": 6.04933030713951e-30, "grad_condition": 37316035293.042656, "lr": 0.0009648882429441254, "time_sec": 38.760350704193115 }, { "epoch": 19, "train_loss": 5.826735510559082, "train_acc": 0.01202, "test_loss": 4.605664205932618, "test_acc": 0.01, "lyapunov": 1.9298754738419868, "grad_norm": 0.3207639814137615, "grad_max_sv": 0.06981198373250663, "grad_min_sv": 1.9222199366026642e-14, "grad_condition": 67062140845.185585, "lr": 0.00096093157579425, "time_sec": 38.76730132102966 }, { "epoch": 20, "train_loss": 5.84202998046875, "train_acc": 0.00976, "test_loss": 4.606653337097168, "test_acc": 0.01, "lyapunov": 1.9302551270750783, "grad_norm": 0.20194476347748866, "grad_max_sv": 0.03701699019875378, "grad_min_sv": 0.0, "grad_condition": 37016990198.75377, "lr": 0.0009567727288213001, "time_sec": 38.725250244140625 }, { "epoch": 21, "train_loss": 5.84192676071167, "train_acc": 0.00982, "test_loss": 4.614536486816406, "test_acc": 0.01, "lyapunov": 1.9300702325523358, "grad_norm": 0.2358565070101103, "grad_max_sv": 0.033911947428714485, "grad_min_sv": 0.0, "grad_condition": 33911947428.714485, "lr": 0.0009524135262330095, "time_sec": 38.72857594490051 }, { "epoch": 22, "train_loss": 5.839627782592774, "train_acc": 0.00992, "test_loss": 4.606048239898682, "test_acc": 0.01, "lyapunov": 1.9269078469947172, "grad_norm": 0.17845225075047805, "grad_max_sv": 0.025568678742274642, "grad_min_sv": 0.0, "grad_condition": 25568678742.274643, "lr": 0.0009478558801197061, "time_sec": 38.68861746788025 }, { "epoch": 23, "train_loss": 5.838393308258056, "train_acc": 0.00958, "test_loss": 4.586302839660645, "test_acc": 0.0188, "lyapunov": 1.9266618383510032, "grad_norm": 0.13466647962688946, "grad_max_sv": 0.01349067515693605, "grad_min_sv": 0.0, "grad_condition": 13490675156.936049, "lr": 0.000943101789615607, "time_sec": 38.702245473861694 }, { "epoch": 24, "train_loss": 5.835893999938965, "train_acc": 0.0103, "test_loss": 4.605248524475098, "test_acc": 0.01, "lyapunov": 1.9250504610788486, "grad_norm": 0.1306925374207253, "grad_max_sv": 0.021706052590161562, "grad_min_sv": 4.2115888976736585e-17, "grad_condition": 21702749025.936443, "lr": 0.0009381533400219313, "time_sec": 38.70141124725342 }, { "epoch": 25, "train_loss": 5.839240811767578, "train_acc": 0.00906, "test_loss": 4.605221250915528, "test_acc": 0.01, "lyapunov": 1.9273294420803295, "grad_norm": 0.12078726665544544, "grad_max_sv": 0.010838619247078896, "grad_min_sv": 0.0, "grad_condition": 10838619247.078896, "lr": 0.0009330127018922189, "time_sec": 38.68912363052368 }, { "epoch": 26, "train_loss": 5.832334176635742, "train_acc": 0.00902, "test_loss": 4.605214032745361, "test_acc": 0.01, "lyapunov": 1.92168139923564, "grad_norm": 0.11780855950452304, "grad_max_sv": 0.012504769628867507, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 12504769628.867508, "lr": 0.000927682130080253, "time_sec": 38.69681906700134 }, { "epoch": 27, "train_loss": 5.832823591003418, "train_acc": 0.00856, "test_loss": 4.605198753356934, "test_acc": 0.01, "lyapunov": 1.9220849495104817, "grad_norm": 0.1307395775308225, "grad_max_sv": 0.00955222793854773, "grad_min_sv": 0.0, "grad_condition": 9552227938.54773, "lr": 0.0009221639627510072, "time_sec": 38.67968559265137 }, { "epoch": 28, "train_loss": 5.8319349609375, "train_acc": 0.00908, "test_loss": 4.60519333190918, "test_acc": 0.01, "lyapunov": 1.9214767400565964, "grad_norm": 0.11312977194763361, "grad_max_sv": 0.007689819484949112, "grad_min_sv": 0.0, "grad_condition": 7689819484.949112, "lr": 0.0009164606203550494, "time_sec": 38.693461418151855 }, { "epoch": 29, "train_loss": 5.832658680419922, "train_acc": 0.0089, "test_loss": 4.605188513946533, "test_acc": 0.01, "lyapunov": 1.9219111963306241, "grad_norm": 0.1139488031414971, "grad_max_sv": 0.009555681003257632, "grad_min_sv": 0.0, "grad_condition": 9555681003.257633, "lr": 0.0009105746045668516, "time_sec": 38.88858246803284 }, { "epoch": 30, "train_loss": 5.8301619506835936, "train_acc": 0.00936, "test_loss": 4.605182504272461, "test_acc": 0.01, "lyapunov": 1.9200728305465424, "grad_norm": 0.10113831163550316, "grad_max_sv": 0.004735648166388273, "grad_min_sv": 0.0, "grad_condition": 4735648166.388273, "lr": 0.0009045084971874733, "time_sec": 38.682101011276245 }, { "epoch": 31, "train_loss": 5.832088593292236, "train_acc": 0.00848, "test_loss": 4.60520027999878, "test_acc": 0.01, "lyapunov": 1.921536988309582, "grad_norm": 0.11928153797201548, "grad_max_sv": 0.005120814079418778, "grad_min_sv": 0.0, "grad_condition": 5120814079.418779, "lr": 0.0008982649590120977, "time_sec": 38.66986131668091 }, { "epoch": 32, "train_loss": 5.830597168426514, "train_acc": 0.009, "test_loss": 4.605257048797608, "test_acc": 0.01, "lyapunov": 1.9206426658898668, "grad_norm": 0.09874780482605999, "grad_max_sv": 0.0029883835930377247, "grad_min_sv": 0.0, "grad_condition": 2988383593.0377245, "lr": 0.0008918467286629196, "time_sec": 38.69553232192993 }, { "epoch": 33, "train_loss": 5.829611896514892, "train_acc": 0.00884, "test_loss": 4.60517430267334, "test_acc": 0.01, "lyapunov": 1.9195137139781357, "grad_norm": 0.09972362630787891, "grad_max_sv": 0.00664278594776988, "grad_min_sv": 0.0, "grad_condition": 6642785947.76988, "lr": 0.0008852566213878943, "time_sec": 38.67990040779114 }, { "epoch": 34, "train_loss": 5.828044633636474, "train_acc": 0.0083, "test_loss": 4.605173886871338, "test_acc": 0.01, "lyapunov": 1.918492463848475, "grad_norm": 0.0974792016961528, "grad_max_sv": 0.001599628059193492, "grad_min_sv": 0.0, "grad_condition": 1599628059.193492, "lr": 0.000878497527825878, "time_sec": 38.68664336204529 }, { "epoch": 35, "train_loss": 5.830746371154786, "train_acc": 0.00894, "test_loss": 4.6051726875305175, "test_acc": 0.01, "lyapunov": 1.920728165475304, "grad_norm": 0.0938240145066066, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000871572412738697, "time_sec": 38.67132115364075 }, { "epoch": 36, "train_loss": 5.829937998809815, "train_acc": 0.00866, "test_loss": 4.605172854614258, "test_acc": 0.01, "lyapunov": 1.920135024868314, "grad_norm": 0.09205400750487011, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107055, "time_sec": 38.64905834197998 }, { "epoch": 37, "train_loss": 5.829817896728516, "train_acc": 0.00818, "test_loss": 4.6051733100891115, "test_acc": 0.01, "lyapunov": 1.9200208934066851, "grad_norm": 0.09228371311542864, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008572363398164014, "time_sec": 38.657002210617065 }, { "epoch": 38, "train_loss": 5.831039802246094, "train_acc": 0.0088, "test_loss": 4.6051726837158204, "test_acc": 0.01, "lyapunov": 1.9210114238207296, "grad_norm": 0.09181178733619569, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008498316702566826, "time_sec": 38.66207027435303 }, { "epoch": 39, "train_loss": 5.829483923492432, "train_acc": 0.00886, "test_loss": 4.605172607421875, "test_acc": 0.01, "lyapunov": 1.919772486552558, "grad_norm": 0.09053836987454536, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008422735529643442, "time_sec": 38.67074227333069 }, { "epoch": 40, "train_loss": 5.829308145904541, "train_acc": 0.00862, "test_loss": 4.605172937774658, "test_acc": 0.01, "lyapunov": 1.9195958787522962, "grad_norm": 0.09302966072405643, "grad_max_sv": 0.0028064717072993515, "grad_min_sv": 0.0, "grad_condition": 2806471707.2993517, "lr": 0.0008345653031794289, "time_sec": 38.66209268569946 }, { "epoch": 41, "train_loss": 5.828913317565918, "train_acc": 0.00894, "test_loss": 4.605173394775391, "test_acc": 0.01, "lyapunov": 1.9192491733204677, "grad_norm": 0.09010018258992165, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008267103019950526, "time_sec": 38.68193006515503 }, { "epoch": 42, "train_loss": 5.83203209274292, "train_acc": 0.0089, "test_loss": 4.6051725547790525, "test_acc": 0.01, "lyapunov": 1.9218718840947846, "grad_norm": 0.09554864716201418, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743447, "time_sec": 38.67262053489685 }, { "epoch": 43, "train_loss": 5.836768571929932, "train_acc": 0.00868, "test_loss": 4.605172836303711, "test_acc": 0.01, "lyapunov": 1.9252831368800014, "grad_norm": 0.11288803301983473, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000810573890139155, "time_sec": 38.673030853271484 }, { "epoch": 44, "train_loss": 5.830244238128662, "train_acc": 0.00862, "test_loss": 4.605172270202637, "test_acc": 0.01, "lyapunov": 1.9203159440204005, "grad_norm": 0.09075156234022023, "grad_max_sv": 0.0006292640697211027, "grad_min_sv": 0.0, "grad_condition": 629264069.7211027, "lr": 0.0008022995574311873, "time_sec": 38.67639136314392 }, { "epoch": 45, "train_loss": 5.831813296051026, "train_acc": 0.00798, "test_loss": 4.605172733306885, "test_acc": 0.01, "lyapunov": 1.9216700673408216, "grad_norm": 0.09800318179113622, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462363, "time_sec": 38.66922402381897 }, { "epoch": 46, "train_loss": 5.829525221710205, "train_acc": 0.0088, "test_loss": 4.605172639465332, "test_acc": 0.01, "lyapunov": 1.9197535209948449, "grad_norm": 0.09607771134569527, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007853567838422158, "time_sec": 38.6734299659729 }, { "epoch": 47, "train_loss": 5.831378362731933, "train_acc": 0.00896, "test_loss": 4.605172109985352, "test_acc": 0.01, "lyapunov": 1.9213088927671427, "grad_norm": 0.09002095025572443, "grad_max_sv": 0.0022390282712876795, "grad_min_sv": 0.0, "grad_condition": 2239028271.2876797, "lr": 0.0007766957746216719, "time_sec": 38.681992530822754 }, { "epoch": 48, "train_loss": 5.8296267512512205, "train_acc": 0.00852, "test_loss": 4.605172399902344, "test_acc": 0.01, "lyapunov": 1.9198472441919625, "grad_norm": 0.08948131522401738, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894982, "time_sec": 38.69184613227844 }, { "epoch": 49, "train_loss": 5.82939344329834, "train_acc": 0.009, "test_loss": 4.6051721862792965, "test_acc": 0.01, "lyapunov": 1.919716474345273, "grad_norm": 0.08962129117217822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000759013504686565, "time_sec": 38.66769075393677 }, { "epoch": 50, "train_loss": 5.829856867675781, "train_acc": 0.00824, "test_loss": 4.605171932983398, "test_acc": 0.01, "lyapunov": 1.9200777041027919, "grad_norm": 0.08949650095695762, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007499999999999998, "time_sec": 38.6767897605896 }, { "epoch": 51, "train_loss": 5.831189596557617, "train_acc": 0.00886, "test_loss": 4.605172845458984, "test_acc": 0.01, "lyapunov": 1.9211604323838374, "grad_norm": 0.08928877604280225, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508575, "time_sec": 38.669432640075684 }, { "epoch": 52, "train_loss": 5.827941221618652, "train_acc": 0.00906, "test_loss": 4.605172493743897, "test_acc": 0.01, "lyapunov": 1.9184872210787995, "grad_norm": 0.08912832082902897, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007316480175599307, "time_sec": 38.65984392166138 }, { "epoch": 53, "train_loss": 5.829616719360351, "train_acc": 0.00856, "test_loss": 4.6051721878051755, "test_acc": 0.01, "lyapunov": 1.9199278674772025, "grad_norm": 0.08891740863163855, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007223175895924635, "time_sec": 38.684584856033325 }, { "epoch": 54, "train_loss": 5.828832433013916, "train_acc": 0.00888, "test_loss": 4.605171940612793, "test_acc": 0.01, "lyapunov": 1.9193241215118058, "grad_norm": 0.08862714787237397, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 38.6649751663208 }, { "epoch": 55, "train_loss": 5.829295374145508, "train_acc": 0.00864, "test_loss": 4.6051718048095704, "test_acc": 0.01, "lyapunov": 1.9196355620308605, "grad_norm": 0.08936964720805882, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007033683215378998, "time_sec": 38.66834211349487 }, { "epoch": 56, "train_loss": 5.831980644836426, "train_acc": 0.00872, "test_loss": 4.605172239685059, "test_acc": 0.01, "lyapunov": 1.9218218890602325, "grad_norm": 0.08828331902779529, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 38.67644000053406 }, { "epoch": 57, "train_loss": 5.8291939093017575, "train_acc": 0.00898, "test_loss": 4.605171894836426, "test_acc": 0.01, "lyapunov": 1.9195057918958347, "grad_norm": 0.08970762017367405, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423388, "time_sec": 38.66079378128052 }, { "epoch": 58, "train_loss": 5.826841032867431, "train_acc": 0.0085, "test_loss": 4.605172017669678, "test_acc": 0.01, "lyapunov": 1.9176025924170415, "grad_norm": 0.09048223717877525, "grad_max_sv": 0.0014875998720526695, "grad_min_sv": 0.0, "grad_condition": 1487599872.0526695, "lr": 0.0006742860236609073, "time_sec": 38.66658973693848 }, { "epoch": 59, "train_loss": 5.835019799499512, "train_acc": 0.00882, "test_loss": 4.60517190322876, "test_acc": 0.01, "lyapunov": 1.9238726757371518, "grad_norm": 0.09441160205385561, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006644333233692913, "time_sec": 38.67969727516174 }, { "epoch": 60, "train_loss": 5.830721065979004, "train_acc": 0.00836, "test_loss": 4.605171463012695, "test_acc": 0.01, "lyapunov": 1.9208579142685132, "grad_norm": 0.08921306700093072, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874734, "time_sec": 38.663196325302124 }, { "epoch": 61, "train_loss": 5.829596945648193, "train_acc": 0.00828, "test_loss": 4.605171449279785, "test_acc": 0.01, "lyapunov": 1.9199584844472157, "grad_norm": 0.08848056161918356, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006445158984722354, "time_sec": 38.68021297454834 }, { "epoch": 62, "train_loss": 5.830569870300293, "train_acc": 0.00824, "test_loss": 4.605171228790283, "test_acc": 0.01, "lyapunov": 1.9206647436941982, "grad_norm": 0.08839721397975912, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 38.675719022750854 }, { "epoch": 63, "train_loss": 5.8305546853637695, "train_acc": 0.00854, "test_loss": 4.605172233581543, "test_acc": 0.01, "lyapunov": 1.9206541834584892, "grad_norm": 0.08903578043587344, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 38.658900022506714 }, { "epoch": 64, "train_loss": 5.836477585449218, "train_acc": 0.00876, "test_loss": 4.605171844482422, "test_acc": 0.01, "lyapunov": 1.9251100108446673, "grad_norm": 0.09951449127834824, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 38.67370843887329 }, { "epoch": 65, "train_loss": 5.830157748260498, "train_acc": 0.00854, "test_loss": 4.605171319580078, "test_acc": 0.01, "lyapunov": 1.920334783661396, "grad_norm": 0.09108085096662916, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006039558454088793, "time_sec": 38.67955160140991 }, { "epoch": 66, "train_loss": 5.828997611694336, "train_acc": 0.00866, "test_loss": 4.605171671295166, "test_acc": 0.01, "lyapunov": 1.919463188751884, "grad_norm": 0.08904439645709107, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 38.67839956283569 }, { "epoch": 67, "train_loss": 5.830838754272461, "train_acc": 0.00868, "test_loss": 4.605171606445312, "test_acc": 0.01, "lyapunov": 1.9207777364174727, "grad_norm": 0.09755498438636814, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 38.67587614059448 }, { "epoch": 68, "train_loss": 5.827152337646484, "train_acc": 0.00928, "test_loss": 4.605171282958985, "test_acc": 0.01, "lyapunov": 1.9178936585136082, "grad_norm": 0.08799438562008605, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005730415142812054, "time_sec": 38.67634415626526 }, { "epoch": 69, "train_loss": 5.830286772155762, "train_acc": 0.0096, "test_loss": 4.605171063232422, "test_acc": 0.01, "lyapunov": 1.9204461242231872, "grad_norm": 0.09070089337302271, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 38.678497076034546 }, { "epoch": 70, "train_loss": 5.832680291290283, "train_acc": 0.0098, "test_loss": 4.605171459197998, "test_acc": 0.01, "lyapunov": 1.9224533403621, "grad_norm": 0.08827257843406246, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005522642316338265, "time_sec": 38.66450572013855 }, { "epoch": 71, "train_loss": 5.830269169921875, "train_acc": 0.00836, "test_loss": 4.605171234130859, "test_acc": 0.01, "lyapunov": 1.9205291399260616, "grad_norm": 0.08807564726395264, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005418389216661573, "time_sec": 38.656336545944214 }, { "epoch": 72, "train_loss": 5.830037397460938, "train_acc": 0.00858, "test_loss": 4.605171022033692, "test_acc": 0.01, "lyapunov": 1.9203362114289229, "grad_norm": 0.08760409668351568, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646563, "time_sec": 38.68950128555298 }, { "epoch": 73, "train_loss": 5.83207408782959, "train_acc": 0.00862, "test_loss": 4.605171083068847, "test_acc": 0.01, "lyapunov": 1.922044792138707, "grad_norm": 0.08837012490740455, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005209378268645994, "time_sec": 38.678892612457275 }, { "epoch": 74, "train_loss": 5.830842367553711, "train_acc": 0.00886, "test_loss": 4.6051713088989255, "test_acc": 0.01, "lyapunov": 1.9209648620746935, "grad_norm": 0.0881334492267735, "grad_max_sv": 0.0016617819666862488, "grad_min_sv": 0.0, "grad_condition": 1661781966.6862488, "lr": 0.0005104712099416781, "time_sec": 38.66536831855774 }, { "epoch": 75, "train_loss": 5.831041750488281, "train_acc": 0.00846, "test_loss": 4.605171099853516, "test_acc": 0.01, "lyapunov": 1.9211621680832884, "grad_norm": 0.08829717661983798, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 38.674325704574585 }, { "epoch": 76, "train_loss": 5.836333667144776, "train_acc": 0.00864, "test_loss": 4.605171186065673, "test_acc": 0.01, "lyapunov": 1.9246098906792644, "grad_norm": 0.11366095758738136, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 38.687448501586914 }, { "epoch": 77, "train_loss": 5.835334293212891, "train_acc": 0.0089, "test_loss": 4.6051709121704105, "test_acc": 0.01, "lyapunov": 1.9234618140608453, "grad_norm": 0.10831693857812812, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004790621731353997, "time_sec": 38.65811228752136 }, { "epoch": 78, "train_loss": 5.827478051452637, "train_acc": 0.00882, "test_loss": 4.605171005249024, "test_acc": 0.01, "lyapunov": 1.9182067341206934, "grad_norm": 0.08781347391325668, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 38.676063537597656 }, { "epoch": 79, "train_loss": 5.8290468742370605, "train_acc": 0.00886, "test_loss": 4.605171278381348, "test_acc": 0.01, "lyapunov": 1.919505515671752, "grad_norm": 0.08854207911135165, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 38.673518896102905 }, { "epoch": 80, "train_loss": 5.833914941253662, "train_acc": 0.0089, "test_loss": 4.605170984649658, "test_acc": 0.01, "lyapunov": 1.9234306675088986, "grad_norm": 0.09381991898821151, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 38.672255754470825 }, { "epoch": 81, "train_loss": 5.829356372680664, "train_acc": 0.00902, "test_loss": 4.605171099853516, "test_acc": 0.01, "lyapunov": 1.919769955413116, "grad_norm": 0.08816368922697575, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 38.67954111099243 }, { "epoch": 82, "train_loss": 5.831741758117675, "train_acc": 0.00918, "test_loss": 4.605171073913574, "test_acc": 0.01, "lyapunov": 1.921732059525102, "grad_norm": 0.09264254493603952, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004269584857187939, "time_sec": 38.673032999038696 }, { "epoch": 83, "train_loss": 5.834408538513183, "train_acc": 0.0092, "test_loss": 4.605170977020264, "test_acc": 0.01, "lyapunov": 1.9238771880069352, "grad_norm": 0.08953937527623661, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004166156266419484, "time_sec": 38.68673372268677 }, { "epoch": 84, "train_loss": 5.830432665252686, "train_acc": 0.009, "test_loss": 4.605170909118653, "test_acc": 0.01, "lyapunov": 1.920691382854491, "grad_norm": 0.08848473612958971, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 38.663509130477905 }, { "epoch": 85, "train_loss": 5.83150433013916, "train_acc": 0.00862, "test_loss": 4.605170706176758, "test_acc": 0.01, "lyapunov": 1.921521064875376, "grad_norm": 0.0878123084846611, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003960441545911199, "time_sec": 38.6465003490448 }, { "epoch": 86, "train_loss": 5.831791127319336, "train_acc": 0.00896, "test_loss": 4.605170570373535, "test_acc": 0.01, "lyapunov": 1.9217873232443925, "grad_norm": 0.0877757716455608, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 38.6744065284729 }, { "epoch": 87, "train_loss": 5.832627346191407, "train_acc": 0.00878, "test_loss": 4.605170877075195, "test_acc": 0.01, "lyapunov": 1.9224827862761515, "grad_norm": 0.08827499584565024, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 38.66921091079712 }, { "epoch": 88, "train_loss": 5.8317487963867185, "train_acc": 0.00824, "test_loss": 4.605170699310302, "test_acc": 0.01, "lyapunov": 1.921761295984468, "grad_norm": 0.08846045903994489, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 38.67842221260071 }, { "epoch": 89, "train_loss": 5.8302451986694335, "train_acc": 0.00862, "test_loss": 4.605170578765869, "test_acc": 0.01, "lyapunov": 1.9205519287177668, "grad_norm": 0.0880969562704879, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 38.66373419761658 }, { "epoch": 90, "train_loss": 5.828649435424805, "train_acc": 0.00928, "test_loss": 4.605170637512207, "test_acc": 0.01, "lyapunov": 1.919257033816384, "grad_norm": 0.08878565745159492, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 38.68431329727173 }, { "epoch": 91, "train_loss": 5.830266084594727, "train_acc": 0.0087, "test_loss": 4.60517045211792, "test_acc": 0.01, "lyapunov": 1.920564612464222, "grad_norm": 0.0883222592119473, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 38.67736315727234 }, { "epoch": 92, "train_loss": 5.831894824829101, "train_acc": 0.00856, "test_loss": 4.605170608520508, "test_acc": 0.01, "lyapunov": 1.9219116762166133, "grad_norm": 0.08764554261224523, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 38.67611908912659 }, { "epoch": 93, "train_loss": 5.82894446182251, "train_acc": 0.00844, "test_loss": 4.6051702972412105, "test_acc": 0.01, "lyapunov": 1.9194979228631919, "grad_norm": 0.08833998566442527, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 38.69344687461853 }, { "epoch": 94, "train_loss": 5.837506525115967, "train_acc": 0.00874, "test_loss": 4.60517064819336, "test_acc": 0.01, "lyapunov": 1.9243434188920823, "grad_norm": 0.11393882739366498, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 38.68289828300476 }, { "epoch": 95, "train_loss": 5.831888694152832, "train_acc": 0.00764, "test_loss": 4.605170504760742, "test_acc": 0.01, "lyapunov": 1.9216798833568993, "grad_norm": 0.10076789355226513, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 38.68230414390564 }, { "epoch": 96, "train_loss": 5.839447547912598, "train_acc": 0.00876, "test_loss": 4.605170679473877, "test_acc": 0.01, "lyapunov": 1.9261463017719787, "grad_norm": 0.11376740734099834, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 38.6755793094635 }, { "epoch": 97, "train_loss": 5.828961611328125, "train_acc": 0.00828, "test_loss": 4.605170320129394, "test_acc": 0.01, "lyapunov": 1.9195098590363018, "grad_norm": 0.08840788709710101, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 38.676655769348145 }, { "epoch": 98, "train_loss": 5.829206983032226, "train_acc": 0.00852, "test_loss": 4.605170263671875, "test_acc": 0.01, "lyapunov": 1.9197069199188896, "grad_norm": 0.08784611697907319, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 38.679508209228516 }, { "epoch": 99, "train_loss": 5.830749737243653, "train_acc": 0.0086, "test_loss": 4.605170584106445, "test_acc": 0.01, "lyapunov": 1.9209906048786916, "grad_norm": 0.08837860643236768, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 38.6536865234375 }, { "epoch": 100, "train_loss": 5.833174273071289, "train_acc": 0.00912, "test_loss": 4.605170581054687, "test_acc": 0.01, "lyapunov": 1.923052377713001, "grad_norm": 0.0880219202195275, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 38.669525146484375 }, { "epoch": 101, "train_loss": 5.832474216003418, "train_acc": 0.00924, "test_loss": 4.605170333862305, "test_acc": 0.01, "lyapunov": 1.9223707411295312, "grad_norm": 0.088109218729273, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 38.68469524383545 }, { "epoch": 102, "train_loss": 5.832093044128418, "train_acc": 0.0085, "test_loss": 4.6051706710815425, "test_acc": 0.01, "lyapunov": 1.9221026568156678, "grad_norm": 0.08806360302850152, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 38.667779207229614 }, { "epoch": 103, "train_loss": 5.829613971557618, "train_acc": 0.00884, "test_loss": 4.605170641326905, "test_acc": 0.01, "lyapunov": 1.9200275365044088, "grad_norm": 0.08827372352248057, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 38.67877268791199 }, { "epoch": 104, "train_loss": 5.829403175201416, "train_acc": 0.0085, "test_loss": 4.605170069885254, "test_acc": 0.01, "lyapunov": 1.9198780102498085, "grad_norm": 0.08759321728417062, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 38.67757058143616 }, { "epoch": 105, "train_loss": 5.83223681137085, "train_acc": 0.00838, "test_loss": 4.605170602416992, "test_acc": 0.01, "lyapunov": 1.922215115993529, "grad_norm": 0.08796326905677253, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 38.667465925216675 }, { "epoch": 106, "train_loss": 5.833028655090332, "train_acc": 0.00824, "test_loss": 4.605170317840576, "test_acc": 0.01, "lyapunov": 1.92289487815574, "grad_norm": 0.08795960069436239, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 38.68554091453552 }, { "epoch": 107, "train_loss": 5.827796527557373, "train_acc": 0.00876, "test_loss": 4.605170085144043, "test_acc": 0.01, "lyapunov": 1.918589440453083, "grad_norm": 0.08772654367791473, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 38.68501615524292 }, { "epoch": 108, "train_loss": 5.82904862991333, "train_acc": 0.00916, "test_loss": 4.605170137023926, "test_acc": 0.01, "lyapunov": 1.9196739556539395, "grad_norm": 0.08791956109774068, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 38.68057060241699 }, { "epoch": 109, "train_loss": 5.830072443237305, "train_acc": 0.00772, "test_loss": 4.605170295715332, "test_acc": 0.01, "lyapunov": 1.9204182008953046, "grad_norm": 0.08807291337304174, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 38.66407561302185 }, { "epoch": 110, "train_loss": 5.830760421295166, "train_acc": 0.00882, "test_loss": 4.605170086669922, "test_acc": 0.01, "lyapunov": 1.9210344882267516, "grad_norm": 0.08829325644128909, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 38.66635870933533 }, { "epoch": 111, "train_loss": 5.844144050140381, "train_acc": 0.00756, "test_loss": 4.605170138549805, "test_acc": 0.01, "lyapunov": 1.9289683185879836, "grad_norm": 0.08860258635222626, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 38.67165184020996 }, { "epoch": 112, "train_loss": 5.830768748779297, "train_acc": 0.0085, "test_loss": 4.605170237731934, "test_acc": 0.01, "lyapunov": 1.9210170031813405, "grad_norm": 0.0882870971276682, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 38.67701458930969 }, { "epoch": 113, "train_loss": 5.8316661862182615, "train_acc": 0.00856, "test_loss": 4.605170329284668, "test_acc": 0.01, "lyapunov": 1.921789816883214, "grad_norm": 0.08856537933077034, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 38.66913890838623 }, { "epoch": 114, "train_loss": 5.83167002532959, "train_acc": 0.00886, "test_loss": 4.60517038269043, "test_acc": 0.01, "lyapunov": 1.9217432996501094, "grad_norm": 0.08829399946029161, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 38.68831920623779 }, { "epoch": 115, "train_loss": 5.829227747192383, "train_acc": 0.00872, "test_loss": 4.605170357513428, "test_acc": 0.01, "lyapunov": 1.9198200571567505, "grad_norm": 0.08820685400799948, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 38.898104667663574 }, { "epoch": 116, "train_loss": 5.826888065795899, "train_acc": 0.0084, "test_loss": 4.605169971466064, "test_acc": 0.01, "lyapunov": 1.9179128426724992, "grad_norm": 0.08799764957632915, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 38.664024114608765 }, { "epoch": 117, "train_loss": 5.833059454956055, "train_acc": 0.00838, "test_loss": 4.605170207214355, "test_acc": 0.01, "lyapunov": 1.9228876301699587, "grad_norm": 0.09229149137870292, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 38.66628289222717 }, { "epoch": 118, "train_loss": 5.834235620422363, "train_acc": 0.00838, "test_loss": 4.605170387268067, "test_acc": 0.01, "lyapunov": 1.9234702946889737, "grad_norm": 0.11393843809281681, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 38.67253303527832 }, { "epoch": 119, "train_loss": 5.836164589385986, "train_acc": 0.00878, "test_loss": 4.605170240783691, "test_acc": 0.01, "lyapunov": 1.9253446165558017, "grad_norm": 0.13051062587564605, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 38.675392627716064 }, { "epoch": 120, "train_loss": 5.833294369506836, "train_acc": 0.00902, "test_loss": 4.605170152282715, "test_acc": 0.01, "lyapunov": 1.9231391212214595, "grad_norm": 0.09107209306940374, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 38.68769383430481 }, { "epoch": 121, "train_loss": 5.830208008880615, "train_acc": 0.00872, "test_loss": 4.605169981384277, "test_acc": 0.01, "lyapunov": 1.920601219777256, "grad_norm": 0.08818902289292577, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 38.663066148757935 }, { "epoch": 122, "train_loss": 5.828988634338379, "train_acc": 0.00866, "test_loss": 4.6051700424194335, "test_acc": 0.01, "lyapunov": 1.9195775912545832, "grad_norm": 0.08827912521059493, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 38.66604161262512 }, { "epoch": 123, "train_loss": 5.8335463383483885, "train_acc": 0.0083, "test_loss": 4.605170326995849, "test_acc": 0.01, "lyapunov": 1.9230621321426937, "grad_norm": 0.09180967837607329, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 38.66097450256348 }, { "epoch": 124, "train_loss": 5.8313025344848635, "train_acc": 0.009, "test_loss": 4.605170251464844, "test_acc": 0.01, "lyapunov": 1.9215273033932347, "grad_norm": 0.0880278926594288, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 38.678382396698 }, { "epoch": 125, "train_loss": 5.829151732025147, "train_acc": 0.00856, "test_loss": 4.605170100402832, "test_acc": 0.01, "lyapunov": 1.9196982078844933, "grad_norm": 0.08802943628622184, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 38.651947021484375 }, { "epoch": 126, "train_loss": 5.828555057067871, "train_acc": 0.00854, "test_loss": 4.605170222473144, "test_acc": 0.01, "lyapunov": 1.9192795976043662, "grad_norm": 0.088302392455243, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 38.67385935783386 }, { "epoch": 127, "train_loss": 5.829820846405029, "train_acc": 0.00872, "test_loss": 4.605170227050781, "test_acc": 0.01, "lyapunov": 1.9203001791254029, "grad_norm": 0.0881103504591081, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 38.67335605621338 }, { "epoch": 128, "train_loss": 5.846653115692138, "train_acc": 0.00814, "test_loss": 4.605170144653321, "test_acc": 0.01, "lyapunov": 1.9271661183413338, "grad_norm": 0.12434413440967498, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 38.651455879211426 }, { "epoch": 129, "train_loss": 5.8315210632324215, "train_acc": 0.00858, "test_loss": 4.6051701629638675, "test_acc": 0.01, "lyapunov": 1.9216848407559992, "grad_norm": 0.09353770310247324, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 38.65707588195801 }, { "epoch": 130, "train_loss": 5.833166874389648, "train_acc": 0.00868, "test_loss": 4.605170000457764, "test_acc": 0.01, "lyapunov": 1.9230641779082511, "grad_norm": 0.08835242150848918, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 38.65906548500061 }, { "epoch": 131, "train_loss": 5.82969641418457, "train_acc": 0.00892, "test_loss": 4.60517036895752, "test_acc": 0.01, "lyapunov": 1.9201975795619017, "grad_norm": 0.08800100320314078, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 38.66576051712036 }, { "epoch": 132, "train_loss": 5.830922511901855, "train_acc": 0.00898, "test_loss": 4.605170082092285, "test_acc": 0.01, "lyapunov": 1.921166550472874, "grad_norm": 0.08780352004054458, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 38.67506122589111 }, { "epoch": 133, "train_loss": 5.830705413360596, "train_acc": 0.0089, "test_loss": 4.605170077514648, "test_acc": 0.01, "lyapunov": 1.9210232758461057, "grad_norm": 0.08765525433917719, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 38.66982293128967 }, { "epoch": 134, "train_loss": 5.828949987030029, "train_acc": 0.0092, "test_loss": 4.60517048034668, "test_acc": 0.01, "lyapunov": 1.9195570479268613, "grad_norm": 0.0878219052630613, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 38.658127784729004 }, { "epoch": 135, "train_loss": 5.832552122955322, "train_acc": 0.00898, "test_loss": 4.605170314025879, "test_acc": 0.01, "lyapunov": 1.922510105935509, "grad_norm": 0.08848585809638171, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 38.671475887298584 }, { "epoch": 136, "train_loss": 5.828762425842285, "train_acc": 0.00862, "test_loss": 4.605170394897461, "test_acc": 0.01, "lyapunov": 1.9194351151166364, "grad_norm": 0.08813677537771221, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 38.67206072807312 }, { "epoch": 137, "train_loss": 5.830585724487305, "train_acc": 0.0092, "test_loss": 4.605170066833496, "test_acc": 0.01, "lyapunov": 1.920962211725962, "grad_norm": 0.08822452447484254, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 38.67813777923584 }, { "epoch": 138, "train_loss": 5.8304260397338865, "train_acc": 0.0081, "test_loss": 4.605170138549805, "test_acc": 0.01, "lyapunov": 1.9208168641990409, "grad_norm": 0.08849509125868348, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 38.67507195472717 }, { "epoch": 139, "train_loss": 5.829665904846191, "train_acc": 0.00956, "test_loss": 4.60517013092041, "test_acc": 0.01, "lyapunov": 1.9201480406324576, "grad_norm": 0.08790362350901093, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 38.673912048339844 }, { "epoch": 140, "train_loss": 5.832476518859863, "train_acc": 0.00906, "test_loss": 4.6051704071044925, "test_acc": 0.01, "lyapunov": 1.9224549364250945, "grad_norm": 0.08802773683248163, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 38.67948055267334 }, { "epoch": 141, "train_loss": 5.830304007110596, "train_acc": 0.00992, "test_loss": 4.605170399475098, "test_acc": 0.01, "lyapunov": 1.920735996702443, "grad_norm": 0.0882868275030572, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 38.675227880477905 }, { "epoch": 142, "train_loss": 5.831250300292969, "train_acc": 0.00984, "test_loss": 4.605170373535156, "test_acc": 0.01, "lyapunov": 1.921463219710933, "grad_norm": 0.08794004853752245, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 38.70003008842468 }, { "epoch": 143, "train_loss": 5.832011743011474, "train_acc": 0.00878, "test_loss": 4.605170379638672, "test_acc": 0.01, "lyapunov": 1.9220852223808502, "grad_norm": 0.08842628454422183, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 38.69024062156677 }, { "epoch": 144, "train_loss": 5.829982127532959, "train_acc": 0.0097, "test_loss": 4.605170482635498, "test_acc": 0.01, "lyapunov": 1.9204687541708008, "grad_norm": 0.08841994345313893, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 38.6822247505188 }, { "epoch": 145, "train_loss": 5.831171199645996, "train_acc": 0.00958, "test_loss": 4.605170204162597, "test_acc": 0.01, "lyapunov": 1.9213833555845958, "grad_norm": 0.11341783409581589, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 38.68064069747925 }, { "epoch": 146, "train_loss": 5.832137032470703, "train_acc": 0.00976, "test_loss": 4.605170028686524, "test_acc": 0.01, "lyapunov": 1.9221693624925735, "grad_norm": 0.08798089094104568, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 38.68038535118103 }, { "epoch": 147, "train_loss": 5.83251281906128, "train_acc": 0.00974, "test_loss": 4.605170251464844, "test_acc": 0.01, "lyapunov": 1.9224824981616282, "grad_norm": 0.08796659107314206, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 38.673001766204834 }, { "epoch": 148, "train_loss": 5.829547540588379, "train_acc": 0.01, "test_loss": 4.60517032623291, "test_acc": 0.01, "lyapunov": 1.920109924757877, "grad_norm": 0.08826415625381624, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 38.669779539108276 }, { "epoch": 149, "train_loss": 5.830913259735107, "train_acc": 0.01, "test_loss": 4.605170252227783, "test_acc": 0.01, "lyapunov": 1.9211858764024037, "grad_norm": 0.08849620940008496, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 38.67606210708618 }, { "epoch": 150, "train_loss": 5.830235260314941, "train_acc": 0.01, "test_loss": 4.605170276641846, "test_acc": 0.01, "lyapunov": 1.9206774539654823, "grad_norm": 0.08822638497198837, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 38.67439675331116 } ], "8": [ { "epoch": 1, "train_loss": 11.062658223266602, "train_acc": 0.0191, "test_loss": 4.636551777648926, "test_acc": 0.0192, "lyapunov": 4.093391669070934, "grad_norm": 6.553327303351535, "grad_max_sv": 5.005066078901291, "grad_min_sv": 9.498946289543397e-08, "grad_condition": 96914448.49987349, "lr": 0.0009998903417374227, "time_sec": 81.60158228874207 }, { "epoch": 2, "train_loss": 7.894516683044434, "train_acc": 0.02232, "test_loss": 4.509155606079101, "test_acc": 0.0281, "lyapunov": 3.109319945430512, "grad_norm": 4.711594955608515, "grad_max_sv": 3.8599576711654664, "grad_min_sv": 5.844970047842041e-08, "grad_condition": 1689973621.6123517, "lr": 0.0009995614150494292, "time_sec": 81.60659170150757 }, { "epoch": 3, "train_loss": 7.597164999084472, "train_acc": 0.02292, "test_loss": 4.547392833709717, "test_acc": 0.0138, "lyapunov": 3.040807009353052, "grad_norm": 3.4020100363883277, "grad_max_sv": 2.92706837952137, "grad_min_sv": 3.304632755468228e-08, "grad_condition": 5977960877.86062, "lr": 0.0009990133642141358, "time_sec": 81.63819622993469 }, { "epoch": 4, "train_loss": 7.466654327392578, "train_acc": 0.02596, "test_loss": 4.54970652999878, "test_acc": 0.0152, "lyapunov": 3.026890999825714, "grad_norm": 2.184726348696494, "grad_max_sv": 1.823475405573845, "grad_min_sv": 1.0126577207033096e-08, "grad_condition": 8307876314.683462, "lr": 0.0009982464296247522, "time_sec": 81.63975858688354 }, { "epoch": 5, "train_loss": 7.35825664352417, "train_acc": 0.0249, "test_loss": 4.575929130554199, "test_acc": 0.013, "lyapunov": 2.9873962725519827, "grad_norm": 1.2137091228137746, "grad_max_sv": 0.961378724873066, "grad_min_sv": 6.631390698336963e-11, "grad_condition": 115707330637.43631, "lr": 0.0009972609476841367, "time_sec": 81.71280694007874 }, { "epoch": 6, "train_loss": 7.152584227600098, "train_acc": 0.02408, "test_loss": 4.546905226135254, "test_acc": 0.0165, "lyapunov": 2.8627321110357102, "grad_norm": 0.7830228200215259, "grad_max_sv": 0.4966236546635628, "grad_min_sv": 8.468786915770583e-12, "grad_condition": 112190115201.81938, "lr": 0.000996057350657239, "time_sec": 81.67318558692932 }, { "epoch": 7, "train_loss": 6.736108720703125, "train_acc": 0.02286, "test_loss": 4.6234777084350585, "test_acc": 0.01, "lyapunov": 2.6260088990106607, "grad_norm": 0.503721920030939, "grad_max_sv": 0.28278580904006956, "grad_min_sv": 1.9822557287658092e-12, "grad_condition": 125105415477.25314, "lr": 0.000994636166481494, "time_sec": 81.64523100852966 }, { "epoch": 8, "train_loss": 6.564093143463134, "train_acc": 0.02234, "test_loss": 4.611732032775879, "test_acc": 0.01, "lyapunov": 2.514471580915134, "grad_norm": 0.6828735354454265, "grad_max_sv": 0.2100991995772347, "grad_min_sv": 6.476987908912428e-13, "grad_condition": 143664013250.37378, "lr": 0.0009929980185352525, "time_sec": 81.63371157646179 }, { "epoch": 9, "train_loss": 6.828797580261231, "train_acc": 0.01912, "test_loss": 4.606410037231445, "test_acc": 0.01, "lyapunov": 2.654179959041078, "grad_norm": 1.0698865873419308, "grad_max_sv": 0.16152255814522504, "grad_min_sv": 1.6541991394265796e-13, "grad_condition": 140818730869.57614, "lr": 0.0009911436253643444, "time_sec": 81.60695457458496 }, { "epoch": 10, "train_loss": 6.993563550720215, "train_acc": 0.01038, "test_loss": 4.6257774490356445, "test_acc": 0.01, "lyapunov": 2.7042983194141437, "grad_norm": 0.6205939496010421, "grad_max_sv": 0.10736188860610127, "grad_min_sv": 7.417080745085988e-16, "grad_condition": 107239971660.70801, "lr": 0.0009890738003669028, "time_sec": 81.59540891647339 }, { "epoch": 11, "train_loss": 6.5890699209594725, "train_acc": 0.01018, "test_loss": 4.605637271881103, "test_acc": 0.01, "lyapunov": 2.468636756053056, "grad_norm": 0.39837773763043477, "grad_max_sv": 0.06119964215904474, "grad_min_sv": 3.8185383152851266e-45, "grad_condition": 61199642159.044754, "lr": 0.00098678945143658, "time_sec": 81.5604145526886 }, { "epoch": 12, "train_loss": 6.5774819650268554, "train_acc": 0.01, "test_loss": 4.605390992736816, "test_acc": 0.01, "lyapunov": 2.4586855413968607, "grad_norm": 0.7705617527781408, "grad_max_sv": 0.00864509902894497, "grad_min_sv": 0.0, "grad_condition": 8645099028.94497, "lr": 0.0009842915805643154, "time_sec": 81.49474096298218 }, { "epoch": 13, "train_loss": 6.546455008239746, "train_acc": 0.01002, "test_loss": 4.605277996826172, "test_acc": 0.01, "lyapunov": 2.435590844020209, "grad_norm": 0.5128829478227843, "grad_max_sv": 0.004509441927075386, "grad_min_sv": 0.0, "grad_condition": 4509441927.075386, "lr": 0.000981581283398829, "time_sec": 81.4997489452362 }, { "epoch": 14, "train_loss": 6.575126316833496, "train_acc": 0.00944, "test_loss": 4.605232641601562, "test_acc": 0.01, "lyapunov": 2.451746358895851, "grad_norm": 0.5181440557950673, "grad_max_sv": 0.013719148561358451, "grad_min_sv": 0.0, "grad_condition": 13719148561.358452, "lr": 0.0009786597487660333, "time_sec": 81.5125732421875 }, { "epoch": 15, "train_loss": 6.587129125061035, "train_acc": 0.0092, "test_loss": 4.605205821228028, "test_acc": 0.01, "lyapunov": 2.453917900314721, "grad_norm": 0.6398426435720163, "grad_max_sv": 0.0049395252019166945, "grad_min_sv": 0.0, "grad_condition": 4939525201.916695, "lr": 0.0009755282581475766, "time_sec": 81.50915098190308 }, { "epoch": 16, "train_loss": 6.420363327789307, "train_acc": 0.00962, "test_loss": 4.605900651550293, "test_acc": 0.01, "lyapunov": 2.3524727979889306, "grad_norm": 0.5507826914381541, "grad_max_sv": 0.06663376707583665, "grad_min_sv": 0.0, "grad_condition": 66633767075.836655, "lr": 0.0009721881851187403, "time_sec": 81.59744453430176 }, { "epoch": 17, "train_loss": 6.291905773010254, "train_acc": 0.00924, "test_loss": 4.605198278045655, "test_acc": 0.01, "lyapunov": 2.2705817686017515, "grad_norm": 0.20954429598020885, "grad_max_sv": 0.007087096758186817, "grad_min_sv": 0.0, "grad_condition": 7087096758.186816, "lr": 0.0009686409947459456, "time_sec": 81.51701307296753 }, { "epoch": 18, "train_loss": 6.280198426513672, "train_acc": 0.00956, "test_loss": 4.605187928009033, "test_acc": 0.01, "lyapunov": 2.262371898612098, "grad_norm": 0.15673318486817656, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009648882429441254, "time_sec": 81.49850106239319 }, { "epoch": 19, "train_loss": 6.319409269714355, "train_acc": 0.00894, "test_loss": 4.605180485534668, "test_acc": 0.01, "lyapunov": 2.2773679802789712, "grad_norm": 0.18004037135900994, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00096093157579425, "time_sec": 81.52363634109497 }, { "epoch": 20, "train_loss": 6.279429423370361, "train_acc": 0.0089, "test_loss": 4.605177160644531, "test_acc": 0.01, "lyapunov": 2.261986050764313, "grad_norm": 0.10793581510968044, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009567727288213001, "time_sec": 81.49810361862183 }, { "epoch": 21, "train_loss": 6.277427138519287, "train_acc": 0.00862, "test_loss": 4.605176016998291, "test_acc": 0.01, "lyapunov": 2.2604778922732223, "grad_norm": 0.1164667413797286, "grad_max_sv": 0.005474003031849861, "grad_min_sv": 0.0, "grad_condition": 5474003031.849861, "lr": 0.0009524135262330095, "time_sec": 81.49689865112305 }, { "epoch": 22, "train_loss": 6.275057526855469, "train_acc": 0.0092, "test_loss": 4.605175686645508, "test_acc": 0.01, "lyapunov": 2.258924939748271, "grad_norm": 0.11032559480193316, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009478558801197061, "time_sec": 81.49366521835327 }, { "epoch": 23, "train_loss": 6.280477966156006, "train_acc": 0.00834, "test_loss": 4.60517352142334, "test_acc": 0.01, "lyapunov": 2.262287087452686, "grad_norm": 0.11733428454185782, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000943101789615607, "time_sec": 81.4926176071167 }, { "epoch": 24, "train_loss": 6.27477842300415, "train_acc": 0.00888, "test_loss": 4.6051733123779295, "test_acc": 0.01, "lyapunov": 2.2587200552606217, "grad_norm": 0.09563398461056706, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009381533400219313, "time_sec": 81.48560309410095 }, { "epoch": 25, "train_loss": 6.275597013549804, "train_acc": 0.00864, "test_loss": 4.605174243927002, "test_acc": 0.01, "lyapunov": 2.259342540560476, "grad_norm": 0.10626239815682126, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009330127018922189, "time_sec": 81.50195908546448 }, { "epoch": 26, "train_loss": 6.307570930175781, "train_acc": 0.00846, "test_loss": 4.6051738105773925, "test_acc": 0.01, "lyapunov": 2.2765520228754226, "grad_norm": 0.15671024580485657, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000927682130080253, "time_sec": 81.48380661010742 }, { "epoch": 27, "train_loss": 6.3007610939025875, "train_acc": 0.00916, "test_loss": 4.605174212646484, "test_acc": 0.01, "lyapunov": 2.2724761200682893, "grad_norm": 0.15438417468612603, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009221639627510072, "time_sec": 81.49885392189026 }, { "epoch": 28, "train_loss": 6.279321163024902, "train_acc": 0.0084, "test_loss": 4.605173818206787, "test_acc": 0.01, "lyapunov": 2.261768304478482, "grad_norm": 0.12913751626297293, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009164606203550494, "time_sec": 81.51960349082947 }, { "epoch": 29, "train_loss": 6.296547222290039, "train_acc": 0.00844, "test_loss": 4.605173532104492, "test_acc": 0.01, "lyapunov": 2.269540443444801, "grad_norm": 0.1257561792074065, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009105746045668516, "time_sec": 81.48529624938965 }, { "epoch": 30, "train_loss": 6.301725520019532, "train_acc": 0.00894, "test_loss": 4.605173407745362, "test_acc": 0.01, "lyapunov": 2.2715838626217657, "grad_norm": 0.14077235565425347, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009045084971874733, "time_sec": 81.47704434394836 }, { "epoch": 31, "train_loss": 6.279767997894287, "train_acc": 0.0086, "test_loss": 4.6051743087768555, "test_acc": 0.01, "lyapunov": 2.261623111222406, "grad_norm": 0.11414807727359211, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008982649590120977, "time_sec": 81.51038384437561 }, { "epoch": 32, "train_loss": 6.314449734039306, "train_acc": 0.0091, "test_loss": 4.605173248291016, "test_acc": 0.01, "lyapunov": 2.27814206686776, "grad_norm": 0.15985043411867914, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008918467286629196, "time_sec": 81.49317169189453 }, { "epoch": 33, "train_loss": 6.281702154998779, "train_acc": 0.0086, "test_loss": 4.605174011993408, "test_acc": 0.01, "lyapunov": 2.262753884810621, "grad_norm": 0.12070866490334974, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008852566213878943, "time_sec": 81.49454641342163 }, { "epoch": 34, "train_loss": 6.2773644987487796, "train_acc": 0.00906, "test_loss": 4.605173474121094, "test_acc": 0.01, "lyapunov": 2.260565836411303, "grad_norm": 0.11129476697402911, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000878497527825878, "time_sec": 81.58190107345581 }, { "epoch": 35, "train_loss": 6.309268474578857, "train_acc": 0.00864, "test_loss": 4.605172872161865, "test_acc": 0.01, "lyapunov": 2.277102802110755, "grad_norm": 0.17254724942107424, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000871572412738697, "time_sec": 81.51573705673218 }, { "epoch": 36, "train_loss": 6.2885913528442385, "train_acc": 0.00894, "test_loss": 4.605173197937011, "test_acc": 0.01, "lyapunov": 2.2663694641474263, "grad_norm": 0.12446302100514797, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107055, "time_sec": 81.4983901977539 }, { "epoch": 37, "train_loss": 6.314083187561035, "train_acc": 0.00826, "test_loss": 4.605172673034668, "test_acc": 0.01, "lyapunov": 2.2792197420164144, "grad_norm": 0.19167369428125208, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008572363398164014, "time_sec": 81.4910204410553 }, { "epoch": 38, "train_loss": 6.276701861419678, "train_acc": 0.00804, "test_loss": 4.605172772979737, "test_acc": 0.01, "lyapunov": 2.260084454055942, "grad_norm": 0.10142640032392508, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008498316702566826, "time_sec": 81.49372029304504 }, { "epoch": 39, "train_loss": 6.2982295426940915, "train_acc": 0.00834, "test_loss": 4.605172825622558, "test_acc": 0.01, "lyapunov": 2.271109230378095, "grad_norm": 0.13881594105822967, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008422735529643442, "time_sec": 81.50897860527039 }, { "epoch": 40, "train_loss": 6.282011164550782, "train_acc": 0.00864, "test_loss": 4.607664538574219, "test_acc": 0.01, "lyapunov": 2.263592470637368, "grad_norm": 0.1022934137238382, "grad_max_sv": 0.006253971112892031, "grad_min_sv": 0.0, "grad_condition": 6253971112.892032, "lr": 0.0008345653031794289, "time_sec": 81.51133847236633 }, { "epoch": 41, "train_loss": 6.283648276977539, "train_acc": 0.00898, "test_loss": 4.615698904418945, "test_acc": 0.01, "lyapunov": 2.2645610153217755, "grad_norm": 0.12524739066407903, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008267103019950526, "time_sec": 81.50317192077637 }, { "epoch": 42, "train_loss": 6.291501354827881, "train_acc": 0.00914, "test_loss": 4.605554750061035, "test_acc": 0.01, "lyapunov": 2.267925240499589, "grad_norm": 0.1307307918214705, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743447, "time_sec": 81.48968553543091 }, { "epoch": 43, "train_loss": 6.276330156860352, "train_acc": 0.00896, "test_loss": 4.605246144104004, "test_acc": 0.01, "lyapunov": 2.2598801464071054, "grad_norm": 0.0933943349122675, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000810573890139155, "time_sec": 81.50180649757385 }, { "epoch": 44, "train_loss": 6.2769957354736325, "train_acc": 0.00898, "test_loss": 4.60537618560791, "test_acc": 0.01, "lyapunov": 2.26023776756833, "grad_norm": 0.10724706931673801, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008022995574311873, "time_sec": 81.48934960365295 }, { "epoch": 45, "train_loss": 6.27975429473877, "train_acc": 0.0095, "test_loss": 4.605248934936523, "test_acc": 0.01, "lyapunov": 2.2623073298607945, "grad_norm": 0.095192742319822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462363, "time_sec": 81.50000143051147 }, { "epoch": 46, "train_loss": 6.297380412445069, "train_acc": 0.00876, "test_loss": 4.6052475326538085, "test_acc": 0.01, "lyapunov": 2.271654522327511, "grad_norm": 0.1534535578732401, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007853567838422158, "time_sec": 81.47789859771729 }, { "epoch": 47, "train_loss": 6.282922696990966, "train_acc": 0.0092, "test_loss": 4.605248429107666, "test_acc": 0.01, "lyapunov": 2.264536363084603, "grad_norm": 0.10842785613108402, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007766957746216719, "time_sec": 81.48331236839294 }, { "epoch": 48, "train_loss": 6.280480013275146, "train_acc": 0.00806, "test_loss": 4.605249649047852, "test_acc": 0.01, "lyapunov": 2.2628020630468186, "grad_norm": 0.09295297080650741, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894982, "time_sec": 81.48791313171387 }, { "epoch": 49, "train_loss": 6.295236266479492, "train_acc": 0.0081, "test_loss": 4.605244645690918, "test_acc": 0.01, "lyapunov": 2.270114410868691, "grad_norm": 0.14920321268372522, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000759013504686565, "time_sec": 81.49582886695862 }, { "epoch": 50, "train_loss": 6.315434308013916, "train_acc": 0.00828, "test_loss": 4.605247691345215, "test_acc": 0.01, "lyapunov": 2.2807927832883945, "grad_norm": 0.17847170404488147, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007499999999999998, "time_sec": 81.49979019165039 }, { "epoch": 51, "train_loss": 6.302057292938232, "train_acc": 0.009, "test_loss": 4.605251131439209, "test_acc": 0.01, "lyapunov": 2.2735387291139957, "grad_norm": 0.1418090218860237, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508575, "time_sec": 81.49881410598755 }, { "epoch": 52, "train_loss": 6.278756464233399, "train_acc": 0.00866, "test_loss": 4.605250935363769, "test_acc": 0.01, "lyapunov": 2.2616379620778897, "grad_norm": 0.09283264461248593, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007316480175599307, "time_sec": 81.49807143211365 }, { "epoch": 53, "train_loss": 6.276537058105469, "train_acc": 0.00894, "test_loss": 4.605252996826172, "test_acc": 0.01, "lyapunov": 2.2600054393339035, "grad_norm": 0.09889008649312356, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007223175895924635, "time_sec": 81.50720810890198 }, { "epoch": 54, "train_loss": 6.2842115702819825, "train_acc": 0.0088, "test_loss": 4.60517135925293, "test_acc": 0.01, "lyapunov": 2.2653747550057024, "grad_norm": 0.1176830015085984, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 81.49119186401367 }, { "epoch": 55, "train_loss": 6.280401730041504, "train_acc": 0.00886, "test_loss": 4.605172096252441, "test_acc": 0.01, "lyapunov": 2.262633579771232, "grad_norm": 0.10354075360180534, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007033683215378998, "time_sec": 81.49315738677979 }, { "epoch": 56, "train_loss": 6.316937896728516, "train_acc": 0.00866, "test_loss": 4.605172169494629, "test_acc": 0.01, "lyapunov": 2.2807149234635142, "grad_norm": 0.15351000119410838, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 81.5045874118805 }, { "epoch": 57, "train_loss": 6.296867928161621, "train_acc": 0.00924, "test_loss": 4.605172319030761, "test_acc": 0.01, "lyapunov": 2.272276422861592, "grad_norm": 0.14439465021569048, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423388, "time_sec": 81.49606895446777 }, { "epoch": 58, "train_loss": 6.277121980133057, "train_acc": 0.00822, "test_loss": 4.605172018432617, "test_acc": 0.01, "lyapunov": 2.26043635926893, "grad_norm": 0.09147768117276701, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006742860236609073, "time_sec": 81.49943733215332 }, { "epoch": 59, "train_loss": 6.2761470947265625, "train_acc": 0.00864, "test_loss": 4.605172242736816, "test_acc": 0.01, "lyapunov": 2.2597581962185442, "grad_norm": 0.0885807415167131, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006644333233692913, "time_sec": 81.49118137359619 }, { "epoch": 60, "train_loss": 6.297447052307129, "train_acc": 0.00916, "test_loss": 4.605172019195557, "test_acc": 0.01, "lyapunov": 2.2733187815722298, "grad_norm": 0.15437497590627458, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874734, "time_sec": 81.49486422538757 }, { "epoch": 61, "train_loss": 6.3111451325988766, "train_acc": 0.00872, "test_loss": 4.605171881103516, "test_acc": 0.01, "lyapunov": 2.279795357638308, "grad_norm": 0.1590526758324701, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006445158984722354, "time_sec": 81.56430292129517 }, { "epoch": 62, "train_loss": 6.295817751617432, "train_acc": 0.00874, "test_loss": 4.605171612548828, "test_acc": 0.01, "lyapunov": 2.271848827981583, "grad_norm": 0.1613023358766049, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 81.48160147666931 }, { "epoch": 63, "train_loss": 6.307024629974365, "train_acc": 0.0085, "test_loss": 4.605171653747559, "test_acc": 0.01, "lyapunov": 2.2748339487158735, "grad_norm": 0.13676348001909264, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 81.48560905456543 }, { "epoch": 64, "train_loss": 6.277896643218994, "train_acc": 0.00846, "test_loss": 4.605171467590332, "test_acc": 0.01, "lyapunov": 2.261008509589583, "grad_norm": 0.09063727687835958, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 81.4799861907959 }, { "epoch": 65, "train_loss": 6.285225621643066, "train_acc": 0.00848, "test_loss": 4.605171078491211, "test_acc": 0.01, "lyapunov": 2.2658682217073562, "grad_norm": 0.10317682067163818, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006039558454088793, "time_sec": 81.51162958145142 }, { "epoch": 66, "train_loss": 6.280715701446534, "train_acc": 0.00842, "test_loss": 4.605171147918701, "test_acc": 0.01, "lyapunov": 2.2628414155272267, "grad_norm": 0.09673219941672938, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 81.47932028770447 }, { "epoch": 67, "train_loss": 6.277698368530274, "train_acc": 0.00856, "test_loss": 4.6051715675354, "test_acc": 0.01, "lyapunov": 2.26088782466586, "grad_norm": 0.09056972140208994, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 81.48698115348816 }, { "epoch": 68, "train_loss": 6.30627403137207, "train_acc": 0.00826, "test_loss": 4.605171142578125, "test_acc": 0.01, "lyapunov": 2.2745680943169555, "grad_norm": 0.13148861913625765, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005730415142812054, "time_sec": 81.49131727218628 }, { "epoch": 69, "train_loss": 6.280330782623291, "train_acc": 0.00892, "test_loss": 4.605170972442627, "test_acc": 0.01, "lyapunov": 2.2627177104315797, "grad_norm": 0.1124362788188755, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 83.16999244689941 }, { "epoch": 70, "train_loss": 6.28732081451416, "train_acc": 0.00818, "test_loss": 4.605170994567871, "test_acc": 0.01, "lyapunov": 2.2672290460532887, "grad_norm": 0.10634119980305662, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005522642316338265, "time_sec": 81.48939347267151 }, { "epoch": 71, "train_loss": 6.279782330627442, "train_acc": 0.00912, "test_loss": 4.605171276855469, "test_acc": 0.01, "lyapunov": 2.262383164652168, "grad_norm": 0.10626668013646236, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005418389216661573, "time_sec": 81.48840260505676 }, { "epoch": 72, "train_loss": 6.295553107910156, "train_acc": 0.00816, "test_loss": 4.605171234130859, "test_acc": 0.01, "lyapunov": 2.2699396323669903, "grad_norm": 0.10087516213292237, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646563, "time_sec": 81.66768407821655 }, { "epoch": 73, "train_loss": 6.279174601287842, "train_acc": 0.00854, "test_loss": 4.605171266174317, "test_acc": 0.01, "lyapunov": 2.261961253402788, "grad_norm": 0.09224354382614662, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005209378268645994, "time_sec": 81.47679734230042 }, { "epoch": 74, "train_loss": 6.282529046783448, "train_acc": 0.00878, "test_loss": 4.605171199035644, "test_acc": 0.01, "lyapunov": 2.263870295966068, "grad_norm": 0.09731782277810722, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005104712099416781, "time_sec": 81.49993348121643 }, { "epoch": 75, "train_loss": 6.277901949768067, "train_acc": 0.0089, "test_loss": 4.605170727539062, "test_acc": 0.01, "lyapunov": 2.261039003996593, "grad_norm": 0.09211112509965803, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 81.50083065032959 }, { "epoch": 76, "train_loss": 6.340216960601807, "train_acc": 0.00838, "test_loss": 4.605170699310302, "test_acc": 0.01, "lyapunov": 2.2909446268740212, "grad_norm": 0.23685392065021807, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 81.50020790100098 }, { "epoch": 77, "train_loss": 6.312104174957275, "train_acc": 0.00864, "test_loss": 4.605171252441406, "test_acc": 0.01, "lyapunov": 2.2805933543788197, "grad_norm": 0.18831482170422406, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004790621731353997, "time_sec": 81.49737644195557 }, { "epoch": 78, "train_loss": 6.2789193016052245, "train_acc": 0.00852, "test_loss": 4.605171314239502, "test_acc": 0.01, "lyapunov": 2.261766994090946, "grad_norm": 0.0924358449039435, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 81.48207116127014 }, { "epoch": 79, "train_loss": 6.278578204803467, "train_acc": 0.00926, "test_loss": 4.6051709121704105, "test_acc": 0.01, "lyapunov": 2.2615611260504367, "grad_norm": 0.106081439799758, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 81.5153739452362 }, { "epoch": 80, "train_loss": 6.280757647094727, "train_acc": 0.00926, "test_loss": 4.605170848083496, "test_acc": 0.01, "lyapunov": 2.2630625789427694, "grad_norm": 0.09000806752766331, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 81.48912286758423 }, { "epoch": 81, "train_loss": 6.281069091949463, "train_acc": 0.00898, "test_loss": 4.605170893859864, "test_acc": 0.01, "lyapunov": 2.263333380984528, "grad_norm": 0.09221512328536063, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 81.5581386089325 }, { "epoch": 82, "train_loss": 6.27887787902832, "train_acc": 0.0087, "test_loss": 4.605170852661133, "test_acc": 0.01, "lyapunov": 2.261768191671737, "grad_norm": 0.09223604647823178, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004269584857187939, "time_sec": 81.48868751525879 }, { "epoch": 83, "train_loss": 6.283419313049317, "train_acc": 0.00842, "test_loss": 4.605170945739746, "test_acc": 0.01, "lyapunov": 2.2647099933965738, "grad_norm": 0.11489596444213686, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004166156266419484, "time_sec": 81.48753881454468 }, { "epoch": 84, "train_loss": 6.331098417663574, "train_acc": 0.00886, "test_loss": 4.605170746612549, "test_acc": 0.01, "lyapunov": 2.288768025005565, "grad_norm": 0.21523480615204088, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 81.49917888641357 }, { "epoch": 85, "train_loss": 6.279946563415527, "train_acc": 0.00858, "test_loss": 4.605170806884765, "test_acc": 0.01, "lyapunov": 2.262576125162032, "grad_norm": 0.09063877969543369, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003960441545911199, "time_sec": 81.49754786491394 }, { "epoch": 86, "train_loss": 6.294878379211426, "train_acc": 0.0082, "test_loss": 4.605170738983154, "test_acc": 0.01, "lyapunov": 2.270076130967006, "grad_norm": 0.11269347737073286, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 81.49726057052612 }, { "epoch": 87, "train_loss": 6.2920974577331545, "train_acc": 0.009, "test_loss": 4.6051703125, "test_acc": 0.01, "lyapunov": 2.2685716097312207, "grad_norm": 0.14345779012680526, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 81.51811003684998 }, { "epoch": 88, "train_loss": 6.280257380981445, "train_acc": 0.00862, "test_loss": 4.605170468139648, "test_acc": 0.01, "lyapunov": 2.262734867422782, "grad_norm": 0.089208601870095, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 81.54773998260498 }, { "epoch": 89, "train_loss": 6.281720874176026, "train_acc": 0.00798, "test_loss": 4.605170385742188, "test_acc": 0.01, "lyapunov": 2.2637228892587333, "grad_norm": 0.13294770236555567, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 81.49507021903992 }, { "epoch": 90, "train_loss": 6.282031690979004, "train_acc": 0.00864, "test_loss": 4.6051704216003415, "test_acc": 0.01, "lyapunov": 2.263972556804452, "grad_norm": 0.09670924579322722, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 81.50043749809265 }, { "epoch": 91, "train_loss": 6.281220606231689, "train_acc": 0.00882, "test_loss": 4.605170685577392, "test_acc": 0.01, "lyapunov": 2.2634493798551047, "grad_norm": 0.08948481670861189, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 81.50585508346558 }, { "epoch": 92, "train_loss": 6.279705551147461, "train_acc": 0.00862, "test_loss": 4.60517056274414, "test_acc": 0.01, "lyapunov": 2.2624147529797174, "grad_norm": 0.09256700006903949, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 81.51557660102844 }, { "epoch": 93, "train_loss": 6.281244622955322, "train_acc": 0.0087, "test_loss": 4.60517061920166, "test_acc": 0.01, "lyapunov": 2.2632562803185503, "grad_norm": 0.11132757286060115, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 81.49661374092102 }, { "epoch": 94, "train_loss": 6.306097177734375, "train_acc": 0.00858, "test_loss": 4.605170388793946, "test_acc": 0.01, "lyapunov": 2.274985415856247, "grad_norm": 0.14003151421649307, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 81.48347187042236 }, { "epoch": 95, "train_loss": 6.283950561676026, "train_acc": 0.00878, "test_loss": 4.605170606994629, "test_acc": 0.01, "lyapunov": 2.264391293001297, "grad_norm": 0.11506545388832123, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 81.5063374042511 }, { "epoch": 96, "train_loss": 6.302323147125244, "train_acc": 0.00874, "test_loss": 4.60517081451416, "test_acc": 0.01, "lyapunov": 2.274367270872111, "grad_norm": 0.12307854636703328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 81.4797682762146 }, { "epoch": 97, "train_loss": 6.281584391479492, "train_acc": 0.00864, "test_loss": 4.605170351409912, "test_acc": 0.01, "lyapunov": 2.2636835014118866, "grad_norm": 0.10251001946667801, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 81.49354839324951 }, { "epoch": 98, "train_loss": 6.2782898904418944, "train_acc": 0.00868, "test_loss": 4.60517045135498, "test_acc": 0.01, "lyapunov": 2.261435853245923, "grad_norm": 0.08854436555507054, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 81.4875979423523 }, { "epoch": 99, "train_loss": 6.295129021606446, "train_acc": 0.0082, "test_loss": 4.605170526123047, "test_acc": 0.01, "lyapunov": 2.2712618536351585, "grad_norm": 0.11715866448048785, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 81.48900055885315 }, { "epoch": 100, "train_loss": 6.278292948303223, "train_acc": 0.00866, "test_loss": 4.605170332336426, "test_acc": 0.01, "lyapunov": 2.2613569385255388, "grad_norm": 0.09963153634244509, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 81.49986267089844 }, { "epoch": 101, "train_loss": 6.278483645935059, "train_acc": 0.00804, "test_loss": 4.60517053604126, "test_acc": 0.01, "lyapunov": 2.261537701272599, "grad_norm": 0.08871006809333543, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 81.51374125480652 }, { "epoch": 102, "train_loss": 6.280324393310547, "train_acc": 0.00806, "test_loss": 4.605170599365234, "test_acc": 0.01, "lyapunov": 2.262814277883076, "grad_norm": 0.08821870247597413, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 81.50025415420532 }, { "epoch": 103, "train_loss": 6.2799532815551755, "train_acc": 0.00876, "test_loss": 4.605170227050781, "test_acc": 0.01, "lyapunov": 2.2625574236330777, "grad_norm": 0.08935081241113577, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 81.50659584999084 }, { "epoch": 104, "train_loss": 6.298912643432617, "train_acc": 0.00842, "test_loss": 4.60517052154541, "test_acc": 0.01, "lyapunov": 2.2703244808079948, "grad_norm": 0.11414965346863236, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 81.5045850276947 }, { "epoch": 105, "train_loss": 6.290122275390625, "train_acc": 0.0086, "test_loss": 4.605170248413086, "test_acc": 0.01, "lyapunov": 2.268586759981902, "grad_norm": 0.09478727747372748, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 81.49806952476501 }, { "epoch": 106, "train_loss": 6.29548063659668, "train_acc": 0.00866, "test_loss": 4.605170534515381, "test_acc": 0.01, "lyapunov": 2.2701295159966746, "grad_norm": 0.11489602174527157, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 81.48596048355103 }, { "epoch": 107, "train_loss": 6.282184426269532, "train_acc": 0.0082, "test_loss": 4.605170352172852, "test_acc": 0.01, "lyapunov": 2.2641438352482397, "grad_norm": 0.08961045804319463, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 81.49523115158081 }, { "epoch": 108, "train_loss": 6.2777880932617185, "train_acc": 0.00864, "test_loss": 4.605170249938965, "test_acc": 0.01, "lyapunov": 2.2611292018305007, "grad_norm": 0.08837496982685777, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 81.5235505104065 }, { "epoch": 109, "train_loss": 6.279533188171387, "train_acc": 0.00846, "test_loss": 4.6051705436706545, "test_acc": 0.01, "lyapunov": 2.2622785964585326, "grad_norm": 0.09025198956904176, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 81.49149775505066 }, { "epoch": 110, "train_loss": 6.281950114135742, "train_acc": 0.00808, "test_loss": 4.605170324707031, "test_acc": 0.01, "lyapunov": 2.2638927835332767, "grad_norm": 0.09569022356709349, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 81.48516082763672 }, { "epoch": 111, "train_loss": 6.28185485534668, "train_acc": 0.00926, "test_loss": 4.6051703125, "test_acc": 0.01, "lyapunov": 2.2638340045119185, "grad_norm": 0.08892162931996153, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 81.49398422241211 }, { "epoch": 112, "train_loss": 6.310760371704101, "train_acc": 0.0083, "test_loss": 4.605170272064209, "test_acc": 0.01, "lyapunov": 2.2783618381870983, "grad_norm": 0.14829000342501422, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 81.47959303855896 }, { "epoch": 113, "train_loss": 6.280448321685791, "train_acc": 0.00868, "test_loss": 4.605170561218261, "test_acc": 0.01, "lyapunov": 2.262940209235072, "grad_norm": 0.08905882191321668, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 81.49572110176086 }, { "epoch": 114, "train_loss": 6.29521280166626, "train_acc": 0.00898, "test_loss": 4.6051701675415035, "test_acc": 0.01, "lyapunov": 2.2707663734855554, "grad_norm": 0.10226349996651533, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 81.48670983314514 }, { "epoch": 115, "train_loss": 6.2799824197387695, "train_acc": 0.00898, "test_loss": 4.605170332336426, "test_acc": 0.01, "lyapunov": 2.2626387176611233, "grad_norm": 0.08828544817683198, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 81.48745203018188 }, { "epoch": 116, "train_loss": 6.2778549322509765, "train_acc": 0.00826, "test_loss": 4.6051702964782715, "test_acc": 0.01, "lyapunov": 2.26113668122255, "grad_norm": 0.08806272896088922, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 81.54066944122314 }, { "epoch": 117, "train_loss": 6.279518751220703, "train_acc": 0.00934, "test_loss": 4.605170413208008, "test_acc": 0.01, "lyapunov": 2.2623144555884553, "grad_norm": 0.0877771191158831, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 81.48839020729065 }, { "epoch": 118, "train_loss": 6.281088227996826, "train_acc": 0.00902, "test_loss": 4.605170362854004, "test_acc": 0.01, "lyapunov": 2.2633964198324685, "grad_norm": 0.0880896864668632, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 81.50261282920837 }, { "epoch": 119, "train_loss": 6.282254580841064, "train_acc": 0.00884, "test_loss": 4.605170101165771, "test_acc": 0.01, "lyapunov": 2.264233167214162, "grad_norm": 0.08831557648722567, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 81.52568435668945 }, { "epoch": 120, "train_loss": 6.277676391906739, "train_acc": 0.0087, "test_loss": 4.6051705383300785, "test_acc": 0.01, "lyapunov": 2.2610504279661057, "grad_norm": 0.08852764058763012, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 81.50404500961304 }, { "epoch": 121, "train_loss": 6.282078470611572, "train_acc": 0.00904, "test_loss": 4.605170125579834, "test_acc": 0.01, "lyapunov": 2.264081825685623, "grad_norm": 0.08733889209956962, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 81.49174380302429 }, { "epoch": 122, "train_loss": 6.280417911529541, "train_acc": 0.00854, "test_loss": 4.605170150756836, "test_acc": 0.01, "lyapunov": 2.2629349579286697, "grad_norm": 0.08896774607886365, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 81.48855018615723 }, { "epoch": 123, "train_loss": 6.279605996398926, "train_acc": 0.00798, "test_loss": 4.605170092773437, "test_acc": 0.01, "lyapunov": 2.262386467755603, "grad_norm": 0.08795933479592377, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 81.50146007537842 }, { "epoch": 124, "train_loss": 6.291684345397949, "train_acc": 0.00856, "test_loss": 4.6051700492858885, "test_acc": 0.01, "lyapunov": 2.2678240815087047, "grad_norm": 0.11392589044407447, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 81.48491311073303 }, { "epoch": 125, "train_loss": 6.285427192077637, "train_acc": 0.00888, "test_loss": 4.605170321655273, "test_acc": 0.01, "lyapunov": 2.2660442904743086, "grad_norm": 0.1133754054706649, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 81.49100470542908 }, { "epoch": 126, "train_loss": 6.280400201568604, "train_acc": 0.00878, "test_loss": 4.6051705368041995, "test_acc": 0.01, "lyapunov": 2.2629254120390128, "grad_norm": 0.08821452866992016, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 81.49153852462769 }, { "epoch": 127, "train_loss": 6.279529089202881, "train_acc": 0.0088, "test_loss": 4.605170316314697, "test_acc": 0.01, "lyapunov": 2.2623902915993614, "grad_norm": 0.08745608733781365, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 81.50230026245117 }, { "epoch": 128, "train_loss": 6.278408692016601, "train_acc": 0.00888, "test_loss": 4.605170304870605, "test_acc": 0.01, "lyapunov": 2.261508503228502, "grad_norm": 0.08825893270809801, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 81.49138951301575 }, { "epoch": 129, "train_loss": 6.279044237976074, "train_acc": 0.00934, "test_loss": 4.605170484924316, "test_acc": 0.01, "lyapunov": 2.261979506753595, "grad_norm": 0.08762519682827673, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 81.50332951545715 }, { "epoch": 130, "train_loss": 6.2814196604919434, "train_acc": 0.00892, "test_loss": 4.605170237731934, "test_acc": 0.01, "lyapunov": 2.263650309399266, "grad_norm": 0.0879745908721408, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 81.48634791374207 }, { "epoch": 131, "train_loss": 6.279289369659423, "train_acc": 0.00816, "test_loss": 4.605170503234863, "test_acc": 0.01, "lyapunov": 2.2619674528956106, "grad_norm": 0.08830358541425926, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 81.49762201309204 }, { "epoch": 132, "train_loss": 6.284051736145019, "train_acc": 0.00918, "test_loss": 4.605169993591309, "test_acc": 0.01, "lyapunov": 2.265367220734696, "grad_norm": 0.09065551426084856, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 81.5026957988739 }, { "epoch": 133, "train_loss": 6.28203574508667, "train_acc": 0.00886, "test_loss": 4.60517046508789, "test_acc": 0.01, "lyapunov": 2.264016958148888, "grad_norm": 0.08811709248877145, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 81.4884991645813 }, { "epoch": 134, "train_loss": 6.295380000305176, "train_acc": 0.00924, "test_loss": 4.6051701171875, "test_acc": 0.01, "lyapunov": 2.270651138652011, "grad_norm": 0.09385452218544989, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 81.49120998382568 }, { "epoch": 135, "train_loss": 6.279313954925537, "train_acc": 0.0096, "test_loss": 4.605170198059082, "test_acc": 0.01, "lyapunov": 2.2621799277527557, "grad_norm": 0.08809804121534516, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 81.503009557724 }, { "epoch": 136, "train_loss": 6.281174714050293, "train_acc": 0.009, "test_loss": 4.605170434570312, "test_acc": 0.01, "lyapunov": 2.263484787758049, "grad_norm": 0.08787496788421857, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 81.49492454528809 }, { "epoch": 137, "train_loss": 6.2790307751464844, "train_acc": 0.00906, "test_loss": 4.605170115661621, "test_acc": 0.01, "lyapunov": 2.2619833738907524, "grad_norm": 0.08850586212515105, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 81.51062154769897 }, { "epoch": 138, "train_loss": 6.278728715362549, "train_acc": 0.0095, "test_loss": 4.605170520019532, "test_acc": 0.01, "lyapunov": 2.2618095082090335, "grad_norm": 0.08731291361885624, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 81.48903918266296 }, { "epoch": 139, "train_loss": 6.279946011657715, "train_acc": 0.00924, "test_loss": 4.605169985198975, "test_acc": 0.01, "lyapunov": 2.262684661104246, "grad_norm": 0.08830501755378455, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 81.50976133346558 }, { "epoch": 140, "train_loss": 6.2800713043212895, "train_acc": 0.0093, "test_loss": 4.605170336914062, "test_acc": 0.01, "lyapunov": 2.2627302271020993, "grad_norm": 0.08760865122091131, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 81.47953510284424 }, { "epoch": 141, "train_loss": 6.280382924652099, "train_acc": 0.00976, "test_loss": 4.605170390319824, "test_acc": 0.01, "lyapunov": 2.262962554116993, "grad_norm": 0.08731546735423716, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 81.50757503509521 }, { "epoch": 142, "train_loss": 6.280370573883057, "train_acc": 0.00936, "test_loss": 4.605170272064209, "test_acc": 0.01, "lyapunov": 2.262975048226164, "grad_norm": 0.08839664162758272, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 81.70762014389038 }, { "epoch": 143, "train_loss": 6.278507639923096, "train_acc": 0.0095, "test_loss": 4.6051704162597655, "test_acc": 0.01, "lyapunov": 2.261611500054674, "grad_norm": 0.08694971985774991, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 81.48127150535583 }, { "epoch": 144, "train_loss": 6.281042174987793, "train_acc": 0.00942, "test_loss": 4.605170404815674, "test_acc": 0.01, "lyapunov": 2.263450643290644, "grad_norm": 0.0881830241474449, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 81.58690285682678 }, { "epoch": 145, "train_loss": 6.278796115875244, "train_acc": 0.01, "test_loss": 4.605169946289062, "test_acc": 0.01, "lyapunov": 2.2618483887304124, "grad_norm": 0.08774085138052039, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 81.47702813148499 }, { "epoch": 146, "train_loss": 6.28765030166626, "train_acc": 0.01, "test_loss": 4.605170179748535, "test_acc": 0.01, "lyapunov": 2.266257317169853, "grad_norm": 0.0926994360583192, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 81.53279685974121 }, { "epoch": 147, "train_loss": 6.28031106124878, "train_acc": 0.01, "test_loss": 4.605170380401612, "test_acc": 0.01, "lyapunov": 2.2628798844564297, "grad_norm": 0.08793782485118157, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 81.48903107643127 }, { "epoch": 148, "train_loss": 6.280096773681641, "train_acc": 0.01, "test_loss": 4.605170349884033, "test_acc": 0.01, "lyapunov": 2.2627320112779623, "grad_norm": 0.08818349122842602, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 81.4692907333374 }, { "epoch": 149, "train_loss": 6.281090885467529, "train_acc": 0.01, "test_loss": 4.605170343017578, "test_acc": 0.01, "lyapunov": 2.263427186195198, "grad_norm": 0.0872012744277379, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 81.53167700767517 }, { "epoch": 150, "train_loss": 6.279137640380859, "train_acc": 0.01, "test_loss": 4.605170111083984, "test_acc": 0.01, "lyapunov": 2.262077055318886, "grad_norm": 0.08725575780836431, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 81.56354284286499 } ], "12": [ { "epoch": 1, "train_loss": 12.888672213134766, "train_acc": 0.0157, "test_loss": 4.668669903564453, "test_acc": 0.0113, "lyapunov": 4.721897013656928, "grad_norm": 6.113449849588324, "grad_max_sv": 4.916350275278091, "grad_min_sv": 9.121745356832633e-08, "grad_condition": 85604761.14095068, "lr": 0.0009998903417374227, "time_sec": 124.4171769618988 }, { "epoch": 2, "train_loss": 8.873665056762695, "train_acc": 0.0172, "test_loss": 4.618728218078613, "test_acc": 0.0106, "lyapunov": 3.5643789152355145, "grad_norm": 4.270033727895912, "grad_max_sv": 3.703069430589676, "grad_min_sv": 4.972798216271515e-08, "grad_condition": 4407702901.858317, "lr": 0.0009995614150494292, "time_sec": 124.48686790466309 }, { "epoch": 3, "train_loss": 8.600334560241699, "train_acc": 0.01782, "test_loss": 4.650051962280274, "test_acc": 0.01, "lyapunov": 3.4914282776815506, "grad_norm": 3.3926839865294114, "grad_max_sv": 2.9882367312908173, "grad_min_sv": 1.3234509199243523e-08, "grad_condition": 54857460231.037346, "lr": 0.0009990133642141358, "time_sec": 124.54058074951172 }, { "epoch": 4, "train_loss": 8.263027096862793, "train_acc": 0.01714, "test_loss": 4.599512353515625, "test_acc": 0.0105, "lyapunov": 3.3760591937452937, "grad_norm": 2.278902599299841, "grad_max_sv": 1.9339918196201324, "grad_min_sv": 2.3884921456027857e-10, "grad_condition": 107255985296.78781, "lr": 0.0009982464296247522, "time_sec": 124.56976628303528 }, { "epoch": 5, "train_loss": 8.014010938720704, "train_acc": 0.01496, "test_loss": 4.616816136169434, "test_acc": 0.01, "lyapunov": 3.2668096848461023, "grad_norm": 1.8273408452911775, "grad_max_sv": 1.1145809442189922, "grad_min_sv": 1.2368932906215386e-11, "grad_condition": 320257530150.4256, "lr": 0.0009972609476841367, "time_sec": 124.43335103988647 }, { "epoch": 6, "train_loss": 7.492105539398193, "train_acc": 0.01378, "test_loss": 4.617157006835938, "test_acc": 0.01, "lyapunov": 2.993205757702098, "grad_norm": 1.155205925820389, "grad_max_sv": 0.8030500062418355, "grad_min_sv": 1.9935007673619705e-12, "grad_condition": 394942710887.2484, "lr": 0.000996057350657239, "time_sec": 124.40957427024841 }, { "epoch": 7, "train_loss": 7.546499238586426, "train_acc": 0.01474, "test_loss": 4.614982270812988, "test_acc": 0.01, "lyapunov": 3.0089273160071017, "grad_norm": 2.2107120727107343, "grad_max_sv": 0.5263522088527679, "grad_min_sv": 2.339208170494913e-12, "grad_condition": 228093595550.92413, "lr": 0.000994636166481494, "time_sec": 124.44238233566284 }, { "epoch": 8, "train_loss": 7.431590474243164, "train_acc": 0.01458, "test_loss": 4.613349987792969, "test_acc": 0.01, "lyapunov": 2.9677638501462424, "grad_norm": 1.4698803730862553, "grad_max_sv": 0.3683710671344215, "grad_min_sv": 1.0445961128587334e-12, "grad_condition": 222600534264.8287, "lr": 0.0009929980185352525, "time_sec": 124.46612310409546 }, { "epoch": 9, "train_loss": 7.177635037078858, "train_acc": 0.01324, "test_loss": 4.612429743957519, "test_acc": 0.01, "lyapunov": 2.8310226979463, "grad_norm": 1.4861384451742359, "grad_max_sv": 0.32697355831472236, "grad_min_sv": 7.011187907653872e-13, "grad_condition": 236887025983.79956, "lr": 0.0009911436253643444, "time_sec": 124.47700262069702 }, { "epoch": 10, "train_loss": 7.269148045806885, "train_acc": 0.01266, "test_loss": 4.60582406539917, "test_acc": 0.01, "lyapunov": 2.8725382824383123, "grad_norm": 2.342581709783361, "grad_max_sv": 0.25737013639882206, "grad_min_sv": 2.152763686233954e-13, "grad_condition": 237339662745.88754, "lr": 0.0009890738003669028, "time_sec": 124.34593343734741 }, { "epoch": 11, "train_loss": 7.854859015350342, "train_acc": 0.0135, "test_loss": 4.610336604309082, "test_acc": 0.01, "lyapunov": 3.174172605699895, "grad_norm": 2.7187327990789893, "grad_max_sv": 0.20388649497181177, "grad_min_sv": 8.088439153332857e-14, "grad_condition": 191904183934.97748, "lr": 0.00098678945143658, "time_sec": 124.38984727859497 }, { "epoch": 12, "train_loss": 7.352457761230469, "train_acc": 0.01424, "test_loss": 4.6108569480896, "test_acc": 0.01, "lyapunov": 2.9249625279165596, "grad_norm": 1.4927365138413504, "grad_max_sv": 0.19409580584615468, "grad_min_sv": 6.321730296975161e-14, "grad_condition": 185278377907.65347, "lr": 0.0009842915805643154, "time_sec": 124.45291423797607 }, { "epoch": 13, "train_loss": 7.126369653930664, "train_acc": 0.0127, "test_loss": 4.606200820922852, "test_acc": 0.01, "lyapunov": 2.7892982831696416, "grad_norm": 1.5745132805186597, "grad_max_sv": 0.16401691318606026, "grad_min_sv": 1.1404081781040362e-15, "grad_condition": 163820543107.00018, "lr": 0.000981581283398829, "time_sec": 124.47300815582275 }, { "epoch": 14, "train_loss": 6.9970923039245605, "train_acc": 0.0119, "test_loss": 4.606117165374756, "test_acc": 0.01, "lyapunov": 2.7211814384021418, "grad_norm": 0.8580084847133529, "grad_max_sv": 0.13348757792264224, "grad_min_sv": 3.507279862736168e-28, "grad_condition": 133487577922.64218, "lr": 0.0009786597487660333, "time_sec": 124.41379904747009 }, { "epoch": 15, "train_loss": 7.052154786376953, "train_acc": 0.0117, "test_loss": 4.606044427490234, "test_acc": 0.01, "lyapunov": 2.753269191288277, "grad_norm": 1.006394199833171, "grad_max_sv": 0.12816582168452442, "grad_min_sv": 4.518028483603919e-34, "grad_condition": 128165821684.52441, "lr": 0.0009755282581475766, "time_sec": 124.34007215499878 }, { "epoch": 16, "train_loss": 7.258110624084472, "train_acc": 0.0109, "test_loss": 4.605929005432129, "test_acc": 0.01, "lyapunov": 2.862082756998594, "grad_norm": 1.1482559574218805, "grad_max_sv": 0.10950499838218093, "grad_min_sv": 3.564320494794489e-35, "grad_condition": 109504998382.18094, "lr": 0.0009721881851187403, "time_sec": 124.38707971572876 }, { "epoch": 17, "train_loss": 6.873683618774414, "train_acc": 0.00996, "test_loss": 4.61062957611084, "test_acc": 0.01, "lyapunov": 2.641120981377409, "grad_norm": 2.0808485430057084, "grad_max_sv": 0.05978809341322631, "grad_min_sv": 2.4522723125684297e-46, "grad_condition": 59788093413.2263, "lr": 0.0009686409947459456, "time_sec": 124.47280597686768 }, { "epoch": 18, "train_loss": 7.016553334655762, "train_acc": 0.01398, "test_loss": 4.622579546356201, "test_acc": 0.01, "lyapunov": 2.728775659180663, "grad_norm": 1.2800257190104987, "grad_max_sv": 0.1043331983499229, "grad_min_sv": 3.1060564013215523e-18, "grad_condition": 104332858891.6054, "lr": 0.0009648882429441254, "time_sec": 124.54543328285217 }, { "epoch": 19, "train_loss": 6.869653914642334, "train_acc": 0.01194, "test_loss": 4.643599758911133, "test_acc": 0.01, "lyapunov": 2.638523844501856, "grad_norm": 0.5641956497166879, "grad_max_sv": 0.06742433752388025, "grad_min_sv": 9.779701625669289e-16, "grad_condition": 67360221904.04246, "lr": 0.00096093157579425, "time_sec": 124.44028401374817 }, { "epoch": 20, "train_loss": 6.866667858276367, "train_acc": 0.0096, "test_loss": 4.634420860290527, "test_acc": 0.01, "lyapunov": 2.628649781731998, "grad_norm": 0.5455051217507713, "grad_max_sv": 0.028104651859030126, "grad_min_sv": 0.0, "grad_condition": 28104651859.03013, "lr": 0.0009567727288213001, "time_sec": 124.34887290000916 }, { "epoch": 21, "train_loss": 6.825957579650879, "train_acc": 0.00936, "test_loss": 4.642799243164062, "test_acc": 0.01, "lyapunov": 2.607143042337559, "grad_norm": 0.5228902482624009, "grad_max_sv": 0.029772339016199113, "grad_min_sv": 0.0, "grad_condition": 29772339016.19911, "lr": 0.0009524135262330095, "time_sec": 124.38223886489868 }, { "epoch": 22, "train_loss": 6.60694779296875, "train_acc": 0.00934, "test_loss": 4.642452531433105, "test_acc": 0.01, "lyapunov": 2.4819612728665246, "grad_norm": 0.5929983668433683, "grad_max_sv": 0.028571362840011716, "grad_min_sv": 0.0, "grad_condition": 28571362840.01172, "lr": 0.0009478558801197061, "time_sec": 124.46409487724304 }, { "epoch": 23, "train_loss": 6.587394898986816, "train_acc": 0.00922, "test_loss": 4.642014373779297, "test_acc": 0.01, "lyapunov": 2.46996273287117, "grad_norm": 0.5937371167405978, "grad_max_sv": 0.027252211095765234, "grad_min_sv": 0.0, "grad_condition": 27252211095.765236, "lr": 0.000943101789615607, "time_sec": 124.41273093223572 }, { "epoch": 24, "train_loss": 6.5855675335693356, "train_acc": 0.00944, "test_loss": 4.629414208984375, "test_acc": 0.01, "lyapunov": 2.468693129546807, "grad_norm": 0.5173238649422355, "grad_max_sv": 0.026766624441370367, "grad_min_sv": 0.0, "grad_condition": 26766624441.37037, "lr": 0.0009381533400219313, "time_sec": 124.34699821472168 }, { "epoch": 25, "train_loss": 6.599731462860108, "train_acc": 0.00936, "test_loss": 4.6412096755981445, "test_acc": 0.01, "lyapunov": 2.476690198454406, "grad_norm": 0.5699426578758121, "grad_max_sv": 0.025352103635668755, "grad_min_sv": 0.0, "grad_condition": 25352103635.668755, "lr": 0.0009330127018922189, "time_sec": 124.3536787033081 }, { "epoch": 26, "train_loss": 6.5942790597534175, "train_acc": 0.00964, "test_loss": 4.640745770263672, "test_acc": 0.01, "lyapunov": 2.4741494673902116, "grad_norm": 0.546145353806512, "grad_max_sv": 0.021123076300136746, "grad_min_sv": 0.0, "grad_condition": 21123076300.136745, "lr": 0.000927682130080253, "time_sec": 124.4051742553711 }, { "epoch": 27, "train_loss": 6.6229908557128905, "train_acc": 0.00888, "test_loss": 4.605336713409423, "test_acc": 0.01, "lyapunov": 2.4850437781390022, "grad_norm": 0.6663677646075784, "grad_max_sv": 0.011104274867102503, "grad_min_sv": 0.0, "grad_condition": 11104274867.102505, "lr": 0.0009221639627510072, "time_sec": 124.44045972824097 }, { "epoch": 28, "train_loss": 6.597202638854981, "train_acc": 0.00916, "test_loss": 4.605269973754883, "test_acc": 0.01, "lyapunov": 2.4748127710483874, "grad_norm": 0.6602347286377247, "grad_max_sv": 0.005200258875265718, "grad_min_sv": 0.0, "grad_condition": 5200258875.2657175, "lr": 0.0009164606203550494, "time_sec": 124.41216611862183 }, { "epoch": 29, "train_loss": 6.5781180551147465, "train_acc": 0.00896, "test_loss": 4.605207743072509, "test_acc": 0.01, "lyapunov": 2.463899161809546, "grad_norm": 0.16963115020621336, "grad_max_sv": 0.0064356182236224415, "grad_min_sv": 0.0, "grad_condition": 6435618223.622441, "lr": 0.0009105746045668516, "time_sec": 124.52706933021545 }, { "epoch": 30, "train_loss": 6.580226347045898, "train_acc": 0.00922, "test_loss": 4.605211033630371, "test_acc": 0.01, "lyapunov": 2.4648621435970295, "grad_norm": 0.14897426222581245, "grad_max_sv": 0.006681703682988882, "grad_min_sv": 0.0, "grad_condition": 6681703682.988882, "lr": 0.0009045084971874733, "time_sec": 124.31314778327942 }, { "epoch": 31, "train_loss": 6.580346279144287, "train_acc": 0.00906, "test_loss": 4.605202531433106, "test_acc": 0.01, "lyapunov": 2.4647859356287496, "grad_norm": 0.13651802704858546, "grad_max_sv": 0.0033354544546455147, "grad_min_sv": 0.0, "grad_condition": 3335454454.6455145, "lr": 0.0008982649590120977, "time_sec": 124.37081241607666 }, { "epoch": 32, "train_loss": 6.5977811730957034, "train_acc": 0.00854, "test_loss": 4.605187432861328, "test_acc": 0.01, "lyapunov": 2.4727761562523023, "grad_norm": 0.12974748253445384, "grad_max_sv": 0.002326939906924963, "grad_min_sv": 0.0, "grad_condition": 2326939906.924963, "lr": 0.0008918467286629196, "time_sec": 124.42768621444702 }, { "epoch": 33, "train_loss": 6.574522008514404, "train_acc": 0.00888, "test_loss": 4.60518201751709, "test_acc": 0.01, "lyapunov": 2.461720284903446, "grad_norm": 0.10990146900045704, "grad_max_sv": 0.0026134482119232415, "grad_min_sv": 0.0, "grad_condition": 2613448211.9232416, "lr": 0.0008852566213878943, "time_sec": 124.36949467658997 }, { "epoch": 34, "train_loss": 6.577264302215577, "train_acc": 0.0092, "test_loss": 4.605177014923096, "test_acc": 0.01, "lyapunov": 2.463475263941928, "grad_norm": 0.12976444128871847, "grad_max_sv": 0.0009734443388879299, "grad_min_sv": 0.0, "grad_condition": 973444338.8879299, "lr": 0.000878497527825878, "time_sec": 124.3325207233429 }, { "epoch": 35, "train_loss": 6.587216622314453, "train_acc": 0.00888, "test_loss": 4.636661901855469, "test_acc": 0.01, "lyapunov": 2.4681083863348605, "grad_norm": 0.13220591916165889, "grad_max_sv": 0.00457856860011816, "grad_min_sv": 0.0, "grad_condition": 4578568600.118161, "lr": 0.000871572412738697, "time_sec": 124.3110682964325 }, { "epoch": 36, "train_loss": 6.592979219360352, "train_acc": 0.0092, "test_loss": 4.6051753067016605, "test_acc": 0.01, "lyapunov": 2.4714617686503377, "grad_norm": 0.1239857838330967, "grad_max_sv": 0.0005948701407760381, "grad_min_sv": 0.0, "grad_condition": 594870140.7760382, "lr": 0.0008644843137107055, "time_sec": 124.4406750202179 }, { "epoch": 37, "train_loss": 6.613644898376465, "train_acc": 0.00858, "test_loss": 4.605174197387695, "test_acc": 0.01, "lyapunov": 2.48187786294981, "grad_norm": 0.18028613006863556, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008572363398164014, "time_sec": 124.42482614517212 }, { "epoch": 38, "train_loss": 6.598032460021972, "train_acc": 0.00866, "test_loss": 4.605173423004151, "test_acc": 0.01, "lyapunov": 2.4748510588770327, "grad_norm": 0.17702039657703328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008498316702566826, "time_sec": 124.38127946853638 }, { "epoch": 39, "train_loss": 6.595033478546142, "train_acc": 0.00904, "test_loss": 4.605172880554199, "test_acc": 0.01, "lyapunov": 2.4724140514803055, "grad_norm": 0.1406852681746766, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008422735529643442, "time_sec": 124.27310037612915 }, { "epoch": 40, "train_loss": 6.607061416625976, "train_acc": 0.00882, "test_loss": 4.605173010253906, "test_acc": 0.01, "lyapunov": 2.4797774525859473, "grad_norm": 0.1602364870035822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008345653031794289, "time_sec": 124.35175013542175 }, { "epoch": 41, "train_loss": 6.652051022644043, "train_acc": 0.00868, "test_loss": 4.60517377319336, "test_acc": 0.01, "lyapunov": 2.494590156218585, "grad_norm": 0.1877202250366353, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008267103019950526, "time_sec": 124.42674827575684 }, { "epoch": 42, "train_loss": 6.609013889770508, "train_acc": 0.00818, "test_loss": 4.60517264328003, "test_acc": 0.01, "lyapunov": 2.4807275219646563, "grad_norm": 0.19291631462520265, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743447, "time_sec": 124.38730263710022 }, { "epoch": 43, "train_loss": 6.573144034423828, "train_acc": 0.0082, "test_loss": 4.6051730613708495, "test_acc": 0.01, "lyapunov": 2.4609296730412242, "grad_norm": 0.09628320238477034, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000810573890139155, "time_sec": 124.36512160301208 }, { "epoch": 44, "train_loss": 6.575241811828613, "train_acc": 0.00884, "test_loss": 4.605172496032715, "test_acc": 0.01, "lyapunov": 2.462244158205779, "grad_norm": 0.10484293099591814, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008022995574311873, "time_sec": 124.30067491531372 }, { "epoch": 45, "train_loss": 6.594184577026367, "train_acc": 0.00936, "test_loss": 4.605172833251953, "test_acc": 0.01, "lyapunov": 2.4732542019670882, "grad_norm": 0.16310890352013555, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462363, "time_sec": 124.42177891731262 }, { "epoch": 46, "train_loss": 6.577082351989746, "train_acc": 0.00882, "test_loss": 4.605172598266601, "test_acc": 0.01, "lyapunov": 2.463544076665893, "grad_norm": 0.10037821136236143, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007853567838422158, "time_sec": 124.40465664863586 }, { "epoch": 47, "train_loss": 6.5774040518188475, "train_acc": 0.00862, "test_loss": 4.605172250366211, "test_acc": 0.01, "lyapunov": 2.4635354655478006, "grad_norm": 0.1162215297313361, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007766957746216719, "time_sec": 124.41038012504578 }, { "epoch": 48, "train_loss": 6.6083132769775395, "train_acc": 0.0086, "test_loss": 4.605171835327148, "test_acc": 0.01, "lyapunov": 2.4782137511026523, "grad_norm": 0.17135162198913576, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894982, "time_sec": 124.31084632873535 }, { "epoch": 49, "train_loss": 6.604438779449463, "train_acc": 0.0088, "test_loss": 4.60517212600708, "test_acc": 0.01, "lyapunov": 2.478019986311188, "grad_norm": 0.16895443836343932, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000759013504686565, "time_sec": 124.28308844566345 }, { "epoch": 50, "train_loss": 6.588782655029297, "train_acc": 0.00888, "test_loss": 4.605172025299073, "test_acc": 0.01, "lyapunov": 2.470017822197331, "grad_norm": 0.12889442183383476, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007499999999999998, "time_sec": 124.42897295951843 }, { "epoch": 51, "train_loss": 6.601284326782227, "train_acc": 0.00796, "test_loss": 4.6051717948913575, "test_acc": 0.01, "lyapunov": 2.4773334834886636, "grad_norm": 0.17649093442856895, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508575, "time_sec": 124.39905118942261 }, { "epoch": 52, "train_loss": 6.575957306518554, "train_acc": 0.00918, "test_loss": 4.6051720420837405, "test_acc": 0.01, "lyapunov": 2.46280481565334, "grad_norm": 0.0968044467412458, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007316480175599307, "time_sec": 124.42980766296387 }, { "epoch": 53, "train_loss": 6.587701625518799, "train_acc": 0.00872, "test_loss": 4.6051725509643555, "test_acc": 0.01, "lyapunov": 2.4698515999347657, "grad_norm": 0.13994770283254052, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007223175895924635, "time_sec": 124.28514337539673 }, { "epoch": 54, "train_loss": 6.578931684265137, "train_acc": 0.00938, "test_loss": 4.605171647644043, "test_acc": 0.01, "lyapunov": 2.464453091097, "grad_norm": 0.104587329873943, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 124.3464949131012 }, { "epoch": 55, "train_loss": 6.610985378723145, "train_acc": 0.00822, "test_loss": 4.605172131347656, "test_acc": 0.01, "lyapunov": 2.4811968675354863, "grad_norm": 0.23664084539084446, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007033683215378998, "time_sec": 124.3919792175293 }, { "epoch": 56, "train_loss": 6.577887360839844, "train_acc": 0.0089, "test_loss": 4.605171892547608, "test_acc": 0.01, "lyapunov": 2.4638065877168076, "grad_norm": 0.12418210732155195, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 124.42023730278015 }, { "epoch": 57, "train_loss": 6.575769240722656, "train_acc": 0.00934, "test_loss": 4.605171751403809, "test_acc": 0.01, "lyapunov": 2.4626593559294405, "grad_norm": 0.08871385738467265, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423388, "time_sec": 124.39303755760193 }, { "epoch": 58, "train_loss": 6.649054284973144, "train_acc": 0.00788, "test_loss": 4.6051721786499025, "test_acc": 0.01, "lyapunov": 2.4995590183131227, "grad_norm": 0.26439944389263503, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006742860236609073, "time_sec": 124.30309414863586 }, { "epoch": 59, "train_loss": 6.620378266906738, "train_acc": 0.0087, "test_loss": 4.605171722412109, "test_acc": 0.01, "lyapunov": 2.4861825994213524, "grad_norm": 0.2011814553286534, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006644333233692913, "time_sec": 124.40799474716187 }, { "epoch": 60, "train_loss": 6.615863608703613, "train_acc": 0.00898, "test_loss": 4.605171568298339, "test_acc": 0.01, "lyapunov": 2.4820322356260647, "grad_norm": 0.16244295400836278, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874734, "time_sec": 124.44055390357971 }, { "epoch": 61, "train_loss": 6.62539726638794, "train_acc": 0.00854, "test_loss": 4.605171578979492, "test_acc": 0.01, "lyapunov": 2.4873651598420596, "grad_norm": 0.18579251012972714, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006445158984722354, "time_sec": 124.47138166427612 }, { "epoch": 62, "train_loss": 6.591934550476074, "train_acc": 0.00868, "test_loss": 4.605171854400635, "test_acc": 0.01, "lyapunov": 2.471130254018642, "grad_norm": 0.14241384092347348, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 124.35206151008606 }, { "epoch": 63, "train_loss": 6.607412483825684, "train_acc": 0.00866, "test_loss": 4.605171817779541, "test_acc": 0.01, "lyapunov": 2.4772931200159176, "grad_norm": 0.12000050103102612, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 124.31255435943604 }, { "epoch": 64, "train_loss": 6.574604081420898, "train_acc": 0.0084, "test_loss": 4.60517174911499, "test_acc": 0.01, "lyapunov": 2.461947503297225, "grad_norm": 0.11837720061951122, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 124.42598223686218 }, { "epoch": 65, "train_loss": 6.669198082733154, "train_acc": 0.00846, "test_loss": 4.605171404266358, "test_acc": 0.01, "lyapunov": 2.50827671865673, "grad_norm": 0.3654068480597362, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006039558454088793, "time_sec": 124.41292977333069 }, { "epoch": 66, "train_loss": 6.576071541442871, "train_acc": 0.00868, "test_loss": 4.60517176437378, "test_acc": 0.01, "lyapunov": 2.462862340995418, "grad_norm": 0.0924056370989614, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 124.44835186004639 }, { "epoch": 67, "train_loss": 6.623493032073974, "train_acc": 0.00798, "test_loss": 4.605171159362793, "test_acc": 0.01, "lyapunov": 2.4856161059016157, "grad_norm": 0.23515698863564433, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 124.32646751403809 }, { "epoch": 68, "train_loss": 6.58642106048584, "train_acc": 0.00814, "test_loss": 4.605171382141113, "test_acc": 0.01, "lyapunov": 2.4687487658332374, "grad_norm": 0.10028160631921758, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005730415142812054, "time_sec": 124.34812188148499 }, { "epoch": 69, "train_loss": 6.612601704254151, "train_acc": 0.00846, "test_loss": 4.605171432495117, "test_acc": 0.01, "lyapunov": 2.478518716514568, "grad_norm": 0.16428393693339724, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 124.40169882774353 }, { "epoch": 70, "train_loss": 6.594199375915528, "train_acc": 0.0078, "test_loss": 4.605171556854248, "test_acc": 0.01, "lyapunov": 2.4733456675048986, "grad_norm": 0.13222269600542105, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005522642316338265, "time_sec": 124.43159890174866 }, { "epoch": 71, "train_loss": 6.584797274169921, "train_acc": 0.00884, "test_loss": 4.605171443176269, "test_acc": 0.01, "lyapunov": 2.468046905439528, "grad_norm": 0.09698860702372256, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005418389216661573, "time_sec": 124.38395667076111 }, { "epoch": 72, "train_loss": 6.62336443145752, "train_acc": 0.00826, "test_loss": 4.60517096862793, "test_acc": 0.01, "lyapunov": 2.486185181171388, "grad_norm": 0.20758922397897858, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646563, "time_sec": 124.28166174888611 }, { "epoch": 73, "train_loss": 6.624484212188721, "train_acc": 0.00906, "test_loss": 4.6051707977294924, "test_acc": 0.01, "lyapunov": 2.487110945879651, "grad_norm": 0.19977656643109526, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005209378268645994, "time_sec": 124.35272693634033 }, { "epoch": 74, "train_loss": 6.603300393676758, "train_acc": 0.0091, "test_loss": 4.605170932006836, "test_acc": 0.01, "lyapunov": 2.477061335083164, "grad_norm": 0.16600248799904951, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005104712099416781, "time_sec": 124.40994596481323 }, { "epoch": 75, "train_loss": 6.5982538143920895, "train_acc": 0.00856, "test_loss": 4.605171234130859, "test_acc": 0.01, "lyapunov": 2.473140881799371, "grad_norm": 0.16128953646649988, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 124.43308448791504 }, { "epoch": 76, "train_loss": 6.592834194946289, "train_acc": 0.00854, "test_loss": 4.605171026611328, "test_acc": 0.01, "lyapunov": 2.47263060750254, "grad_norm": 0.1340374980962284, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 124.34016180038452 }, { "epoch": 77, "train_loss": 6.584505953979492, "train_acc": 0.00864, "test_loss": 4.605171239471436, "test_acc": 0.01, "lyapunov": 2.4676697760286843, "grad_norm": 0.11435356827937113, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004790621731353997, "time_sec": 124.3169755935669 }, { "epoch": 78, "train_loss": 6.5763300253295895, "train_acc": 0.00884, "test_loss": 4.6051710525512695, "test_acc": 0.01, "lyapunov": 2.4630901801311755, "grad_norm": 0.08961847488711042, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 124.3459620475769 }, { "epoch": 79, "train_loss": 6.575958716125489, "train_acc": 0.00932, "test_loss": 4.605170614624023, "test_acc": 0.01, "lyapunov": 2.462890618902338, "grad_norm": 0.0894392700212742, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 124.39721941947937 }, { "epoch": 80, "train_loss": 6.57727864440918, "train_acc": 0.00828, "test_loss": 4.6051712982177735, "test_acc": 0.01, "lyapunov": 2.4634996923949104, "grad_norm": 0.09357159928827649, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 124.43293237686157 }, { "epoch": 81, "train_loss": 6.576623619689942, "train_acc": 0.00858, "test_loss": 4.60517075958252, "test_acc": 0.01, "lyapunov": 2.4632719782612207, "grad_norm": 0.08778044836554635, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 124.33877468109131 }, { "epoch": 82, "train_loss": 6.706115616912842, "train_acc": 0.00852, "test_loss": 4.60517084274292, "test_acc": 0.01, "lyapunov": 2.5237014750995295, "grad_norm": 0.35892654821663944, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004269584857187939, "time_sec": 124.33198618888855 }, { "epoch": 83, "train_loss": 6.693132893981933, "train_acc": 0.00928, "test_loss": 4.605170736694336, "test_acc": 0.01, "lyapunov": 2.5217734712468998, "grad_norm": 0.37154817796859707, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004166156266419484, "time_sec": 124.33878684043884 }, { "epoch": 84, "train_loss": 6.673238817443847, "train_acc": 0.00904, "test_loss": 4.605171113586426, "test_acc": 0.01, "lyapunov": 2.5138309251926745, "grad_norm": 0.48242670306903057, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 124.42056584358215 }, { "epoch": 85, "train_loss": 6.597096472473145, "train_acc": 0.0083, "test_loss": 4.605170780181885, "test_acc": 0.01, "lyapunov": 2.4718706601720943, "grad_norm": 0.13232535416814104, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003960441545911199, "time_sec": 124.43193411827087 }, { "epoch": 86, "train_loss": 6.575025537414551, "train_acc": 0.00834, "test_loss": 4.6051709815979, "test_acc": 0.01, "lyapunov": 2.4622172730048293, "grad_norm": 0.11156499374939659, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 124.34226822853088 }, { "epoch": 87, "train_loss": 6.573478553161621, "train_acc": 0.00842, "test_loss": 4.605170571899414, "test_acc": 0.01, "lyapunov": 2.4612386501048835, "grad_norm": 0.09079297617092336, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 124.27930355072021 }, { "epoch": 88, "train_loss": 6.5734689576721195, "train_acc": 0.00854, "test_loss": 4.605170808410644, "test_acc": 0.01, "lyapunov": 2.461263867595312, "grad_norm": 0.09120456341783888, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 124.38532066345215 }, { "epoch": 89, "train_loss": 6.578163130187988, "train_acc": 0.00852, "test_loss": 4.605170602416992, "test_acc": 0.01, "lyapunov": 2.4642753814492386, "grad_norm": 0.09559837141233972, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 124.44146919250488 }, { "epoch": 90, "train_loss": 6.5798112936401365, "train_acc": 0.0083, "test_loss": 4.605170631408692, "test_acc": 0.01, "lyapunov": 2.4649541908517825, "grad_norm": 0.09735485237927284, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 124.39319109916687 }, { "epoch": 91, "train_loss": 6.574903171081543, "train_acc": 0.0083, "test_loss": 4.605170557403564, "test_acc": 0.01, "lyapunov": 2.4621782180903207, "grad_norm": 0.08981548140002098, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 124.35036778450012 }, { "epoch": 92, "train_loss": 6.5757408012390135, "train_acc": 0.00836, "test_loss": 4.605170684814453, "test_acc": 0.01, "lyapunov": 2.4627471470162083, "grad_norm": 0.08817445544280453, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 124.33928322792053 }, { "epoch": 93, "train_loss": 6.612554905395508, "train_acc": 0.00834, "test_loss": 4.605170486450195, "test_acc": 0.01, "lyapunov": 2.4806297959574044, "grad_norm": 0.1882025016044833, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 124.40910911560059 }, { "epoch": 94, "train_loss": 6.595741138000489, "train_acc": 0.00806, "test_loss": 4.60517061920166, "test_acc": 0.01, "lyapunov": 2.472626593411731, "grad_norm": 0.16104566409905433, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 124.41845726966858 }, { "epoch": 95, "train_loss": 6.5987700848388675, "train_acc": 0.0085, "test_loss": 4.605170571899414, "test_acc": 0.01, "lyapunov": 2.4736888725739306, "grad_norm": 0.1552458690168984, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 124.34644985198975 }, { "epoch": 96, "train_loss": 6.597373901672364, "train_acc": 0.00828, "test_loss": 4.6051704193115235, "test_acc": 0.01, "lyapunov": 2.473390321902302, "grad_norm": 0.1443472451352086, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 124.32696723937988 }, { "epoch": 97, "train_loss": 6.590096541442871, "train_acc": 0.00862, "test_loss": 4.6051705436706545, "test_acc": 0.01, "lyapunov": 2.4693754414463287, "grad_norm": 0.11035396630097889, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 124.30454087257385 }, { "epoch": 98, "train_loss": 6.70725288696289, "train_acc": 0.00854, "test_loss": 4.605170336151123, "test_acc": 0.01, "lyapunov": 2.529677952037138, "grad_norm": 0.5122066284498856, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 124.31350612640381 }, { "epoch": 99, "train_loss": 6.575984575958252, "train_acc": 0.0085, "test_loss": 4.60517036895752, "test_acc": 0.01, "lyapunov": 2.462917518737676, "grad_norm": 0.08798552577224787, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 124.33125352859497 }, { "epoch": 100, "train_loss": 6.575890505371094, "train_acc": 0.00856, "test_loss": 4.605170387268067, "test_acc": 0.01, "lyapunov": 2.462910512524188, "grad_norm": 0.08984849200071802, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 124.41467308998108 }, { "epoch": 101, "train_loss": 6.5755246405029295, "train_acc": 0.00866, "test_loss": 4.605170295715332, "test_acc": 0.01, "lyapunov": 2.4626409702593715, "grad_norm": 0.08833234367069784, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 124.4282865524292 }, { "epoch": 102, "train_loss": 6.578647835388184, "train_acc": 0.00874, "test_loss": 4.60517028503418, "test_acc": 0.01, "lyapunov": 2.4644368957070744, "grad_norm": 0.0881800871840224, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 124.39285898208618 }, { "epoch": 103, "train_loss": 6.603837554931641, "train_acc": 0.0081, "test_loss": 4.605170309448242, "test_acc": 0.01, "lyapunov": 2.475680511016065, "grad_norm": 0.12862246002842495, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 124.30171847343445 }, { "epoch": 104, "train_loss": 6.589783010559082, "train_acc": 0.0087, "test_loss": 4.605170768737793, "test_acc": 0.01, "lyapunov": 2.469147738898197, "grad_norm": 0.1132666503606524, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 124.33115792274475 }, { "epoch": 105, "train_loss": 6.607209113769532, "train_acc": 0.00868, "test_loss": 4.605170411682129, "test_acc": 0.01, "lyapunov": 2.4791276979324457, "grad_norm": 0.19473222939710866, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 124.42748808860779 }, { "epoch": 106, "train_loss": 6.605109618988037, "train_acc": 0.00876, "test_loss": 4.605170632171631, "test_acc": 0.01, "lyapunov": 2.4781547934198014, "grad_norm": 0.19321601949412123, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 124.40237879753113 }, { "epoch": 107, "train_loss": 6.5744285192871095, "train_acc": 0.0084, "test_loss": 4.605170581054687, "test_acc": 0.01, "lyapunov": 2.461912363081637, "grad_norm": 0.09153624986240072, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 124.35668659210205 }, { "epoch": 108, "train_loss": 6.591736253662109, "train_acc": 0.009, "test_loss": 4.605170578002929, "test_acc": 0.01, "lyapunov": 2.469679483672237, "grad_norm": 0.17005631477257033, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 124.29520559310913 }, { "epoch": 109, "train_loss": 6.618268890991211, "train_acc": 0.00898, "test_loss": 4.605170452880859, "test_acc": 0.01, "lyapunov": 2.4846892923955113, "grad_norm": 0.22506407024101205, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 124.44524145126343 }, { "epoch": 110, "train_loss": 6.588956251525879, "train_acc": 0.0079, "test_loss": 4.605170387268067, "test_acc": 0.01, "lyapunov": 2.4697647594734837, "grad_norm": 0.1497151598092074, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 124.427237033844 }, { "epoch": 111, "train_loss": 6.597999030761719, "train_acc": 0.0082, "test_loss": 4.605170532226563, "test_acc": 0.01, "lyapunov": 2.47352661866971, "grad_norm": 0.1265460364033806, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 124.4067976474762 }, { "epoch": 112, "train_loss": 6.581220099945068, "train_acc": 0.00878, "test_loss": 4.605170124816895, "test_acc": 0.01, "lyapunov": 2.466078118595016, "grad_norm": 0.1166543211179088, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 124.3555097579956 }, { "epoch": 113, "train_loss": 6.5873154238891605, "train_acc": 0.00902, "test_loss": 4.605170477294922, "test_acc": 0.01, "lyapunov": 2.467848820454629, "grad_norm": 0.11336040865405435, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 124.34751081466675 }, { "epoch": 114, "train_loss": 6.575267355041504, "train_acc": 0.00892, "test_loss": 4.60517041015625, "test_acc": 0.01, "lyapunov": 2.4624666978636056, "grad_norm": 0.0882429459696398, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 124.43968343734741 }, { "epoch": 115, "train_loss": 6.575747386169434, "train_acc": 0.0087, "test_loss": 4.60517027130127, "test_acc": 0.01, "lyapunov": 2.46279121481854, "grad_norm": 0.08906865623909292, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 124.40401101112366 }, { "epoch": 116, "train_loss": 6.574066097106933, "train_acc": 0.00888, "test_loss": 4.605170015716553, "test_acc": 0.01, "lyapunov": 2.4617425267348816, "grad_norm": 0.09299280580563789, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 124.43384170532227 }, { "epoch": 117, "train_loss": 6.575292884674072, "train_acc": 0.00916, "test_loss": 4.605170446777343, "test_acc": 0.01, "lyapunov": 2.462491541567361, "grad_norm": 0.08789900440919356, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 124.31648087501526 }, { "epoch": 118, "train_loss": 6.578267410125733, "train_acc": 0.00826, "test_loss": 4.605170466613769, "test_acc": 0.01, "lyapunov": 2.4644045262690395, "grad_norm": 0.10415607883931481, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 124.33564472198486 }, { "epoch": 119, "train_loss": 6.574555395050049, "train_acc": 0.00854, "test_loss": 4.605170401000977, "test_acc": 0.01, "lyapunov": 2.4620885909975643, "grad_norm": 0.08778921241218508, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 124.65056228637695 }, { "epoch": 120, "train_loss": 6.583910481872558, "train_acc": 0.00864, "test_loss": 4.605170470428467, "test_acc": 0.01, "lyapunov": 2.467699810671989, "grad_norm": 0.3040678237626765, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 124.44140434265137 }, { "epoch": 121, "train_loss": 6.586020791015625, "train_acc": 0.00884, "test_loss": 4.605170375823975, "test_acc": 0.01, "lyapunov": 2.467914994720303, "grad_norm": 0.11635906922176238, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 124.43893909454346 }, { "epoch": 122, "train_loss": 6.576034954528809, "train_acc": 0.0088, "test_loss": 4.605170199584961, "test_acc": 0.01, "lyapunov": 2.463029363880987, "grad_norm": 0.08771533827211757, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 124.32056403160095 }, { "epoch": 123, "train_loss": 6.574589498291016, "train_acc": 0.00878, "test_loss": 4.605170094299316, "test_acc": 0.01, "lyapunov": 2.4620493037621385, "grad_norm": 0.08813480095873011, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 124.4015576839447 }, { "epoch": 124, "train_loss": 6.576157915649414, "train_acc": 0.00904, "test_loss": 4.605170024108887, "test_acc": 0.01, "lyapunov": 2.4630649205668806, "grad_norm": 0.08749001934915172, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 124.42104578018188 }, { "epoch": 125, "train_loss": 6.579862565307617, "train_acc": 0.00876, "test_loss": 4.605170492553711, "test_acc": 0.01, "lyapunov": 2.465126996759868, "grad_norm": 0.09372036345061274, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 124.4746482372284 }, { "epoch": 126, "train_loss": 6.577153359985352, "train_acc": 0.00866, "test_loss": 4.605170122528076, "test_acc": 0.01, "lyapunov": 2.463735998134174, "grad_norm": 0.09613135620568294, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 124.38881230354309 }, { "epoch": 127, "train_loss": 6.574400754547119, "train_acc": 0.0083, "test_loss": 4.605170375823975, "test_acc": 0.01, "lyapunov": 2.4619021769374836, "grad_norm": 0.08860379526254596, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 124.31344938278198 }, { "epoch": 128, "train_loss": 6.571165360717774, "train_acc": 0.00878, "test_loss": 4.605170154571534, "test_acc": 0.01, "lyapunov": 2.459857079074206, "grad_norm": 0.08757319736074258, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 124.39138221740723 }, { "epoch": 129, "train_loss": 6.575437990264892, "train_acc": 0.00846, "test_loss": 4.605170350646973, "test_acc": 0.01, "lyapunov": 2.46259711831427, "grad_norm": 0.08813574783200358, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 124.41060423851013 }, { "epoch": 130, "train_loss": 6.591315377197265, "train_acc": 0.00954, "test_loss": 4.605170065307617, "test_acc": 0.01, "lyapunov": 2.4702539943978, "grad_norm": 0.11366316284903058, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 124.4502763748169 }, { "epoch": 131, "train_loss": 6.577392526092529, "train_acc": 0.00946, "test_loss": 4.60517007446289, "test_acc": 0.01, "lyapunov": 2.46386312401813, "grad_norm": 0.08820500519427996, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 124.3550136089325 }, { "epoch": 132, "train_loss": 6.592328434906006, "train_acc": 0.00882, "test_loss": 4.6051704208374025, "test_acc": 0.01, "lyapunov": 2.4700996772102686, "grad_norm": 0.114161955094371, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 124.37056255340576 }, { "epoch": 133, "train_loss": 6.588796159973144, "train_acc": 0.00896, "test_loss": 4.605170506286621, "test_acc": 0.01, "lyapunov": 2.468394133745862, "grad_norm": 0.1295209594512649, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 124.36608004570007 }, { "epoch": 134, "train_loss": 6.576412990264893, "train_acc": 0.00898, "test_loss": 4.605170251464844, "test_acc": 0.01, "lyapunov": 2.4632679434383618, "grad_norm": 0.08812453692162578, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 124.43608951568604 }, { "epoch": 135, "train_loss": 6.5760765690612795, "train_acc": 0.00924, "test_loss": 4.605169999694824, "test_acc": 0.01, "lyapunov": 2.463012531895162, "grad_norm": 0.08722595509863246, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 124.46503901481628 }, { "epoch": 136, "train_loss": 6.575435556030273, "train_acc": 0.00884, "test_loss": 4.605170062255859, "test_acc": 0.01, "lyapunov": 2.4626583150585595, "grad_norm": 0.08796433458523298, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 124.34801983833313 }, { "epoch": 137, "train_loss": 6.575190331268311, "train_acc": 0.00934, "test_loss": 4.6051701629638675, "test_acc": 0.01, "lyapunov": 2.4624439023644724, "grad_norm": 0.08813731535348707, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 124.35173964500427 }, { "epoch": 138, "train_loss": 6.574904625091553, "train_acc": 0.0089, "test_loss": 4.60517007446289, "test_acc": 0.01, "lyapunov": 2.4622641213409735, "grad_norm": 0.08807062213809792, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 124.40467262268066 }, { "epoch": 139, "train_loss": 6.5738159555053715, "train_acc": 0.00926, "test_loss": 4.605170321655273, "test_acc": 0.01, "lyapunov": 2.4615705336451223, "grad_norm": 0.08717896516246301, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 124.4789035320282 }, { "epoch": 140, "train_loss": 6.575532109680176, "train_acc": 0.00924, "test_loss": 4.605170358276367, "test_acc": 0.01, "lyapunov": 2.4626962266614676, "grad_norm": 0.0882680648293281, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 124.40317368507385 }, { "epoch": 141, "train_loss": 6.5800046757507324, "train_acc": 0.00862, "test_loss": 4.60517036895752, "test_acc": 0.01, "lyapunov": 2.4654090264264275, "grad_norm": 0.11343015603036581, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 124.35891890525818 }, { "epoch": 142, "train_loss": 6.57490125793457, "train_acc": 0.00948, "test_loss": 4.6051704162597655, "test_acc": 0.01, "lyapunov": 2.462258317586406, "grad_norm": 0.08755517239002598, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 124.29203748703003 }, { "epoch": 143, "train_loss": 6.576884376220703, "train_acc": 0.00966, "test_loss": 4.605170155334473, "test_acc": 0.01, "lyapunov": 2.4635954634917665, "grad_norm": 0.08753943717047542, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 124.41098976135254 }, { "epoch": 144, "train_loss": 6.573677404937744, "train_acc": 0.00962, "test_loss": 4.60517022857666, "test_acc": 0.01, "lyapunov": 2.461500019673496, "grad_norm": 0.08775396126300311, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 124.44748258590698 }, { "epoch": 145, "train_loss": 6.573780137023926, "train_acc": 0.0092, "test_loss": 4.605170056152343, "test_acc": 0.01, "lyapunov": 2.4615867387913073, "grad_norm": 0.08734584455870835, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 124.4104528427124 }, { "epoch": 146, "train_loss": 6.574326271667481, "train_acc": 0.00928, "test_loss": 4.605170436859131, "test_acc": 0.01, "lyapunov": 2.4619192083168517, "grad_norm": 0.08784696936548642, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 124.3491895198822 }, { "epoch": 147, "train_loss": 6.573583771209717, "train_acc": 0.00938, "test_loss": 4.605170133209229, "test_acc": 0.01, "lyapunov": 2.461428134947482, "grad_norm": 0.08718184577116198, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 124.33614110946655 }, { "epoch": 148, "train_loss": 6.577077916870117, "train_acc": 0.01, "test_loss": 4.605170425415039, "test_acc": 0.01, "lyapunov": 2.4637341109078252, "grad_norm": 0.08788027221282606, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 124.37565398216248 }, { "epoch": 149, "train_loss": 6.5732455339050295, "train_acc": 0.01, "test_loss": 4.605170333862305, "test_acc": 0.01, "lyapunov": 2.461217089382279, "grad_norm": 0.08788179142338205, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 124.34460210800171 }, { "epoch": 150, "train_loss": 6.574304178619385, "train_acc": 0.01, "test_loss": 4.605170114135742, "test_acc": 0.01, "lyapunov": 2.4619127923570328, "grad_norm": 0.08771827398079268, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 124.40945982933044 } ], "16": [ { "epoch": 1, "train_loss": 13.988400897827148, "train_acc": 0.01438, "test_loss": 4.683009733581543, "test_acc": 0.0106, "lyapunov": 5.045674181960123, "grad_norm": 5.752499013515142, "grad_max_sv": 4.6983559966087345, "grad_min_sv": 8.501930549228987e-08, "grad_condition": 317270864.69818985, "lr": 0.0009998903417374227, "time_sec": 167.40048050880432 }, { "epoch": 2, "train_loss": 9.313672403564453, "train_acc": 0.01648, "test_loss": 4.631449128723145, "test_acc": 0.01, "lyapunov": 3.775117972317864, "grad_norm": 4.062466764062373, "grad_max_sv": 3.613509923219681, "grad_min_sv": 4.5653093948966327e-08, "grad_condition": 646545370.9190311, "lr": 0.0009995614150494292, "time_sec": 167.42056441307068 }, { "epoch": 3, "train_loss": 9.2102595413208, "train_acc": 0.01704, "test_loss": 4.625689315795898, "test_acc": 0.0099, "lyapunov": 3.769411094353327, "grad_norm": 3.2423057609153028, "grad_max_sv": 2.773962843418121, "grad_min_sv": 1.3365777420984947e-08, "grad_condition": 79084430364.82771, "lr": 0.0009990133642141358, "time_sec": 167.40087485313416 }, { "epoch": 4, "train_loss": 8.593553448181153, "train_acc": 0.01608, "test_loss": 4.623868472290039, "test_acc": 0.01, "lyapunov": 3.5245635119240606, "grad_norm": 2.236847501376478, "grad_max_sv": 1.9526167243719101, "grad_min_sv": 4.5824498221260444e-11, "grad_condition": 250389376731.7333, "lr": 0.0009982464296247522, "time_sec": 167.34348464012146 }, { "epoch": 5, "train_loss": 7.8038157984924315, "train_acc": 0.01666, "test_loss": 4.618056827545166, "test_acc": 0.01, "lyapunov": 3.1676931515374145, "grad_norm": 1.5048980928317333, "grad_max_sv": 1.1324948772788048, "grad_min_sv": 1.5125593644607378e-11, "grad_condition": 218348544809.20728, "lr": 0.0009972609476841367, "time_sec": 167.4401364326477 }, { "epoch": 6, "train_loss": 7.634129183959961, "train_acc": 0.01436, "test_loss": 4.617713563537598, "test_acc": 0.01, "lyapunov": 3.0711578097184904, "grad_norm": 1.9264530093156518, "grad_max_sv": 0.7561077677975927, "grad_min_sv": 2.3226373858483118e-12, "grad_condition": 319185362917.36163, "lr": 0.000996057350657239, "time_sec": 167.3985676765442 }, { "epoch": 7, "train_loss": 7.547255232238769, "train_acc": 0.01396, "test_loss": 4.614803285980225, "test_acc": 0.01, "lyapunov": 3.0217712657226015, "grad_norm": 1.075279960644913, "grad_max_sv": 0.6469582007612514, "grad_min_sv": 1.889760736503505e-12, "grad_condition": 338582040139.5369, "lr": 0.000994636166481494, "time_sec": 167.22783827781677 }, { "epoch": 8, "train_loss": 7.305741961669922, "train_acc": 0.01248, "test_loss": 4.611902558898926, "test_acc": 0.01, "lyapunov": 2.8956392976024268, "grad_norm": 1.304673575393078, "grad_max_sv": 0.4924972869455814, "grad_min_sv": 8.285040604573086e-13, "grad_condition": 334051794817.99695, "lr": 0.0009929980185352525, "time_sec": 167.31978368759155 }, { "epoch": 9, "train_loss": 7.328730865783691, "train_acc": 0.01336, "test_loss": 4.606002921295166, "test_acc": 0.01, "lyapunov": 2.913580340192751, "grad_norm": 1.4776699959663357, "grad_max_sv": 0.3292516863617735, "grad_min_sv": 5.235604182531881e-13, "grad_condition": 246744375025.40308, "lr": 0.0009911436253643444, "time_sec": 167.3429365158081 }, { "epoch": 10, "train_loss": 7.308604444580078, "train_acc": 0.01346, "test_loss": 4.611476264953613, "test_acc": 0.01, "lyapunov": 2.900581695234684, "grad_norm": 1.3123879020319187, "grad_max_sv": 0.27272568672558684, "grad_min_sv": 2.0496919726941882e-13, "grad_condition": 238625164756.47662, "lr": 0.0009890738003669028, "time_sec": 167.2653293609619 }, { "epoch": 11, "train_loss": 7.490302003173828, "train_acc": 0.01364, "test_loss": 4.611579527282715, "test_acc": 0.01, "lyapunov": 3.0006146321211324, "grad_norm": 2.2969507920003114, "grad_max_sv": 0.19786488203932162, "grad_min_sv": 8.37648333500382e-14, "grad_condition": 183815724532.2033, "lr": 0.00098678945143658, "time_sec": 167.22061586380005 }, { "epoch": 12, "train_loss": 7.307793238525391, "train_acc": 0.01262, "test_loss": 4.606186763000489, "test_acc": 0.01, "lyapunov": 2.9112238219327025, "grad_norm": 1.4729621434597777, "grad_max_sv": 0.2151564534753561, "grad_min_sv": 1.990284826719073e-14, "grad_condition": 211594713734.62634, "lr": 0.0009842915805643154, "time_sec": 167.35631036758423 }, { "epoch": 13, "train_loss": 7.459832763977051, "train_acc": 0.01172, "test_loss": 4.606186486053467, "test_acc": 0.01, "lyapunov": 2.9779586944433736, "grad_norm": 1.2584288878227161, "grad_max_sv": 0.17604726925492287, "grad_min_sv": 2.9740421215427092e-27, "grad_condition": 176047269254.9224, "lr": 0.000981581283398829, "time_sec": 167.55029773712158 }, { "epoch": 14, "train_loss": 7.959970283813477, "train_acc": 0.01162, "test_loss": 4.606137133789063, "test_acc": 0.01, "lyapunov": 3.224144145960698, "grad_norm": 1.3145379480759145, "grad_max_sv": 0.16056990809738636, "grad_min_sv": 6.069672152326662e-32, "grad_condition": 160569908097.38638, "lr": 0.0009786597487660333, "time_sec": 167.2209074497223 }, { "epoch": 15, "train_loss": 7.6532865875244145, "train_acc": 0.01084, "test_loss": 4.606105514526368, "test_acc": 0.01, "lyapunov": 3.0689418846384036, "grad_norm": 0.7741481577990978, "grad_max_sv": 0.1402381032705307, "grad_min_sv": 5.380285453775135e-40, "grad_condition": 140238103270.5307, "lr": 0.0009755282581475766, "time_sec": 167.3077232837677 }, { "epoch": 16, "train_loss": 7.216664337158203, "train_acc": 0.01118, "test_loss": 4.606032288360596, "test_acc": 0.01, "lyapunov": 2.8502078891715126, "grad_norm": 2.0735777194936222, "grad_max_sv": 0.10496805571019649, "grad_min_sv": 1.2874706397430962e-40, "grad_condition": 104968055710.1965, "lr": 0.0009721881851187403, "time_sec": 167.3395276069641 }, { "epoch": 17, "train_loss": 8.192574862670899, "train_acc": 0.01158, "test_loss": 4.6059588500976565, "test_acc": 0.01, "lyapunov": 3.3359562454321194, "grad_norm": 3.147348676481939, "grad_max_sv": 0.09904798325151205, "grad_min_sv": 3.313275631249688e-41, "grad_condition": 99047983251.51205, "lr": 0.0009686409947459456, "time_sec": 167.2007658481598 }, { "epoch": 18, "train_loss": 7.947704606018067, "train_acc": 0.01086, "test_loss": 4.605810301208496, "test_acc": 0.01, "lyapunov": 3.2087259890173403, "grad_norm": 1.1551680706222047, "grad_max_sv": 0.0897066842764616, "grad_min_sv": 3.5133705422167894e-42, "grad_condition": 89706684276.4616, "lr": 0.0009648882429441254, "time_sec": 167.2022511959076 }, { "epoch": 19, "train_loss": 8.011894176635742, "train_acc": 0.00998, "test_loss": 4.610458689880371, "test_acc": 0.01, "lyapunov": 3.247671382201602, "grad_norm": 0.789157877855446, "grad_max_sv": 0.04834392946213484, "grad_min_sv": 1.7516230804060213e-46, "grad_condition": 48343929462.134834, "lr": 0.00096093157579425, "time_sec": 167.33806610107422 }, { "epoch": 20, "train_loss": 8.051023805236817, "train_acc": 0.00904, "test_loss": 4.610909297180176, "test_acc": 0.01, "lyapunov": 3.2383710405100947, "grad_norm": 1.1273733660004814, "grad_max_sv": 0.010316886380314827, "grad_min_sv": 0.0, "grad_condition": 10316886380.314827, "lr": 0.0009567727288213001, "time_sec": 167.29369735717773 }, { "epoch": 21, "train_loss": 7.128181716918945, "train_acc": 0.00838, "test_loss": 4.607191325378418, "test_acc": 0.01, "lyapunov": 2.7860927539103475, "grad_norm": 1.0701329510796986, "grad_max_sv": 0.014478291012346744, "grad_min_sv": 0.0, "grad_condition": 14478291012.346745, "lr": 0.0009524135262330095, "time_sec": 167.20805835723877 }, { "epoch": 22, "train_loss": 6.963491222686768, "train_acc": 0.0091, "test_loss": 4.607380027770996, "test_acc": 0.01, "lyapunov": 2.6966084769314818, "grad_norm": 1.1730630244839415, "grad_max_sv": 0.012138673383742572, "grad_min_sv": 0.0, "grad_condition": 12138673383.742573, "lr": 0.0009478558801197061, "time_sec": 167.22877049446106 }, { "epoch": 23, "train_loss": 6.875370686798096, "train_acc": 0.00858, "test_loss": 4.609367184448242, "test_acc": 0.01, "lyapunov": 2.6493814430578286, "grad_norm": 1.3739908151868958, "grad_max_sv": 0.011468294635415077, "grad_min_sv": 0.0, "grad_condition": 11468294635.415077, "lr": 0.000943101789615607, "time_sec": 167.56782293319702 }, { "epoch": 24, "train_loss": 7.175245254516602, "train_acc": 0.00882, "test_loss": 4.6075513046264645, "test_acc": 0.01, "lyapunov": 2.813519052837206, "grad_norm": 1.9559849705093102, "grad_max_sv": 0.011112797912210226, "grad_min_sv": 0.0, "grad_condition": 11112797912.210226, "lr": 0.0009381533400219313, "time_sec": 167.2002296447754 }, { "epoch": 25, "train_loss": 6.835657153320312, "train_acc": 0.00898, "test_loss": 4.609123987579346, "test_acc": 0.01, "lyapunov": 2.6257676047742216, "grad_norm": 0.8499098981030252, "grad_max_sv": 0.010097978403791785, "grad_min_sv": 0.0, "grad_condition": 10097978403.791786, "lr": 0.0009330127018922189, "time_sec": 167.22895908355713 }, { "epoch": 26, "train_loss": 6.806944010009766, "train_acc": 0.00952, "test_loss": 4.608995832824707, "test_acc": 0.01, "lyapunov": 2.608501203224787, "grad_norm": 0.16959020377034753, "grad_max_sv": 0.009534611040726304, "grad_min_sv": 0.0, "grad_condition": 9534611040.726305, "lr": 0.000927682130080253, "time_sec": 167.30368304252625 }, { "epoch": 27, "train_loss": 6.796024333190918, "train_acc": 0.00918, "test_loss": 4.608860453033447, "test_acc": 0.01, "lyapunov": 2.601986149083013, "grad_norm": 0.10936615989500913, "grad_max_sv": 0.003977444209158421, "grad_min_sv": 0.0, "grad_condition": 3977444209.1584206, "lr": 0.0009221639627510072, "time_sec": 167.31120085716248 }, { "epoch": 28, "train_loss": 6.799691816711426, "train_acc": 0.00886, "test_loss": 4.6074915008544925, "test_acc": 0.01, "lyapunov": 2.604261659905124, "grad_norm": 0.09652074382540592, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009164606203550494, "time_sec": 167.08661937713623 }, { "epoch": 29, "train_loss": 6.8092449851989745, "train_acc": 0.00872, "test_loss": 4.608655583190918, "test_acc": 0.01, "lyapunov": 2.608830842825458, "grad_norm": 0.12376584460534797, "grad_max_sv": 0.002880856767296791, "grad_min_sv": 0.0, "grad_condition": 2880856767.296791, "lr": 0.0009105746045668516, "time_sec": 167.20095920562744 }, { "epoch": 30, "train_loss": 6.801117441558838, "train_acc": 0.00916, "test_loss": 4.608566645812989, "test_acc": 0.01, "lyapunov": 2.605140414689203, "grad_norm": 0.10511250252895085, "grad_max_sv": 0.0030666613951325417, "grad_min_sv": 0.0, "grad_condition": 3066661395.1325417, "lr": 0.0009045084971874733, "time_sec": 167.22371792793274 }, { "epoch": 31, "train_loss": 6.818323947296142, "train_acc": 0.00892, "test_loss": 4.607396678161621, "test_acc": 0.01, "lyapunov": 2.6131436501622507, "grad_norm": 0.17673479255010097, "grad_max_sv": 0.001358983526006341, "grad_min_sv": 0.0, "grad_condition": 1358983526.006341, "lr": 0.0008982649590120977, "time_sec": 167.21490716934204 }, { "epoch": 32, "train_loss": 6.81385307510376, "train_acc": 0.00854, "test_loss": 4.608588083648682, "test_acc": 0.01, "lyapunov": 2.61087080828674, "grad_norm": 0.1300116564110217, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008918467286629196, "time_sec": 167.17329859733582 }, { "epoch": 33, "train_loss": 6.798595635375976, "train_acc": 0.00848, "test_loss": 7.428785041809082, "test_acc": 0.01, "lyapunov": 2.603473731623891, "grad_norm": 0.10178851829698213, "grad_max_sv": 0.0006682275328785181, "grad_min_sv": 0.0, "grad_condition": 668227532.8785181, "lr": 0.0008852566213878943, "time_sec": 167.23122191429138 }, { "epoch": 34, "train_loss": 6.79622100402832, "train_acc": 0.0085, "test_loss": 7.445402703094483, "test_acc": 0.01, "lyapunov": 2.602201823383341, "grad_norm": 0.09821894401826198, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000878497527825878, "time_sec": 167.51045203208923 }, { "epoch": 35, "train_loss": 6.800452690124512, "train_acc": 0.0086, "test_loss": 4.6083794067382815, "test_acc": 0.01, "lyapunov": 2.604824850321426, "grad_norm": 0.09521574599597374, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000871572412738697, "time_sec": 167.14473628997803 }, { "epoch": 36, "train_loss": 6.801179714050293, "train_acc": 0.00882, "test_loss": 4.608353971862793, "test_acc": 0.01, "lyapunov": 2.605245649357281, "grad_norm": 0.09891258167661582, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107055, "time_sec": 167.21640372276306 }, { "epoch": 37, "train_loss": 6.798632629699707, "train_acc": 0.00856, "test_loss": 4.608331527709961, "test_acc": 0.01, "lyapunov": 2.603703239079936, "grad_norm": 0.09374120059954827, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008572363398164014, "time_sec": 167.28665328025818 }, { "epoch": 38, "train_loss": 6.798052488708496, "train_acc": 0.00864, "test_loss": 4.608306627655029, "test_acc": 0.01, "lyapunov": 2.6033894985228243, "grad_norm": 0.0928347460465077, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008498316702566826, "time_sec": 167.22592282295227 }, { "epoch": 39, "train_loss": 6.797720238189697, "train_acc": 0.00854, "test_loss": 4.608331230163574, "test_acc": 0.01, "lyapunov": 2.6030823568553876, "grad_norm": 0.1025783953694396, "grad_max_sv": 0.000793654378503561, "grad_min_sv": 0.0, "grad_condition": 793654378.503561, "lr": 0.0008422735529643442, "time_sec": 167.11991024017334 }, { "epoch": 40, "train_loss": 6.796907914123535, "train_acc": 0.00818, "test_loss": 7.429255201721191, "test_acc": 0.01, "lyapunov": 2.6026227175427215, "grad_norm": 0.09282398303274703, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008345653031794289, "time_sec": 167.28346157073975 }, { "epoch": 41, "train_loss": 6.811164211883545, "train_acc": 0.00882, "test_loss": 4.7162436149597164, "test_acc": 0.01, "lyapunov": 2.608923517529617, "grad_norm": 0.1222466987863888, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008267103019950526, "time_sec": 167.2502682209015 }, { "epoch": 42, "train_loss": 6.810527358703613, "train_acc": 0.00896, "test_loss": 4.736723460388184, "test_acc": 0.01, "lyapunov": 2.6098364740991227, "grad_norm": 0.12481417359397351, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743447, "time_sec": 167.19833540916443 }, { "epoch": 43, "train_loss": 6.8037118544006345, "train_acc": 0.0083, "test_loss": 4.676154768371582, "test_acc": 0.01, "lyapunov": 2.606640679147237, "grad_norm": 0.12856017826684152, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000810573890139155, "time_sec": 167.17452216148376 }, { "epoch": 44, "train_loss": 6.794667855529785, "train_acc": 0.00872, "test_loss": 4.7420101188659665, "test_acc": 0.01, "lyapunov": 2.6012551680855127, "grad_norm": 0.09209394266338691, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008022995574311873, "time_sec": 167.27408933639526 }, { "epoch": 45, "train_loss": 6.7950104260253905, "train_acc": 0.00898, "test_loss": 4.896900399780273, "test_acc": 0.01, "lyapunov": 2.6014791181325303, "grad_norm": 0.09205616000449629, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462363, "time_sec": 167.31984734535217 }, { "epoch": 46, "train_loss": 6.819086815185547, "train_acc": 0.00892, "test_loss": 4.605172099304199, "test_acc": 0.01, "lyapunov": 2.612778242896585, "grad_norm": 0.11562328930387418, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007853567838422158, "time_sec": 167.12109279632568 }, { "epoch": 47, "train_loss": 6.798819590454102, "train_acc": 0.00832, "test_loss": 4.605172010803223, "test_acc": 0.01, "lyapunov": 2.6037960967139515, "grad_norm": 0.09084227993519768, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007766957746216719, "time_sec": 167.26839470863342 }, { "epoch": 48, "train_loss": 6.797002004394531, "train_acc": 0.00882, "test_loss": 4.6051717926025395, "test_acc": 0.01, "lyapunov": 2.6027391889820928, "grad_norm": 0.09202982942979847, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894982, "time_sec": 167.25185203552246 }, { "epoch": 49, "train_loss": 6.799232456512451, "train_acc": 0.00864, "test_loss": 4.605324877929688, "test_acc": 0.01, "lyapunov": 2.6040493954173134, "grad_norm": 0.0929356327661651, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000759013504686565, "time_sec": 167.24265789985657 }, { "epoch": 50, "train_loss": 6.812471532135009, "train_acc": 0.00842, "test_loss": 4.608313929748535, "test_acc": 0.01, "lyapunov": 2.6102352337459163, "grad_norm": 0.11621130736417108, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007499999999999998, "time_sec": 167.15211701393127 }, { "epoch": 51, "train_loss": 6.794671293334961, "train_acc": 0.00842, "test_loss": 4.605172332763672, "test_acc": 0.01, "lyapunov": 2.6012639694506556, "grad_norm": 0.0930565557537395, "grad_max_sv": 0.0036748358979821205, "grad_min_sv": 0.0, "grad_condition": 3674835897.9821205, "lr": 0.0007408768370508575, "time_sec": 167.3388113975525 }, { "epoch": 52, "train_loss": 6.799352421264649, "train_acc": 0.00892, "test_loss": 4.605172877502441, "test_acc": 0.01, "lyapunov": 2.6041594795558765, "grad_norm": 0.09046235706111078, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007316480175599307, "time_sec": 168.00543642044067 }, { "epoch": 53, "train_loss": 6.821222294006348, "train_acc": 0.00822, "test_loss": 4.605560771179199, "test_acc": 0.01, "lyapunov": 2.612406419061334, "grad_norm": 0.10733736636185434, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007223175895924635, "time_sec": 167.15741348266602 }, { "epoch": 54, "train_loss": 6.7975339453125, "train_acc": 0.0087, "test_loss": 4.605171894073487, "test_acc": 0.01, "lyapunov": 2.603086569729973, "grad_norm": 0.09401396255246093, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 167.15016341209412 }, { "epoch": 55, "train_loss": 6.818788750457764, "train_acc": 0.00834, "test_loss": 4.60517187576294, "test_acc": 0.01, "lyapunov": 2.614099033653279, "grad_norm": 0.10409203954293918, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007033683215378998, "time_sec": 167.16365313529968 }, { "epoch": 56, "train_loss": 6.823291486663819, "train_acc": 0.00896, "test_loss": 4.605172322082519, "test_acc": 0.01, "lyapunov": 2.6149235838819345, "grad_norm": 0.1215199933903174, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 167.22393465042114 }, { "epoch": 57, "train_loss": 6.812863822021485, "train_acc": 0.00918, "test_loss": 4.605172196197509, "test_acc": 0.01, "lyapunov": 2.6100745280380444, "grad_norm": 0.11428618016798626, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423388, "time_sec": 167.36779832839966 }, { "epoch": 58, "train_loss": 6.845285939025879, "train_acc": 0.00852, "test_loss": 4.605171984863281, "test_acc": 0.01, "lyapunov": 2.621920944784608, "grad_norm": 0.16133795983355934, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006742860236609073, "time_sec": 167.1204113960266 }, { "epoch": 59, "train_loss": 6.8284387295532225, "train_acc": 0.00838, "test_loss": 4.605172086334228, "test_acc": 0.01, "lyapunov": 2.619316293150568, "grad_norm": 0.1660277007934849, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006644333233692913, "time_sec": 167.1542353630066 }, { "epoch": 60, "train_loss": 6.853109035339355, "train_acc": 0.00904, "test_loss": 4.605171766662598, "test_acc": 0.01, "lyapunov": 2.626850544644134, "grad_norm": 0.14505200146170139, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874734, "time_sec": 167.25803112983704 }, { "epoch": 61, "train_loss": 6.8587484286499025, "train_acc": 0.00894, "test_loss": 4.605171794128418, "test_acc": 0.01, "lyapunov": 2.6341320041500396, "grad_norm": 0.23780774328945256, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006445158984722354, "time_sec": 167.1593141555786 }, { "epoch": 62, "train_loss": 6.856730157775879, "train_acc": 0.00858, "test_loss": 4.605171855926514, "test_acc": 0.01, "lyapunov": 2.6288814319064246, "grad_norm": 0.19871702414437586, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 167.14994502067566 }, { "epoch": 63, "train_loss": 6.840637737731933, "train_acc": 0.00874, "test_loss": 4.60517123260498, "test_acc": 0.01, "lyapunov": 2.624538544803629, "grad_norm": 0.2247756960679524, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 167.2067906856537 }, { "epoch": 64, "train_loss": 6.822744883117676, "train_acc": 0.00848, "test_loss": 4.60517158203125, "test_acc": 0.01, "lyapunov": 2.613635628424642, "grad_norm": 0.1329153891377645, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 167.26912307739258 }, { "epoch": 65, "train_loss": 6.8317010522460935, "train_acc": 0.00862, "test_loss": 4.605171473693848, "test_acc": 0.01, "lyapunov": 2.6185932665529763, "grad_norm": 0.13671337080211707, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006039558454088793, "time_sec": 167.09261989593506 }, { "epoch": 66, "train_loss": 6.812226905822754, "train_acc": 0.0088, "test_loss": 4.605171728515625, "test_acc": 0.01, "lyapunov": 2.610206864374068, "grad_norm": 0.12722937279819782, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 167.21893763542175 }, { "epoch": 67, "train_loss": 6.808111183776855, "train_acc": 0.0093, "test_loss": 4.6051715423583985, "test_acc": 0.01, "lyapunov": 2.6089447556859087, "grad_norm": 0.15865472726238314, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 167.29591965675354 }, { "epoch": 68, "train_loss": 6.83726111694336, "train_acc": 0.00862, "test_loss": 4.605171617126465, "test_acc": 0.01, "lyapunov": 2.6234818724415185, "grad_norm": 0.21106961802984933, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005730415142812054, "time_sec": 167.22871494293213 }, { "epoch": 69, "train_loss": 6.833951936035156, "train_acc": 0.00874, "test_loss": 4.605171533203125, "test_acc": 0.01, "lyapunov": 2.6221561791646817, "grad_norm": 0.23690960823937743, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 167.11618614196777 }, { "epoch": 70, "train_loss": 6.80746663269043, "train_acc": 0.00868, "test_loss": 4.6051711715698245, "test_acc": 0.01, "lyapunov": 2.608615706948673, "grad_norm": 0.19368668238286113, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005522642316338265, "time_sec": 167.25853991508484 }, { "epoch": 71, "train_loss": 6.840300604553223, "train_acc": 0.00892, "test_loss": 4.605171086120605, "test_acc": 0.01, "lyapunov": 2.6233106214372093, "grad_norm": 0.21230815886405713, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005418389216661573, "time_sec": 167.2756736278534 }, { "epoch": 72, "train_loss": 6.826620941162109, "train_acc": 0.00886, "test_loss": 4.605171425628662, "test_acc": 0.01, "lyapunov": 2.617017206328604, "grad_norm": 0.16852859644395693, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646563, "time_sec": 167.11485767364502 }, { "epoch": 73, "train_loss": 6.81151391418457, "train_acc": 0.0083, "test_loss": 4.605171309661865, "test_acc": 0.01, "lyapunov": 2.6109183840739454, "grad_norm": 0.15884163876986282, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005209378268645994, "time_sec": 167.23269772529602 }, { "epoch": 74, "train_loss": 6.803579806518555, "train_acc": 0.00836, "test_loss": 4.605171119689941, "test_acc": 0.01, "lyapunov": 2.606299752774446, "grad_norm": 0.12416094470418608, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005104712099416781, "time_sec": 167.30208802223206 }, { "epoch": 75, "train_loss": 6.85053612701416, "train_acc": 0.00864, "test_loss": 4.605171006774903, "test_acc": 0.01, "lyapunov": 2.6286537153336704, "grad_norm": 0.19093915741238635, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 167.27450942993164 }, { "epoch": 76, "train_loss": 6.801593222961426, "train_acc": 0.00904, "test_loss": 4.605170780181885, "test_acc": 0.01, "lyapunov": 2.6054461362111905, "grad_norm": 0.12884562844199357, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 167.09656834602356 }, { "epoch": 77, "train_loss": 6.796963772583008, "train_acc": 0.00794, "test_loss": 4.605171012878418, "test_acc": 0.01, "lyapunov": 2.6028354930145965, "grad_norm": 0.09104303565016296, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004790621731353997, "time_sec": 167.33878350257874 }, { "epoch": 78, "train_loss": 6.7984873474121095, "train_acc": 0.00882, "test_loss": 4.605170700073242, "test_acc": 0.01, "lyapunov": 2.603611297314734, "grad_norm": 0.10157683305126329, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 167.25584626197815 }, { "epoch": 79, "train_loss": 6.820661872863769, "train_acc": 0.00986, "test_loss": 4.605170817565918, "test_acc": 0.01, "lyapunov": 2.612017824826643, "grad_norm": 0.14611535298895395, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 167.1672751903534 }, { "epoch": 80, "train_loss": 6.806377208557129, "train_acc": 0.00852, "test_loss": 4.605170895385742, "test_acc": 0.01, "lyapunov": 2.607236401809146, "grad_norm": 0.10585908127422697, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 167.1809687614441 }, { "epoch": 81, "train_loss": 6.808554836425781, "train_acc": 0.00942, "test_loss": 4.605170629882813, "test_acc": 0.01, "lyapunov": 2.6088667123214058, "grad_norm": 0.14379651420159803, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 167.25520253181458 }, { "epoch": 82, "train_loss": 6.8339071276855465, "train_acc": 0.00906, "test_loss": 4.605170634460449, "test_acc": 0.01, "lyapunov": 2.620855552766024, "grad_norm": 0.23055639987610052, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004269584857187939, "time_sec": 167.52204132080078 }, { "epoch": 83, "train_loss": 6.828104596252442, "train_acc": 0.0093, "test_loss": 4.605170736694336, "test_acc": 0.01, "lyapunov": 2.6192942519322076, "grad_norm": 0.19017261102902538, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004166156266419484, "time_sec": 167.1194040775299 }, { "epoch": 84, "train_loss": 6.808681617126465, "train_acc": 0.0084, "test_loss": 4.6051709182739256, "test_acc": 0.01, "lyapunov": 2.609468307641461, "grad_norm": 0.15622504553249358, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 167.19974207878113 }, { "epoch": 85, "train_loss": 6.818397989654541, "train_acc": 0.00824, "test_loss": 4.605170721435547, "test_acc": 0.01, "lyapunov": 2.6138416312234787, "grad_norm": 0.14833733270771185, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003960441545911199, "time_sec": 167.2553927898407 }, { "epoch": 86, "train_loss": 6.799676761169434, "train_acc": 0.00838, "test_loss": 4.60517102508545, "test_acc": 0.01, "lyapunov": 2.604430999292437, "grad_norm": 0.11142070053574807, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 167.18824887275696 }, { "epoch": 87, "train_loss": 6.818209040527344, "train_acc": 0.00854, "test_loss": 4.605170503997803, "test_acc": 0.01, "lyapunov": 2.6141847765354242, "grad_norm": 0.14462203411441973, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 167.1196677684784 }, { "epoch": 88, "train_loss": 6.874744393615723, "train_acc": 0.00888, "test_loss": 4.605170900726319, "test_acc": 0.01, "lyapunov": 2.6346183640267844, "grad_norm": 0.20078574833508478, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 167.2573266029358 }, { "epoch": 89, "train_loss": 6.803292810211182, "train_acc": 0.00886, "test_loss": 4.60517081451416, "test_acc": 0.01, "lyapunov": 2.606465803082947, "grad_norm": 0.12244758192489462, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 167.22969937324524 }, { "epoch": 90, "train_loss": 6.842185859069824, "train_acc": 0.00942, "test_loss": 4.605170654296875, "test_acc": 0.01, "lyapunov": 2.622050429853942, "grad_norm": 0.1882414210254429, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 167.11765575408936 }, { "epoch": 91, "train_loss": 6.836290773010254, "train_acc": 0.00882, "test_loss": 4.605170703125, "test_acc": 0.01, "lyapunov": 2.619682075422438, "grad_norm": 0.19767006125117328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 167.22952795028687 }, { "epoch": 92, "train_loss": 6.791880859985351, "train_acc": 0.00842, "test_loss": 4.605170771789551, "test_acc": 0.01, "lyapunov": 2.5996962294859043, "grad_norm": 0.08760976620030388, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 167.26651191711426 }, { "epoch": 93, "train_loss": 6.80370014678955, "train_acc": 0.00806, "test_loss": 4.605170739746094, "test_acc": 0.01, "lyapunov": 2.606304941884697, "grad_norm": 0.13940577534302254, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 167.17852663993835 }, { "epoch": 94, "train_loss": 6.83537752532959, "train_acc": 0.00846, "test_loss": 4.605170500183106, "test_acc": 0.01, "lyapunov": 2.623438694288054, "grad_norm": 0.26310451945532815, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 167.17071175575256 }, { "epoch": 95, "train_loss": 6.799238587646484, "train_acc": 0.00926, "test_loss": 4.6051702911376955, "test_acc": 0.01, "lyapunov": 2.60419953631623, "grad_norm": 0.10657735488339905, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 167.223788022995 }, { "epoch": 96, "train_loss": 6.804974398498535, "train_acc": 0.00916, "test_loss": 4.605170680236816, "test_acc": 0.01, "lyapunov": 2.60721908383967, "grad_norm": 0.17693273008046123, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 167.2773995399475 }, { "epoch": 97, "train_loss": 6.8050346893310545, "train_acc": 0.0086, "test_loss": 4.605170379638672, "test_acc": 0.01, "lyapunov": 2.607598216332438, "grad_norm": 0.1351166427526852, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 167.0982165336609 }, { "epoch": 98, "train_loss": 6.814014775848388, "train_acc": 0.00896, "test_loss": 4.605170265960694, "test_acc": 0.01, "lyapunov": 2.611722286399978, "grad_norm": 0.16300027920865434, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 167.213885307312 }, { "epoch": 99, "train_loss": 6.810039446411133, "train_acc": 0.00874, "test_loss": 4.605170517730713, "test_acc": 0.01, "lyapunov": 2.609659137018501, "grad_norm": 0.13742401941675986, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 167.23094940185547 }, { "epoch": 100, "train_loss": 6.818154907836914, "train_acc": 0.00906, "test_loss": 4.6051704177856445, "test_acc": 0.01, "lyapunov": 2.613592106363048, "grad_norm": 0.13552057031594136, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 167.14863324165344 }, { "epoch": 101, "train_loss": 6.820175225524903, "train_acc": 0.00914, "test_loss": 4.605170472717285, "test_acc": 0.01, "lyapunov": 2.615781251731736, "grad_norm": 0.1825661927434339, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 167.13485431671143 }, { "epoch": 102, "train_loss": 6.843083056182861, "train_acc": 0.00814, "test_loss": 4.605170304107666, "test_acc": 0.01, "lyapunov": 2.6266718941271456, "grad_norm": 0.28170773297668966, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 167.3005588054657 }, { "epoch": 103, "train_loss": 6.81555390625, "train_acc": 0.0089, "test_loss": 4.605170388793946, "test_acc": 0.01, "lyapunov": 2.6132783401957558, "grad_norm": 0.20579070177059625, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 167.31917262077332 }, { "epoch": 104, "train_loss": 6.797420726623535, "train_acc": 0.00826, "test_loss": 4.60517056274414, "test_acc": 0.01, "lyapunov": 2.6031100310937827, "grad_norm": 0.09877603372479003, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 167.13279914855957 }, { "epoch": 105, "train_loss": 6.825426294555664, "train_acc": 0.00898, "test_loss": 4.605170573425293, "test_acc": 0.01, "lyapunov": 2.6164557750877515, "grad_norm": 0.23298022186302586, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 167.27876543998718 }, { "epoch": 106, "train_loss": 6.81034471786499, "train_acc": 0.00862, "test_loss": 4.605170178222656, "test_acc": 0.01, "lyapunov": 2.6101580525908017, "grad_norm": 0.11576839370764984, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 167.24659395217896 }, { "epoch": 107, "train_loss": 6.8369368406677244, "train_acc": 0.00846, "test_loss": 4.605170590209961, "test_acc": 0.01, "lyapunov": 2.62125125931352, "grad_norm": 0.1931519664931494, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 167.2057774066925 }, { "epoch": 108, "train_loss": 6.812288922576904, "train_acc": 0.0088, "test_loss": 4.605170223999023, "test_acc": 0.01, "lyapunov": 2.6103451739796593, "grad_norm": 0.13299121884159582, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 167.10559225082397 }, { "epoch": 109, "train_loss": 6.797308649902344, "train_acc": 0.00842, "test_loss": 4.605170259094239, "test_acc": 0.01, "lyapunov": 2.6030520350122086, "grad_norm": 0.09292253205333328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 167.28680682182312 }, { "epoch": 110, "train_loss": 6.802461311950683, "train_acc": 0.00886, "test_loss": 4.605170384979248, "test_acc": 0.01, "lyapunov": 2.605947788414138, "grad_norm": 0.09044100601755074, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 167.254047870636 }, { "epoch": 111, "train_loss": 6.800218295593262, "train_acc": 0.00898, "test_loss": 4.605170218658447, "test_acc": 0.01, "lyapunov": 2.6047815380193997, "grad_norm": 0.09096765167841042, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 167.18093347549438 }, { "epoch": 112, "train_loss": 6.80289358581543, "train_acc": 0.00846, "test_loss": 4.605170321655273, "test_acc": 0.01, "lyapunov": 2.606188810085092, "grad_norm": 0.11124745619391717, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 167.17500185966492 }, { "epoch": 113, "train_loss": 6.80328687286377, "train_acc": 0.0083, "test_loss": 4.605170209503174, "test_acc": 0.01, "lyapunov": 2.606580800717444, "grad_norm": 0.1173945856600355, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 167.2652928829193 }, { "epoch": 114, "train_loss": 6.833984843902588, "train_acc": 0.00896, "test_loss": 4.605170062255859, "test_acc": 0.01, "lyapunov": 2.6208856666789337, "grad_norm": 0.20744787133639947, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 167.21882677078247 }, { "epoch": 115, "train_loss": 6.822520295410156, "train_acc": 0.00838, "test_loss": 4.605170328521728, "test_acc": 0.01, "lyapunov": 2.615956858295919, "grad_norm": 0.14399695964710044, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 167.09929537773132 }, { "epoch": 116, "train_loss": 6.799036735839843, "train_acc": 0.00894, "test_loss": 4.605170152282715, "test_acc": 0.01, "lyapunov": 2.603793166787423, "grad_norm": 0.10032145854595359, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 167.25386571884155 }, { "epoch": 117, "train_loss": 6.800587829284668, "train_acc": 0.00834, "test_loss": 4.605170477294922, "test_acc": 0.01, "lyapunov": 2.604958756805381, "grad_norm": 0.11401729218950767, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 167.27676010131836 }, { "epoch": 118, "train_loss": 6.800997655029297, "train_acc": 0.0088, "test_loss": 4.605170313262939, "test_acc": 0.01, "lyapunov": 2.6053062838971464, "grad_norm": 0.10865983471852475, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 167.16999578475952 }, { "epoch": 119, "train_loss": 6.800622797088623, "train_acc": 0.0082, "test_loss": 4.605170126342774, "test_acc": 0.01, "lyapunov": 2.604655019462566, "grad_norm": 0.12369520749734833, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 167.13503623008728 }, { "epoch": 120, "train_loss": 6.795711727905274, "train_acc": 0.00866, "test_loss": 4.60517028503418, "test_acc": 0.01, "lyapunov": 2.602085701949761, "grad_norm": 0.08734190443194187, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 167.28283619880676 }, { "epoch": 121, "train_loss": 6.796959948425293, "train_acc": 0.0093, "test_loss": 4.605170495605469, "test_acc": 0.01, "lyapunov": 2.6028400558949736, "grad_norm": 0.08752194617001091, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 167.22894525527954 }, { "epoch": 122, "train_loss": 6.80965912033081, "train_acc": 0.00928, "test_loss": 4.605170267486573, "test_acc": 0.01, "lyapunov": 2.6096866935720224, "grad_norm": 0.11691201011842964, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 167.16074228286743 }, { "epoch": 123, "train_loss": 6.817136254882812, "train_acc": 0.00856, "test_loss": 4.605170227050781, "test_acc": 0.01, "lyapunov": 2.6124652438151563, "grad_norm": 0.1550769682935547, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 167.20862245559692 }, { "epoch": 124, "train_loss": 6.797611290588379, "train_acc": 0.0096, "test_loss": 4.605170072174072, "test_acc": 0.01, "lyapunov": 2.603274511864118, "grad_norm": 0.10698377372823001, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 167.24812293052673 }, { "epoch": 125, "train_loss": 6.811994839477539, "train_acc": 0.00868, "test_loss": 4.605170003509522, "test_acc": 0.01, "lyapunov": 2.6103333463449307, "grad_norm": 0.14234235939730758, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 167.15956830978394 }, { "epoch": 126, "train_loss": 6.799865046234131, "train_acc": 0.00862, "test_loss": 4.605170318603515, "test_acc": 0.01, "lyapunov": 2.604667879431449, "grad_norm": 0.09265194462378636, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 167.1222221851349 }, { "epoch": 127, "train_loss": 6.804667163391113, "train_acc": 0.00886, "test_loss": 4.605170178985595, "test_acc": 0.01, "lyapunov": 2.60723816342366, "grad_norm": 0.09360794490801955, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 167.1491777896881 }, { "epoch": 128, "train_loss": 6.803801723480225, "train_acc": 0.0089, "test_loss": 4.605170277404786, "test_acc": 0.01, "lyapunov": 2.606579548867462, "grad_norm": 0.10479682515434138, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 167.26385951042175 }, { "epoch": 129, "train_loss": 6.7995252819824215, "train_acc": 0.0085, "test_loss": 4.605170484924316, "test_acc": 0.01, "lyapunov": 2.604231426478042, "grad_norm": 0.08941205723411079, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 167.30450534820557 }, { "epoch": 130, "train_loss": 6.821313883209228, "train_acc": 0.00852, "test_loss": 4.605170134735108, "test_acc": 0.01, "lyapunov": 2.615080727335742, "grad_norm": 0.1662641683208483, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 167.14770483970642 }, { "epoch": 131, "train_loss": 6.795292775421142, "train_acc": 0.00846, "test_loss": 4.605170323944092, "test_acc": 0.01, "lyapunov": 2.601862790944326, "grad_norm": 0.11411966381332427, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 167.2135558128357 }, { "epoch": 132, "train_loss": 6.796047713775635, "train_acc": 0.00904, "test_loss": 4.6051700454711915, "test_acc": 0.01, "lyapunov": 2.602336645736109, "grad_norm": 0.08834944397480328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 167.23654413223267 }, { "epoch": 133, "train_loss": 6.799664002380371, "train_acc": 0.00904, "test_loss": 4.605170405578614, "test_acc": 0.01, "lyapunov": 2.6045111707409325, "grad_norm": 0.08768823633488758, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 167.25386261940002 }, { "epoch": 134, "train_loss": 6.799534449920654, "train_acc": 0.00966, "test_loss": 4.605170095825195, "test_acc": 0.01, "lyapunov": 2.604433027374775, "grad_norm": 0.08880059006188033, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 167.089768409729 }, { "epoch": 135, "train_loss": 6.816852741394043, "train_acc": 0.00922, "test_loss": 4.6051704139709475, "test_acc": 0.01, "lyapunov": 2.6120451417420525, "grad_norm": 0.1344230192150204, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 167.21077299118042 }, { "epoch": 136, "train_loss": 6.79835750869751, "train_acc": 0.01, "test_loss": 4.60517020111084, "test_acc": 0.01, "lyapunov": 2.6037550874988136, "grad_norm": 0.09237399837874004, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 167.25671005249023 }, { "epoch": 137, "train_loss": 6.799135870971679, "train_acc": 0.00948, "test_loss": 4.605170085144043, "test_acc": 0.01, "lyapunov": 2.6042151554771094, "grad_norm": 0.08937220866741212, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 167.19218349456787 }, { "epoch": 138, "train_loss": 6.824215604553222, "train_acc": 0.01, "test_loss": 4.605170098876953, "test_acc": 0.01, "lyapunov": 2.616335995666816, "grad_norm": 0.10994228945768546, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 167.09943842887878 }, { "epoch": 139, "train_loss": 6.802577704467773, "train_acc": 0.01, "test_loss": 4.605170218658447, "test_acc": 0.01, "lyapunov": 2.6062524855289313, "grad_norm": 0.09042623460420336, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 167.20513486862183 }, { "epoch": 140, "train_loss": 6.7961073709106445, "train_acc": 0.01, "test_loss": 4.605170453643799, "test_acc": 0.01, "lyapunov": 2.602320309490194, "grad_norm": 0.08815797205742677, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 167.25681805610657 }, { "epoch": 141, "train_loss": 6.797138239898682, "train_acc": 0.01, "test_loss": 4.605170432281494, "test_acc": 0.01, "lyapunov": 2.6029675891027426, "grad_norm": 0.0879981627311107, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 167.06548428535461 }, { "epoch": 142, "train_loss": 6.801417353363037, "train_acc": 0.01, "test_loss": 4.605170329284668, "test_acc": 0.01, "lyapunov": 2.605164134593876, "grad_norm": 0.08843743115572271, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 167.19282054901123 }, { "epoch": 143, "train_loss": 6.799633148193359, "train_acc": 0.01, "test_loss": 4.6051702880859375, "test_acc": 0.01, "lyapunov": 2.6045726491972006, "grad_norm": 0.09210601924786092, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 167.22217631340027 }, { "epoch": 144, "train_loss": 6.799774599914551, "train_acc": 0.01, "test_loss": 4.605170209503174, "test_acc": 0.01, "lyapunov": 2.6046122669258995, "grad_norm": 0.08889860655727871, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 167.18017983436584 }, { "epoch": 145, "train_loss": 6.7985524331665035, "train_acc": 0.01, "test_loss": 4.6051704223632814, "test_acc": 0.01, "lyapunov": 2.6038548361005076, "grad_norm": 0.08800873662125164, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 167.10364723205566 }, { "epoch": 146, "train_loss": 6.797061258239746, "train_acc": 0.01, "test_loss": 4.605170094299316, "test_acc": 0.01, "lyapunov": 2.6029466247314685, "grad_norm": 0.08767630908448117, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 167.13109254837036 }, { "epoch": 147, "train_loss": 6.7999437774658205, "train_acc": 0.01, "test_loss": 4.605170198059082, "test_acc": 0.01, "lyapunov": 2.6046864193723636, "grad_norm": 0.08792294865681417, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 167.20970582962036 }, { "epoch": 148, "train_loss": 6.798582576293946, "train_acc": 0.01, "test_loss": 4.605170455932617, "test_acc": 0.01, "lyapunov": 2.6038761730389215, "grad_norm": 0.09215822971292409, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 167.12604355812073 }, { "epoch": 149, "train_loss": 6.796307967529297, "train_acc": 0.01, "test_loss": 4.605170027923584, "test_acc": 0.01, "lyapunov": 2.6024758651128512, "grad_norm": 0.08782242943220565, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 167.15288949012756 }, { "epoch": 150, "train_loss": 6.797921124420166, "train_acc": 0.01, "test_loss": 4.6051702972412105, "test_acc": 0.01, "lyapunov": 2.6034922130272515, "grad_norm": 0.08768432297346943, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 167.14476084709167 } ], "20": [ { "epoch": 1, "train_loss": 15.093960892944336, "train_acc": 0.01476, "test_loss": 4.694812010192871, "test_acc": 0.0101, "lyapunov": 5.28920032362194, "grad_norm": 5.920792423737725, "grad_max_sv": 4.9676717877388, "grad_min_sv": 8.119859199878787e-08, "grad_condition": 1111289730.0106924, "lr": 0.0009998903417374227, "time_sec": 210.120050907135 }, { "epoch": 2, "train_loss": 9.793692145080566, "train_acc": 0.01708, "test_loss": 4.630818698120117, "test_acc": 0.0101, "lyapunov": 3.9491244813670283, "grad_norm": 4.179099264712139, "grad_max_sv": 3.6389390349388124, "grad_min_sv": 4.435643456510846e-08, "grad_condition": 1465465238.7805393, "lr": 0.0009995614150494292, "time_sec": 210.1432433128357 }, { "epoch": 3, "train_loss": 9.864517554931641, "train_acc": 0.01526, "test_loss": 4.635793448638916, "test_acc": 0.01, "lyapunov": 4.013264959120689, "grad_norm": 3.461175130912805, "grad_max_sv": 3.00231654047966, "grad_min_sv": 7.094927521799298e-09, "grad_condition": 151743845631.83978, "lr": 0.0009990133642141358, "time_sec": 210.18036890029907 }, { "epoch": 4, "train_loss": 9.012857937622071, "train_acc": 0.01522, "test_loss": 4.623633129882813, "test_acc": 0.01, "lyapunov": 3.700052426599176, "grad_norm": 2.6286152850939577, "grad_max_sv": 2.296706238389015, "grad_min_sv": 3.159897203264806e-11, "grad_condition": 343973728227.78937, "lr": 0.0009982464296247522, "time_sec": 210.1404571533203 }, { "epoch": 5, "train_loss": 8.190340083312988, "train_acc": 0.0141, "test_loss": 4.620581848144531, "test_acc": 0.01, "lyapunov": 3.3428353769395054, "grad_norm": 1.8058911521537262, "grad_max_sv": 1.3938701748847961, "grad_min_sv": 9.547992879409192e-12, "grad_condition": 323805955248.2424, "lr": 0.0009972609476841367, "time_sec": 210.12661004066467 }, { "epoch": 6, "train_loss": 7.759998917236328, "train_acc": 0.01288, "test_loss": 4.617343115997315, "test_acc": 0.01, "lyapunov": 3.1374943689312165, "grad_norm": 1.7534337420481565, "grad_max_sv": 0.9646675065159919, "grad_min_sv": 2.9231036572180592e-12, "grad_condition": 375265614590.23444, "lr": 0.000996057350657239, "time_sec": 210.0431251525879 }, { "epoch": 7, "train_loss": 7.5100171649169924, "train_acc": 0.01298, "test_loss": 4.613992894744873, "test_acc": 0.01, "lyapunov": 3.009886204434173, "grad_norm": 1.2599904723678697, "grad_max_sv": 0.683513353765011, "grad_min_sv": 2.034050211148161e-12, "grad_condition": 321368791479.6951, "lr": 0.000994636166481494, "time_sec": 210.03102850914001 }, { "epoch": 8, "train_loss": 7.526667755889893, "train_acc": 0.0137, "test_loss": 4.6132587142944335, "test_acc": 0.01, "lyapunov": 3.020487799973744, "grad_norm": 1.4149077024298684, "grad_max_sv": 0.43169260323047637, "grad_min_sv": 1.314155534129329e-12, "grad_condition": 228604061031.44318, "lr": 0.0009929980185352525, "time_sec": 210.09079957008362 }, { "epoch": 9, "train_loss": 7.424001091003418, "train_acc": 0.0139, "test_loss": 4.612518185424805, "test_acc": 0.01, "lyapunov": 2.9646140498578397, "grad_norm": 1.4854391503992914, "grad_max_sv": 0.39994182234216435, "grad_min_sv": 7.056669271977351e-13, "grad_condition": 272585344238.14337, "lr": 0.0009911436253643444, "time_sec": 210.04538559913635 }, { "epoch": 10, "train_loss": 7.422507609710693, "train_acc": 0.01292, "test_loss": 4.612365335083008, "test_acc": 0.01, "lyapunov": 2.9684851279344096, "grad_norm": 1.4578891690299673, "grad_max_sv": 0.3333915390074253, "grad_min_sv": 5.315411665648874e-13, "grad_condition": 252944829203.9721, "lr": 0.0009890738003669028, "time_sec": 210.01400017738342 }, { "epoch": 11, "train_loss": 7.279168519592285, "train_acc": 0.01416, "test_loss": 4.605921854400635, "test_acc": 0.01, "lyapunov": 2.8905254178644753, "grad_norm": 1.1550117670507138, "grad_max_sv": 0.26091913171112535, "grad_min_sv": 1.5622282665285416e-13, "grad_condition": 237845802721.57803, "lr": 0.00098678945143658, "time_sec": 210.0479826927185 }, { "epoch": 12, "train_loss": 7.238350921325684, "train_acc": 0.01288, "test_loss": 4.6059690254211425, "test_acc": 0.01, "lyapunov": 2.870093943212953, "grad_norm": 1.2092537765879001, "grad_max_sv": 0.2273966234177351, "grad_min_sv": 2.126834221214877e-15, "grad_condition": 226904883800.9376, "lr": 0.0009842915805643154, "time_sec": 210.02421975135803 }, { "epoch": 13, "train_loss": 7.237049304504395, "train_acc": 0.0122, "test_loss": 4.606073367309571, "test_acc": 0.01, "lyapunov": 2.8677229795919357, "grad_norm": 1.945360181719986, "grad_max_sv": 0.19105065988258402, "grad_min_sv": 7.58301405160596e-16, "grad_condition": 190882486106.46655, "lr": 0.000981581283398829, "time_sec": 209.9947109222412 }, { "epoch": 14, "train_loss": 7.725393817138672, "train_acc": 0.01264, "test_loss": 5.5369372573852536, "test_acc": 0.0157, "lyapunov": 3.1145479276661985, "grad_norm": 3.5850673850910875, "grad_max_sv": 0.13178386465706673, "grad_min_sv": 1.7957017814409413e-15, "grad_condition": 131460341909.11662, "lr": 0.0009786597487660333, "time_sec": 210.06614232063293 }, { "epoch": 15, "train_loss": 7.938173998718262, "train_acc": 0.0112, "test_loss": 4.605860107421875, "test_acc": 0.01, "lyapunov": 3.22320399442902, "grad_norm": 1.470918431013692, "grad_max_sv": 0.13412793046313495, "grad_min_sv": 1.3123556012424532e-27, "grad_condition": 134127930463.13481, "lr": 0.0009755282581475766, "time_sec": 210.01092720031738 }, { "epoch": 16, "train_loss": 7.877476094970703, "train_acc": 0.01078, "test_loss": 4.605639274597168, "test_acc": 0.01, "lyapunov": 3.1950507353028983, "grad_norm": 1.136967603821004, "grad_max_sv": 0.11695587523281574, "grad_min_sv": 5.493959932514282e-37, "grad_condition": 116955875232.81572, "lr": 0.0009721881851187403, "time_sec": 210.03272008895874 }, { "epoch": 17, "train_loss": 7.939653808288575, "train_acc": 0.01054, "test_loss": 4.60557441482544, "test_acc": 0.01, "lyapunov": 3.220062300982073, "grad_norm": 1.7456145739471243, "grad_max_sv": 0.09164720228873194, "grad_min_sv": 2.1019476964872255e-46, "grad_condition": 91647202288.73193, "lr": 0.0009686409947459456, "time_sec": 210.02848625183105 }, { "epoch": 18, "train_loss": 7.52693728515625, "train_acc": 0.0113, "test_loss": 4.605569499206543, "test_acc": 0.01, "lyapunov": 3.0156563999097976, "grad_norm": 2.4071740405774276, "grad_max_sv": 0.08130668587982655, "grad_min_sv": 4.554220009055656e-46, "grad_condition": 81306685879.82654, "lr": 0.0009648882429441254, "time_sec": 210.00972390174866 }, { "epoch": 19, "train_loss": 7.715430914611816, "train_acc": 0.0111, "test_loss": 4.605534184265137, "test_acc": 0.01, "lyapunov": 3.1088165675892547, "grad_norm": 2.6762849936508677, "grad_max_sv": 0.042965149600058795, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 42965149600.05879, "lr": 0.00096093157579425, "time_sec": 209.9727280139923 }, { "epoch": 20, "train_loss": 7.460425003356933, "train_acc": 0.0111, "test_loss": 7.111512740325928, "test_acc": 0.01, "lyapunov": 2.9692358793809897, "grad_norm": 2.853254134437055, "grad_max_sv": 0.050038989260792734, "grad_min_sv": 2.5374011942761624e-43, "grad_condition": 50038989260.792725, "lr": 0.0009567727288213001, "time_sec": 210.01186299324036 }, { "epoch": 21, "train_loss": 7.205679086456299, "train_acc": 0.0091, "test_loss": 7.044362417602539, "test_acc": 0.01, "lyapunov": 2.8364865828658004, "grad_norm": 3.3061229521295945, "grad_max_sv": 0.02213773485273123, "grad_min_sv": 0.0, "grad_condition": 22137734852.731228, "lr": 0.0009524135262330095, "time_sec": 209.98502397537231 }, { "epoch": 22, "train_loss": 7.1949261268615725, "train_acc": 0.0098, "test_loss": 4.605458296203613, "test_acc": 0.01, "lyapunov": 2.8206752724659716, "grad_norm": 6.972340571186882, "grad_max_sv": 0.02202093116939068, "grad_min_sv": 0.0, "grad_condition": 22020931169.39068, "lr": 0.0009478558801197061, "time_sec": 209.94458675384521 }, { "epoch": 23, "train_loss": 7.115987669677734, "train_acc": 0.00996, "test_loss": 6.645735456848144, "test_acc": 0.01, "lyapunov": 2.7744642029637876, "grad_norm": 7.989108672811228, "grad_max_sv": 0.011007561534643173, "grad_min_sv": 0.0, "grad_condition": 11007561534.643173, "lr": 0.000943101789615607, "time_sec": 209.97865319252014 }, { "epoch": 24, "train_loss": 7.058884606628418, "train_acc": 0.00872, "test_loss": 6.569473106384278, "test_acc": 0.01, "lyapunov": 2.745215448881964, "grad_norm": 5.5094378668531405, "grad_max_sv": 0.01464888285845518, "grad_min_sv": 0.0, "grad_condition": 14648882858.455181, "lr": 0.0009381533400219313, "time_sec": 210.0189917087555 }, { "epoch": 25, "train_loss": 7.515213393859863, "train_acc": 0.01036, "test_loss": 4.605401533508301, "test_acc": 0.01, "lyapunov": 3.0008729113947097, "grad_norm": 2.870644125398128, "grad_max_sv": 0.07644851161090856, "grad_min_sv": 3.1529215447308385e-46, "grad_condition": 76448511610.90854, "lr": 0.0009330127018922189, "time_sec": 210.00069952011108 }, { "epoch": 26, "train_loss": 7.552015746002197, "train_acc": 0.01018, "test_loss": 4.605392645263672, "test_acc": 0.01, "lyapunov": 3.0268727373284148, "grad_norm": 1.9702867287865506, "grad_max_sv": 0.07252425029873848, "grad_min_sv": 1.0509738482436128e-46, "grad_condition": 72524250298.73848, "lr": 0.000927682130080253, "time_sec": 210.00505328178406 }, { "epoch": 27, "train_loss": 7.204120320739746, "train_acc": 0.00916, "test_loss": 4.605300965118408, "test_acc": 0.01, "lyapunov": 2.8272059610127793, "grad_norm": 2.304850056236489, "grad_max_sv": 0.002205173298716545, "grad_min_sv": 0.0, "grad_condition": 2205173298.716545, "lr": 0.0009221639627510072, "time_sec": 210.04179668426514 }, { "epoch": 28, "train_loss": 7.194927945556641, "train_acc": 0.00832, "test_loss": 5.018761894989014, "test_acc": 0.01, "lyapunov": 2.834069358723243, "grad_norm": 2.6612819081862673, "grad_max_sv": 0.007065491378307342, "grad_min_sv": 0.0, "grad_condition": 7065491378.307343, "lr": 0.0009164606203550494, "time_sec": 209.9864535331726 }, { "epoch": 29, "train_loss": 7.058241820373535, "train_acc": 0.0089, "test_loss": 4.605222779083252, "test_acc": 0.01, "lyapunov": 2.7548481247309224, "grad_norm": 1.6469496155298196, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009105746045668516, "time_sec": 209.949223279953 }, { "epoch": 30, "train_loss": 6.992346358947754, "train_acc": 0.00846, "test_loss": 5.288449756622314, "test_acc": 0.01, "lyapunov": 2.7193446976449485, "grad_norm": 0.12148601528604053, "grad_max_sv": 0.010588385537266732, "grad_min_sv": 0.0, "grad_condition": 10588385537.266731, "lr": 0.0009045084971874733, "time_sec": 209.9674859046936 }, { "epoch": 31, "train_loss": 6.981909171295166, "train_acc": 0.0089, "test_loss": 5.256688010406494, "test_acc": 0.01, "lyapunov": 2.713971863622251, "grad_norm": 0.1172841827453055, "grad_max_sv": 0.004473739862442016, "grad_min_sv": 0.0, "grad_condition": 4473739862.442017, "lr": 0.0008982649590120977, "time_sec": 210.0011682510376 }, { "epoch": 32, "train_loss": 6.981826614379883, "train_acc": 0.00878, "test_loss": 5.260603121185302, "test_acc": 0.01, "lyapunov": 2.714321748679861, "grad_norm": 0.09952710953666385, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008918467286629196, "time_sec": 209.97604823112488 }, { "epoch": 33, "train_loss": 6.99227462890625, "train_acc": 0.00872, "test_loss": 5.264018801879883, "test_acc": 0.01, "lyapunov": 2.7198148792052206, "grad_norm": 0.10982760460792622, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008852566213878943, "time_sec": 209.99684286117554 }, { "epoch": 34, "train_loss": 6.985566412353515, "train_acc": 0.00828, "test_loss": 5.252056950378418, "test_acc": 0.01, "lyapunov": 2.71640632646468, "grad_norm": 0.0980287254251016, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000878497527825878, "time_sec": 209.97523665428162 }, { "epoch": 35, "train_loss": 6.983518271942138, "train_acc": 0.00802, "test_loss": 5.235891506958008, "test_acc": 0.01, "lyapunov": 2.7152942220878113, "grad_norm": 0.098301014644246, "grad_max_sv": 0.010264468565583228, "grad_min_sv": 0.0, "grad_condition": 10264468565.58323, "lr": 0.000871572412738697, "time_sec": 209.92434358596802 }, { "epoch": 36, "train_loss": 7.056292109069824, "train_acc": 0.00856, "test_loss": 5.234983450317383, "test_acc": 0.01, "lyapunov": 2.7453303550515336, "grad_norm": 0.16314843571536908, "grad_max_sv": 0.004481474310159684, "grad_min_sv": 0.0, "grad_condition": 4481474310.159683, "lr": 0.0008644843137107055, "time_sec": 209.98300409317017 }, { "epoch": 37, "train_loss": 7.04465570388794, "train_acc": 0.00922, "test_loss": 4.60517428894043, "test_acc": 0.01, "lyapunov": 2.7430449416265463, "grad_norm": 0.3622526875575334, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008572363398164014, "time_sec": 209.93617868423462 }, { "epoch": 38, "train_loss": 6.99952162109375, "train_acc": 0.00886, "test_loss": 4.605173640441895, "test_acc": 0.01, "lyapunov": 2.7234638078743236, "grad_norm": 0.13703797479309945, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008498316702566826, "time_sec": 209.95248365402222 }, { "epoch": 39, "train_loss": 7.040763073120117, "train_acc": 0.00844, "test_loss": 4.605174145507813, "test_acc": 0.01, "lyapunov": 2.7378825531591233, "grad_norm": 0.1820768645877041, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008422735529643442, "time_sec": 209.9344642162323 }, { "epoch": 40, "train_loss": 7.0346226399230956, "train_acc": 0.0086, "test_loss": 4.6051736892700195, "test_acc": 0.01, "lyapunov": 2.7368516513453724, "grad_norm": 0.16922090716634502, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008345653031794289, "time_sec": 209.97976160049438 }, { "epoch": 41, "train_loss": 7.102251969604493, "train_acc": 0.00846, "test_loss": 4.605173461914062, "test_acc": 0.01, "lyapunov": 2.764533970362085, "grad_norm": 0.2796669100517588, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008267103019950526, "time_sec": 209.97592854499817 }, { "epoch": 42, "train_loss": 6.989806396331787, "train_acc": 0.00866, "test_loss": 4.605173326110839, "test_acc": 0.01, "lyapunov": 2.718248601459786, "grad_norm": 0.11817449733439238, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743447, "time_sec": 209.91329216957092 }, { "epoch": 43, "train_loss": 6.980831128997803, "train_acc": 0.00798, "test_loss": 4.605173022460938, "test_acc": 0.01, "lyapunov": 2.713783808071595, "grad_norm": 0.09538783881391288, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000810573890139155, "time_sec": 209.95550656318665 }, { "epoch": 44, "train_loss": 6.979222456054687, "train_acc": 0.00884, "test_loss": 4.605172604370117, "test_acc": 0.01, "lyapunov": 2.712872148474769, "grad_norm": 0.0919946830154422, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008022995574311873, "time_sec": 209.928706407547 }, { "epoch": 45, "train_loss": 6.981346151428222, "train_acc": 0.00856, "test_loss": 4.605171971130371, "test_acc": 0.01, "lyapunov": 2.7140665036028304, "grad_norm": 0.09306477436154323, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462363, "time_sec": 209.92562985420227 }, { "epoch": 46, "train_loss": 6.981760795288086, "train_acc": 0.0086, "test_loss": 4.605172605133057, "test_acc": 0.01, "lyapunov": 2.714427888850727, "grad_norm": 0.08970786008826526, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007853567838422158, "time_sec": 210.02350616455078 }, { "epoch": 47, "train_loss": 7.014443389587402, "train_acc": 0.0088, "test_loss": 4.605172411346436, "test_acc": 0.01, "lyapunov": 2.728213080969613, "grad_norm": 0.1697709047839743, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007766957746216719, "time_sec": 209.98714351654053 }, { "epoch": 48, "train_loss": 6.98308254486084, "train_acc": 0.0088, "test_loss": 4.605172724151611, "test_acc": 0.01, "lyapunov": 2.7148986033466467, "grad_norm": 0.10089096056823664, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894982, "time_sec": 209.9425868988037 }, { "epoch": 49, "train_loss": 6.981540090026855, "train_acc": 0.00806, "test_loss": 4.610235414886475, "test_acc": 0.01, "lyapunov": 2.714101230396944, "grad_norm": 0.09707765972227518, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000759013504686565, "time_sec": 210.01923370361328 }, { "epoch": 50, "train_loss": 7.012723862762451, "train_acc": 0.0088, "test_loss": 4.6051725616455075, "test_acc": 0.01, "lyapunov": 2.729266738037929, "grad_norm": 0.1358370231708399, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007499999999999998, "time_sec": 209.99068450927734 }, { "epoch": 51, "train_loss": 7.017712171630859, "train_acc": 0.00878, "test_loss": 4.60517274017334, "test_acc": 0.01, "lyapunov": 2.729401938445733, "grad_norm": 0.13779403599934203, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508575, "time_sec": 210.01132082939148 }, { "epoch": 52, "train_loss": 6.98579848815918, "train_acc": 0.00862, "test_loss": 4.605172367095947, "test_acc": 0.01, "lyapunov": 2.7164978974920406, "grad_norm": 0.11440777465495124, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007316480175599307, "time_sec": 209.96309852600098 }, { "epoch": 53, "train_loss": 6.980713491516113, "train_acc": 0.0088, "test_loss": 4.605172201538086, "test_acc": 0.01, "lyapunov": 2.7136193919364753, "grad_norm": 0.0963297125293723, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007223175895924635, "time_sec": 210.0020875930786 }, { "epoch": 54, "train_loss": 6.9838667016601566, "train_acc": 0.00856, "test_loss": 4.605172233581543, "test_acc": 0.01, "lyapunov": 2.715499324871756, "grad_norm": 0.1368676120419564, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825361, "time_sec": 209.94060635566711 }, { "epoch": 55, "train_loss": 6.983624946899414, "train_acc": 0.00906, "test_loss": 4.605171611022949, "test_acc": 0.01, "lyapunov": 2.7151694712431533, "grad_norm": 0.1214142336589057, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007033683215378998, "time_sec": 209.92118954658508 }, { "epoch": 56, "train_loss": 6.996163428649902, "train_acc": 0.00826, "test_loss": 4.60517228012085, "test_acc": 0.01, "lyapunov": 2.721804239560881, "grad_norm": 0.13635707009394835, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006937577932260512, "time_sec": 210.05888557434082 }, { "epoch": 57, "train_loss": 6.9852110571289066, "train_acc": 0.00888, "test_loss": 4.6051725509643555, "test_acc": 0.01, "lyapunov": 2.7162836719961727, "grad_norm": 0.09827989868248155, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423388, "time_sec": 210.03313207626343 }, { "epoch": 58, "train_loss": 6.990598773498535, "train_acc": 0.0087, "test_loss": 4.605171973419189, "test_acc": 0.01, "lyapunov": 2.718923308355424, "grad_norm": 0.11245505032562926, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006742860236609073, "time_sec": 210.20554780960083 }, { "epoch": 59, "train_loss": 6.990819956512452, "train_acc": 0.00914, "test_loss": 4.605172409057618, "test_acc": 0.01, "lyapunov": 2.719175950950369, "grad_norm": 0.11267799994144367, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006644333233692913, "time_sec": 210.00883507728577 }, { "epoch": 60, "train_loss": 7.063073814697265, "train_acc": 0.00868, "test_loss": 4.605172189331054, "test_acc": 0.01, "lyapunov": 2.7483064634415806, "grad_norm": 0.18267690644430695, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874734, "time_sec": 210.0396704673767 }, { "epoch": 61, "train_loss": 6.994184250183105, "train_acc": 0.00868, "test_loss": 4.605171653747559, "test_acc": 0.01, "lyapunov": 2.7201892951565325, "grad_norm": 0.1215511744322559, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006445158984722354, "time_sec": 210.01424837112427 }, { "epoch": 62, "train_loss": 7.032484904479981, "train_acc": 0.00918, "test_loss": 4.605172390747071, "test_acc": 0.01, "lyapunov": 2.7373275226339353, "grad_norm": 0.20957283019702622, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006344599103076324, "time_sec": 210.07943868637085 }, { "epoch": 63, "train_loss": 6.997943234863281, "train_acc": 0.00816, "test_loss": 4.6051715438842775, "test_acc": 0.01, "lyapunov": 2.722739946506822, "grad_norm": 0.14325925108066898, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824269, "time_sec": 210.0124545097351 }, { "epoch": 64, "train_loss": 7.036040018615723, "train_acc": 0.00846, "test_loss": 4.6051715461730955, "test_acc": 0.01, "lyapunov": 2.737502407234953, "grad_norm": 0.1852649849094369, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006141754350553275, "time_sec": 210.16446352005005 }, { "epoch": 65, "train_loss": 6.987151607818603, "train_acc": 0.00856, "test_loss": 4.605171313476562, "test_acc": 0.01, "lyapunov": 2.717369063126157, "grad_norm": 0.11469395705842762, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006039558454088793, "time_sec": 210.01318955421448 }, { "epoch": 66, "train_loss": 7.095058049316406, "train_acc": 0.0084, "test_loss": 4.605171440124511, "test_acc": 0.01, "lyapunov": 2.76260655432406, "grad_norm": 0.38302198809757837, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000593690657292862, "time_sec": 209.99922275543213 }, { "epoch": 67, "train_loss": 6.990951052246094, "train_acc": 0.00822, "test_loss": 4.60517152709961, "test_acc": 0.01, "lyapunov": 2.719036699865785, "grad_norm": 0.12621463018935974, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005833843733580507, "time_sec": 210.0219807624817 }, { "epoch": 68, "train_loss": 6.979004976806641, "train_acc": 0.0089, "test_loss": 4.6051711723327635, "test_acc": 0.01, "lyapunov": 2.7127806817174265, "grad_norm": 0.0898257720991778, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005730415142812054, "time_sec": 209.98719429969788 }, { "epoch": 69, "train_loss": 7.030236116638184, "train_acc": 0.0085, "test_loss": 4.605171342468262, "test_acc": 0.01, "lyapunov": 2.7335510912453733, "grad_norm": 0.16033156081316657, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821517, "time_sec": 210.08958458900452 }, { "epoch": 70, "train_loss": 7.039960643615722, "train_acc": 0.00892, "test_loss": 4.6051711669921875, "test_acc": 0.01, "lyapunov": 2.739665296681397, "grad_norm": 0.22271149603025697, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005522642316338265, "time_sec": 210.03332662582397 }, { "epoch": 71, "train_loss": 6.994076708221436, "train_acc": 0.0088, "test_loss": 4.605171272277832, "test_acc": 0.01, "lyapunov": 2.720922397530597, "grad_norm": 0.1379622518868338, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005418389216661573, "time_sec": 210.08726000785828 }, { "epoch": 72, "train_loss": 7.031296715240479, "train_acc": 0.0093, "test_loss": 4.605170808410644, "test_acc": 0.01, "lyapunov": 2.7340313668751044, "grad_norm": 0.15171246429702803, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646563, "time_sec": 209.98722290992737 }, { "epoch": 73, "train_loss": 7.004211445465088, "train_acc": 0.00854, "test_loss": 4.605171342468262, "test_acc": 0.01, "lyapunov": 2.723038975844908, "grad_norm": 0.13946310624469108, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005209378268645994, "time_sec": 210.0228340625763 }, { "epoch": 74, "train_loss": 7.004648984680176, "train_acc": 0.00784, "test_loss": 4.605171240234375, "test_acc": 0.01, "lyapunov": 2.7241133033771954, "grad_norm": 0.14177753146701746, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005104712099416781, "time_sec": 210.09978771209717 }, { "epoch": 75, "train_loss": 7.037411134338379, "train_acc": 0.00828, "test_loss": 4.605171034240723, "test_acc": 0.01, "lyapunov": 2.7407932879065005, "grad_norm": 0.3048803615675911, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004999999999999996, "time_sec": 209.95723867416382 }, { "epoch": 76, "train_loss": 7.073835411071777, "train_acc": 0.00852, "test_loss": 4.605171124267578, "test_acc": 0.01, "lyapunov": 2.7557388784940287, "grad_norm": 0.3366831366752972, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004895287900583212, "time_sec": 210.0526421070099 }, { "epoch": 77, "train_loss": 7.069385101013183, "train_acc": 0.00882, "test_loss": 4.605171006011963, "test_acc": 0.01, "lyapunov": 2.7532967996719244, "grad_norm": 0.3023678187768571, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004790621731353997, "time_sec": 210.00937223434448 }, { "epoch": 78, "train_loss": 7.039409867553711, "train_acc": 0.00918, "test_loss": 4.605171101379394, "test_acc": 0.01, "lyapunov": 2.7399997028243512, "grad_norm": 0.2334340472843992, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000468604740235343, "time_sec": 209.98830223083496 }, { "epoch": 79, "train_loss": 7.060353764648437, "train_acc": 0.0089, "test_loss": 4.605171464538574, "test_acc": 0.01, "lyapunov": 2.7474362892872843, "grad_norm": 0.24607577443282014, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00045816107833384175, "time_sec": 209.9931514263153 }, { "epoch": 80, "train_loss": 6.994573851013183, "train_acc": 0.00838, "test_loss": 4.605170816040039, "test_acc": 0.01, "lyapunov": 2.7213273816706276, "grad_norm": 0.13316471216665574, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004477357683661729, "time_sec": 210.0208034515381 }, { "epoch": 81, "train_loss": 6.987541461791992, "train_acc": 0.00882, "test_loss": 4.605170903778077, "test_acc": 0.01, "lyapunov": 2.7174221109551238, "grad_norm": 0.103648369821384, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784746, "time_sec": 209.98763418197632 }, { "epoch": 82, "train_loss": 7.037619709472656, "train_acc": 0.009, "test_loss": 4.60517109298706, "test_acc": 0.01, "lyapunov": 2.740689567897631, "grad_norm": 0.2931576105004017, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004269584857187939, "time_sec": 209.9937252998352 }, { "epoch": 83, "train_loss": 6.985121826171875, "train_acc": 0.00916, "test_loss": 4.605170684051513, "test_acc": 0.01, "lyapunov": 2.7163276074792417, "grad_norm": 0.1492971550466505, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004166156266419484, "time_sec": 209.95198678970337 }, { "epoch": 84, "train_loss": 7.066727964477539, "train_acc": 0.00896, "test_loss": 4.605170683288574, "test_acc": 0.01, "lyapunov": 2.7504812116208286, "grad_norm": 0.2866450325163035, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 210.01719284057617 }, { "epoch": 85, "train_loss": 6.989573917999268, "train_acc": 0.00868, "test_loss": 4.605171029663086, "test_acc": 0.01, "lyapunov": 2.718881234488524, "grad_norm": 0.17966945444038818, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003960441545911199, "time_sec": 209.97075200080872 }, { "epoch": 86, "train_loss": 7.024203224792481, "train_acc": 0.009, "test_loss": 4.60517100982666, "test_acc": 0.01, "lyapunov": 2.7339598565455288, "grad_norm": 0.22243544874027923, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003858245649446718, "time_sec": 210.22112345695496 }, { "epoch": 87, "train_loss": 6.999354568481445, "train_acc": 0.0089, "test_loss": 4.605170932006836, "test_acc": 0.01, "lyapunov": 2.723075409984345, "grad_norm": 0.18428974005449253, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00037565505641757235, "time_sec": 210.0000035762787 }, { "epoch": 88, "train_loss": 6.986679251861572, "train_acc": 0.0085, "test_loss": 4.605170610046387, "test_acc": 0.01, "lyapunov": 2.7169672826976727, "grad_norm": 0.12620646621233791, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036554008969236695, "time_sec": 209.9843943119049 }, { "epoch": 89, "train_loss": 7.011478589172364, "train_acc": 0.00836, "test_loss": 4.605170822143554, "test_acc": 0.01, "lyapunov": 2.7271931854355365, "grad_norm": 0.15417699872251808, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003554841015277638, "time_sec": 209.97113156318665 }, { "epoch": 90, "train_loss": 7.101416894836426, "train_acc": 0.00908, "test_loss": 4.605170645141602, "test_acc": 0.01, "lyapunov": 2.7632448941545413, "grad_norm": 0.31835714546200394, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000345491502812526, "time_sec": 209.9718475341797 }, { "epoch": 91, "train_loss": 7.0410906286621096, "train_acc": 0.00862, "test_loss": 4.605170471191406, "test_acc": 0.01, "lyapunov": 2.7411284916236274, "grad_norm": 0.3464519876405528, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003355666766307081, "time_sec": 209.98472666740417 }, { "epoch": 92, "train_loss": 7.078473837890625, "train_acc": 0.00868, "test_loss": 4.605170490264893, "test_acc": 0.01, "lyapunov": 2.756490916547263, "grad_norm": 0.3699213952956702, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00032571397633909225, "time_sec": 209.99044036865234 }, { "epoch": 93, "train_loss": 6.9829315435791015, "train_acc": 0.00898, "test_loss": 4.605170346069336, "test_acc": 0.01, "lyapunov": 2.71514059576537, "grad_norm": 0.0883076892297495, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766094, "time_sec": 209.9776222705841 }, { "epoch": 94, "train_loss": 6.9855348080444335, "train_acc": 0.00822, "test_loss": 4.605170868682861, "test_acc": 0.01, "lyapunov": 2.7164944638986417, "grad_norm": 0.1479238762597201, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003062422067739483, "time_sec": 210.00643134117126 }, { "epoch": 95, "train_loss": 6.9874295346069335, "train_acc": 0.00856, "test_loss": 4.605170775604248, "test_acc": 0.01, "lyapunov": 2.7169240917391178, "grad_norm": 0.15626938065528906, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00029663167846209965, "time_sec": 209.99916791915894 }, { "epoch": 96, "train_loss": 6.983181795043945, "train_acc": 0.00818, "test_loss": 4.605170436096191, "test_acc": 0.01, "lyapunov": 2.7151255619800305, "grad_norm": 0.12016550567041384, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00028711035421746345, "time_sec": 210.07179808616638 }, { "epoch": 97, "train_loss": 6.9956132180786135, "train_acc": 0.0088, "test_loss": 4.6051704200744625, "test_acc": 0.01, "lyapunov": 2.7203723811127647, "grad_norm": 0.14197786423069308, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00027768241040753615, "time_sec": 209.9841606616974 }, { "epoch": 98, "train_loss": 6.9846799612426755, "train_acc": 0.00844, "test_loss": 4.605170723724365, "test_acc": 0.01, "lyapunov": 2.715931734465577, "grad_norm": 0.1266081420314572, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00026835198244006903, "time_sec": 209.96538734436035 }, { "epoch": 99, "train_loss": 7.002227352294922, "train_acc": 0.0088, "test_loss": 4.605170701599121, "test_acc": 0.01, "lyapunov": 2.7254832943382166, "grad_norm": 0.30098740432801424, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002591231629491421, "time_sec": 209.96611714363098 }, { "epoch": 100, "train_loss": 7.031358368072509, "train_acc": 0.0084, "test_loss": 4.605170401763916, "test_acc": 0.01, "lyapunov": 2.734792661179057, "grad_norm": 0.22052159160290236, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002499999999999997, "time_sec": 209.99191045761108 }, { "epoch": 101, "train_loss": 7.02535282836914, "train_acc": 0.0089, "test_loss": 4.605170426940918, "test_acc": 0.01, "lyapunov": 2.732613311094396, "grad_norm": 0.1884414449751891, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00024098649531343477, "time_sec": 209.96369862556458 }, { "epoch": 102, "train_loss": 6.979629467163086, "train_acc": 0.00892, "test_loss": 4.605170404052735, "test_acc": 0.01, "lyapunov": 2.713197677031807, "grad_norm": 0.11445011044498424, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002320866025105016, "time_sec": 209.94372940063477 }, { "epoch": 103, "train_loss": 6.992681996459961, "train_acc": 0.00866, "test_loss": 4.605170614624023, "test_acc": 0.01, "lyapunov": 2.7198261897582228, "grad_norm": 0.11698623871801088, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002233042253783278, "time_sec": 209.9833948612213 }, { "epoch": 104, "train_loss": 6.981217978515625, "train_acc": 0.00812, "test_loss": 4.605170754241944, "test_acc": 0.01, "lyapunov": 2.7141413487436825, "grad_norm": 0.08755411353395318, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000214643216157784, "time_sec": 210.01173162460327 }, { "epoch": 105, "train_loss": 6.981228657531738, "train_acc": 0.00804, "test_loss": 4.605170397949219, "test_acc": 0.01, "lyapunov": 2.7141372974571363, "grad_norm": 0.09294871100024936, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376332, "time_sec": 209.94330191612244 }, { "epoch": 106, "train_loss": 7.012609109344482, "train_acc": 0.0086, "test_loss": 4.605170350646973, "test_acc": 0.01, "lyapunov": 2.7288797901719426, "grad_norm": 0.20993573311720926, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019770044256881242, "time_sec": 210.00956416130066 }, { "epoch": 107, "train_loss": 7.00075564453125, "train_acc": 0.00862, "test_loss": 4.60517020111084, "test_acc": 0.01, "lyapunov": 2.7233152907827627, "grad_norm": 0.15372921012205631, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001894261098608447, "time_sec": 210.00604104995728 }, { "epoch": 108, "train_loss": 7.0513025799560545, "train_acc": 0.00884, "test_loss": 4.605170352172852, "test_acc": 0.01, "lyapunov": 2.7449967105065465, "grad_norm": 0.27576954124117053, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000181288005125655, "time_sec": 209.93969535827637 }, { "epoch": 109, "train_loss": 6.980083810424805, "train_acc": 0.00836, "test_loss": 4.605170263671875, "test_acc": 0.01, "lyapunov": 2.713495020366386, "grad_norm": 0.08939231438623309, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001732896980049473, "time_sec": 209.99505877494812 }, { "epoch": 110, "train_loss": 6.984004687805176, "train_acc": 0.00854, "test_loss": 4.60517056350708, "test_acc": 0.01, "lyapunov": 2.715787248538278, "grad_norm": 0.09252734679044972, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016543469682057076, "time_sec": 209.9858946800232 }, { "epoch": 111, "train_loss": 6.983103836517334, "train_acc": 0.00846, "test_loss": 4.6051701759338375, "test_acc": 0.01, "lyapunov": 2.715198960145721, "grad_norm": 0.12412466148890375, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015772644703565552, "time_sec": 209.98376154899597 }, { "epoch": 112, "train_loss": 7.001786309051513, "train_acc": 0.00842, "test_loss": 4.605170098876953, "test_acc": 0.01, "lyapunov": 2.7237192645402213, "grad_norm": 0.2611435951973152, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00015016832974331713, "time_sec": 210.04836750030518 }, { "epoch": 113, "train_loss": 6.985844685974121, "train_acc": 0.0083, "test_loss": 4.605170079040527, "test_acc": 0.01, "lyapunov": 2.716268786993783, "grad_norm": 0.12269496905075315, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014276366018359834, "time_sec": 210.01298427581787 }, { "epoch": 114, "train_loss": 6.982051696472168, "train_acc": 0.0086, "test_loss": 4.605170341491699, "test_acc": 0.01, "lyapunov": 2.7146723093584066, "grad_norm": 0.10102267353118359, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00013551568628929425, "time_sec": 209.98340034484863 }, { "epoch": 115, "train_loss": 6.97831426361084, "train_acc": 0.00934, "test_loss": 4.60517028503418, "test_acc": 0.01, "lyapunov": 2.7124323881495638, "grad_norm": 0.0910994755377039, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012842758726130276, "time_sec": 209.99640536308289 }, { "epoch": 116, "train_loss": 6.9820148625183105, "train_acc": 0.00932, "test_loss": 4.605170400238037, "test_acc": 0.01, "lyapunov": 2.7146591920681926, "grad_norm": 0.10075615501603827, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001215024721741218, "time_sec": 209.9244248867035 }, { "epoch": 117, "train_loss": 6.9843703225708005, "train_acc": 0.00914, "test_loss": 4.605170434570312, "test_acc": 0.01, "lyapunov": 2.715647294393281, "grad_norm": 0.11228216953551147, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210538, "time_sec": 209.9830358028412 }, { "epoch": 118, "train_loss": 7.017746971740722, "train_acc": 0.00848, "test_loss": 4.605170096588135, "test_acc": 0.01, "lyapunov": 2.7295747071580814, "grad_norm": 0.20995938315988794, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010815327133708009, "time_sec": 209.98030400276184 }, { "epoch": 119, "train_loss": 6.992286892089844, "train_acc": 0.00848, "test_loss": 4.605170076751709, "test_acc": 0.01, "lyapunov": 2.7198437071212416, "grad_norm": 0.13966024517159772, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010173504098790182, "time_sec": 209.8962001800537 }, { "epoch": 120, "train_loss": 6.988741851654053, "train_acc": 0.00882, "test_loss": 4.605170139312744, "test_acc": 0.01, "lyapunov": 2.7180907177498272, "grad_norm": 0.16074749971185626, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252629e-05, "time_sec": 210.00037145614624 }, { "epoch": 121, "train_loss": 6.9938799935913085, "train_acc": 0.00866, "test_loss": 4.605170372772217, "test_acc": 0.01, "lyapunov": 2.7198036820687297, "grad_norm": 0.15994838954410112, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.942539543314794e-05, "time_sec": 210.0474226474762 }, { "epoch": 122, "train_loss": 7.0039596870422365, "train_acc": 0.00892, "test_loss": 4.6051700347900395, "test_acc": 0.01, "lyapunov": 2.7259010494212665, "grad_norm": 0.09437754111929303, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.353937964495024e-05, "time_sec": 210.04152083396912 }, { "epoch": 123, "train_loss": 7.009052494049072, "train_acc": 0.00872, "test_loss": 4.605170434570312, "test_acc": 0.01, "lyapunov": 2.72874392755806, "grad_norm": 0.10432489602660702, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.783603724899243e-05, "time_sec": 210.2749161720276 }, { "epoch": 124, "train_loss": 7.074693834838867, "train_acc": 0.0093, "test_loss": 4.605170128631592, "test_acc": 0.01, "lyapunov": 2.758679599103415, "grad_norm": 0.22022455692760384, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.231786991974666e-05, "time_sec": 210.06590056419373 }, { "epoch": 125, "train_loss": 6.982606186523437, "train_acc": 0.00892, "test_loss": 4.605170491027832, "test_acc": 0.01, "lyapunov": 2.7148781255687897, "grad_norm": 0.08823763166065995, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.698729810778072e-05, "time_sec": 210.01559233665466 }, { "epoch": 126, "train_loss": 6.982140954437256, "train_acc": 0.0086, "test_loss": 4.605170350646973, "test_acc": 0.01, "lyapunov": 2.7147414952592777, "grad_norm": 0.10255408158855737, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806817e-05, "time_sec": 210.03672337532043 }, { "epoch": 127, "train_loss": 6.979871159973144, "train_acc": 0.00872, "test_loss": 4.605170230102539, "test_acc": 0.01, "lyapunov": 2.71336467369743, "grad_norm": 0.08818157608440398, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.6898210384392595e-05, "time_sec": 210.00639820098877 }, { "epoch": 128, "train_loss": 6.985049297180176, "train_acc": 0.00864, "test_loss": 4.605170027160645, "test_acc": 0.01, "lyapunov": 2.716455806551687, "grad_norm": 0.08762261938563776, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.214411988029363e-05, "time_sec": 209.97323060035706 }, { "epoch": 129, "train_loss": 6.985287237243653, "train_acc": 0.00956, "test_loss": 4.605170120239258, "test_acc": 0.01, "lyapunov": 2.7165556063737406, "grad_norm": 0.08764461237151443, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.7586473766990294e-05, "time_sec": 210.0408091545105 }, { "epoch": 130, "train_loss": 7.065185516815186, "train_acc": 0.00922, "test_loss": 4.605170118713379, "test_acc": 0.01, "lyapunov": 2.756326196138816, "grad_norm": 0.2237427649903656, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.32272711786996e-05, "time_sec": 210.05785131454468 }, { "epoch": 131, "train_loss": 7.003630043640137, "train_acc": 0.00874, "test_loss": 4.605170425415039, "test_acc": 0.01, "lyapunov": 2.7251280341916684, "grad_norm": 0.11404915316549034, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.906842420574966e-05, "time_sec": 210.06771302223206 }, { "epoch": 132, "train_loss": 7.016419371795655, "train_acc": 0.00874, "test_loss": 4.605170411682129, "test_acc": 0.01, "lyapunov": 2.732408604048707, "grad_norm": 0.09643363295807468, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.5111757055874305e-05, "time_sec": 210.00194883346558 }, { "epoch": 133, "train_loss": 7.027043022460938, "train_acc": 0.00868, "test_loss": 4.605170454406738, "test_acc": 0.01, "lyapunov": 2.7380632366365787, "grad_norm": 0.08968045213589285, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.1359005254054254e-05, "time_sec": 210.257652759552 }, { "epoch": 134, "train_loss": 7.035782067260742, "train_acc": 0.00788, "test_loss": 4.605170135498047, "test_acc": 0.01, "lyapunov": 2.743028284033851, "grad_norm": 0.09341294223256699, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7811814881259484e-05, "time_sec": 209.9916913509369 }, { "epoch": 135, "train_loss": 7.071151198425293, "train_acc": 0.0096, "test_loss": 4.605170458984375, "test_acc": 0.01, "lyapunov": 2.760085921153388, "grad_norm": 0.09297571487706319, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.4471741852423218e-05, "time_sec": 210.2266161441803 }, { "epoch": 136, "train_loss": 7.034707638702392, "train_acc": 0.00916, "test_loss": 4.605170063018798, "test_acc": 0.01, "lyapunov": 2.742517843880617, "grad_norm": 0.08845657511108296, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.1340251233966362e-05, "time_sec": 210.06171536445618 }, { "epoch": 137, "train_loss": 7.0274613586425785, "train_acc": 0.00888, "test_loss": 4.605170385742188, "test_acc": 0.01, "lyapunov": 2.7373946475250945, "grad_norm": 0.10398852016478509, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.8418716601170932e-05, "time_sec": 209.9369614124298 }, { "epoch": 138, "train_loss": 7.025472250366211, "train_acc": 0.0095, "test_loss": 4.605170440673828, "test_acc": 0.01, "lyapunov": 2.736402528670133, "grad_norm": 0.09038559548514402, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568445e-05, "time_sec": 210.0793435573578 }, { "epoch": 139, "train_loss": 7.014701705322266, "train_acc": 0.00924, "test_loss": 4.605170342254639, "test_acc": 0.01, "lyapunov": 2.7315333481030084, "grad_norm": 0.10172944851300819, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.3210548563419845e-05, "time_sec": 210.09445595741272 }, { "epoch": 140, "train_loss": 7.003781777954101, "train_acc": 0.00918, "test_loss": 4.605170393371582, "test_acc": 0.01, "lyapunov": 2.7260687607328604, "grad_norm": 0.08766437036057895, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.0926199633097203e-05, "time_sec": 210.07793593406677 }, { "epoch": 141, "train_loss": 7.056627904968262, "train_acc": 0.01, "test_loss": 4.60516996383667, "test_acc": 0.01, "lyapunov": 2.7532575478029373, "grad_norm": 0.09441259373264534, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.856374635655688e-06, "time_sec": 210.04277729988098 }, { "epoch": 142, "train_loss": 6.989320599212647, "train_acc": 0.00982, "test_loss": 4.605170464324951, "test_acc": 0.01, "lyapunov": 2.718763675836041, "grad_norm": 0.08778246721140825, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.001981464747503e-06, "time_sec": 210.0390853881836 }, { "epoch": 143, "train_loss": 7.0194689248657225, "train_acc": 0.01, "test_loss": 4.605170278930664, "test_acc": 0.01, "lyapunov": 2.7337976069096714, "grad_norm": 0.088168048948687, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.3638335185058295e-06, "time_sec": 210.09060406684875 }, { "epoch": 144, "train_loss": 6.989500450592041, "train_acc": 0.01, "test_loss": 4.605170496368408, "test_acc": 0.01, "lyapunov": 2.71841098280514, "grad_norm": 0.08876604826979184, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761114e-06, "time_sec": 210.08678889274597 }, { "epoch": 145, "train_loss": 6.977725113220215, "train_acc": 0.01, "test_loss": 4.605170376586914, "test_acc": 0.01, "lyapunov": 2.712189649986794, "grad_norm": 0.08740841232989421, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.7390523158633524e-06, "time_sec": 210.07671403884888 }, { "epoch": 146, "train_loss": 7.063753978881836, "train_acc": 0.01, "test_loss": 4.605170356750488, "test_acc": 0.01, "lyapunov": 2.7562683031077273, "grad_norm": 0.08829447012972118, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.7535703752478133e-06, "time_sec": 210.06147265434265 }, { "epoch": 147, "train_loss": 6.97903392501831, "train_acc": 0.01, "test_loss": 4.605170056915283, "test_acc": 0.01, "lyapunov": 2.712921044405769, "grad_norm": 0.08792833595670006, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642196e-07, "time_sec": 210.12889552116394 }, { "epoch": 148, "train_loss": 7.024583773956299, "train_acc": 0.01, "test_loss": 4.605170234680176, "test_acc": 0.01, "lyapunov": 2.736283694386787, "grad_norm": 0.08841220675764232, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.38584950570808e-07, "time_sec": 210.09635305404663 }, { "epoch": 149, "train_loss": 6.9777571395874025, "train_acc": 0.01, "test_loss": 4.605170068359375, "test_acc": 0.01, "lyapunov": 2.7121838078169564, "grad_norm": 0.08769792454661404, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.096582625772501e-07, "time_sec": 210.0731065273285 }, { "epoch": 150, "train_loss": 6.9812114135742185, "train_acc": 0.01, "test_loss": 4.605170178985595, "test_acc": 0.01, "lyapunov": 2.71422858494322, "grad_norm": 0.08799513594752054, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 210.09806776046753 } ] } }