{ "vanilla": { "4": [ { "epoch": 1, "train_loss": 4.357881842498779, "train_acc": 0.09446, "test_loss": 3.5281315925598142, "test_acc": 0.1727, "lyapunov": null, "grad_norm": 6.340097491169349, "grad_max_sv": 4.973841696977615, "grad_min_sv": 1.1637189214486199e-07, "grad_condition": 49820869.21311478, "lr": 0.0009998903417374227, "time_sec": 17.58898615837097 }, { "epoch": 2, "train_loss": 3.5162495974731445, "train_acc": 0.18166, "test_loss": 3.361986777496338, "test_acc": 0.2212, "lyapunov": null, "grad_norm": 4.547965644035686, "grad_max_sv": 3.3173387169837953, "grad_min_sv": 8.365211060512578e-08, "grad_condition": 74579242.00846244, "lr": 0.0009995614150494292, "time_sec": 15.70747685432434 }, { "epoch": 3, "train_loss": 3.049772911834717, "train_acc": 0.25444, "test_loss": 2.928312567138672, "test_acc": 0.2881, "lyapunov": null, "grad_norm": 3.571965368749656, "grad_max_sv": 2.4133509695529938, "grad_min_sv": 6.657408836430179e-08, "grad_condition": 49614137.32958214, "lr": 0.0009990133642141358, "time_sec": 15.519535303115845 }, { "epoch": 4, "train_loss": 2.724564817428589, "train_acc": 0.31436, "test_loss": 2.6733072105407714, "test_acc": 0.331, "lyapunov": null, "grad_norm": 2.9818986561503382, "grad_max_sv": 1.8422472059726716, "grad_min_sv": 5.5166534979056436e-08, "grad_condition": 46971156.93483184, "lr": 0.0009982464296247522, "time_sec": 15.458869457244873 }, { "epoch": 5, "train_loss": 2.501728704910278, "train_acc": 0.35702, "test_loss": 2.674536157989502, "test_acc": 0.3431, "lyapunov": null, "grad_norm": 2.6380344213218527, "grad_max_sv": 1.605541154742241, "grad_min_sv": 5.005898049068036e-08, "grad_condition": 177063609.4994608, "lr": 0.0009972609476841367, "time_sec": 15.46523928642273 }, { "epoch": 6, "train_loss": 2.322341884765625, "train_acc": 0.39588, "test_loss": 2.440810569000244, "test_acc": 0.3786, "lyapunov": null, "grad_norm": 2.4046357640712968, "grad_max_sv": 1.3473579943180085, "grad_min_sv": 4.569443099143589e-08, "grad_condition": 315579058.91849506, "lr": 0.000996057350657239, "time_sec": 15.45302700996399 }, { "epoch": 7, "train_loss": 2.1792964128112793, "train_acc": 0.42468, "test_loss": 3.6083086921691896, "test_acc": 0.2555, "lyapunov": null, "grad_norm": 2.2401065243050575, "grad_max_sv": 1.250352716445923, "grad_min_sv": 4.339612316023311e-08, "grad_condition": 110140464.91678305, "lr": 0.000994636166481494, "time_sec": 15.459157943725586 }, { "epoch": 8, "train_loss": 2.06442552192688, "train_acc": 0.4489, "test_loss": 2.2239890716552733, "test_acc": 0.4291, "lyapunov": null, "grad_norm": 2.1012594692428856, "grad_max_sv": 1.1558537915349008, "grad_min_sv": 4.060080087131546e-08, "grad_condition": 62897451.54566701, "lr": 0.0009929980185352525, "time_sec": 15.45511507987976 }, { "epoch": 9, "train_loss": 1.9475363119125366, "train_acc": 0.47542, "test_loss": 2.2026602458953857, "test_acc": 0.4287, "lyapunov": null, "grad_norm": 1.9715615750533326, "grad_max_sv": 1.032596978545189, "grad_min_sv": 3.794599175710456e-08, "grad_condition": 65058485.034411274, "lr": 0.0009911436253643444, "time_sec": 15.45013976097107 }, { "epoch": 10, "train_loss": 1.8557951174163818, "train_acc": 0.49814, "test_loss": 2.1774634853363035, "test_acc": 0.4362, "lyapunov": null, "grad_norm": 1.8504614407647018, "grad_max_sv": 0.9416742533445358, "grad_min_sv": 3.512936608274231e-08, "grad_condition": 46677459.72355051, "lr": 0.0009890738003669028, "time_sec": 15.440587997436523 }, { "epoch": 11, "train_loss": 1.763924418334961, "train_acc": 0.5187, "test_loss": 2.4288942903518675, "test_acc": 0.4051, "lyapunov": null, "grad_norm": 1.7822208884902826, "grad_max_sv": 0.9033506259322166, "grad_min_sv": 3.467363161036019e-08, "grad_condition": 30024832.372439463, "lr": 0.00098678945143658, "time_sec": 15.469273567199707 }, { "epoch": 12, "train_loss": 1.6992105947494507, "train_acc": 0.53384, "test_loss": 2.3932419761657715, "test_acc": 0.4169, "lyapunov": null, "grad_norm": 1.6908902602895592, "grad_max_sv": 0.8336813643574714, "grad_min_sv": 3.225944931739555e-08, "grad_condition": 38720407.501370475, "lr": 0.0009842915805643154, "time_sec": 15.462818622589111 }, { "epoch": 13, "train_loss": 1.6412196295166015, "train_acc": 0.54614, "test_loss": 2.303184538459778, "test_acc": 0.4269, "lyapunov": null, "grad_norm": 1.6321649042964204, "grad_max_sv": 0.7801442697644234, "grad_min_sv": 3.083002481085728e-08, "grad_condition": 35858025.435112044, "lr": 0.000981581283398829, "time_sec": 15.466039419174194 }, { "epoch": 14, "train_loss": 1.5800055722045898, "train_acc": 0.56072, "test_loss": 2.34448659324646, "test_acc": 0.4166, "lyapunov": null, "grad_norm": 1.5709541615646672, "grad_max_sv": 0.7645063757896423, "grad_min_sv": 3.010382080819579e-08, "grad_condition": 425485709.2107061, "lr": 0.0009786597487660333, "time_sec": 15.457959175109863 }, { "epoch": 15, "train_loss": 1.522832469100952, "train_acc": 0.5756, "test_loss": 2.018679809951782, "test_acc": 0.4728, "lyapunov": null, "grad_norm": 1.516521779058338, "grad_max_sv": 0.7272973746061325, "grad_min_sv": 2.8604062869697076e-08, "grad_condition": 94477206.12080687, "lr": 0.0009755282581475766, "time_sec": 15.45545220375061 }, { "epoch": 16, "train_loss": 1.4677007636260986, "train_acc": 0.58764, "test_loss": 1.9565035533905029, "test_acc": 0.4933, "lyapunov": null, "grad_norm": 1.453059249026843, "grad_max_sv": 0.67758848965168, "grad_min_sv": 2.7189674285665878e-08, "grad_condition": 55305058.773309946, "lr": 0.0009721881851187403, "time_sec": 15.498552322387695 }, { "epoch": 17, "train_loss": 1.4236618344116212, "train_acc": 0.59808, "test_loss": 1.8643951223373414, "test_acc": 0.5109, "lyapunov": null, "grad_norm": 1.4131743339238467, "grad_max_sv": 0.6649302154779434, "grad_min_sv": 2.678126555383242e-08, "grad_condition": 54799789.840084136, "lr": 0.0009686409947459456, "time_sec": 15.623136520385742 }, { "epoch": 18, "train_loss": 1.3931309001159669, "train_acc": 0.60628, "test_loss": 1.9086449605941773, "test_acc": 0.5161, "lyapunov": null, "grad_norm": 1.3774038135699718, "grad_max_sv": 0.6381687998771668, "grad_min_sv": 2.581961362491114e-08, "grad_condition": 53150613.95565927, "lr": 0.0009648882429441254, "time_sec": 16.356106758117676 }, { "epoch": 19, "train_loss": 1.332000114517212, "train_acc": 0.61976, "test_loss": 1.9447854751586915, "test_acc": 0.4998, "lyapunov": null, "grad_norm": 1.3339422136321473, "grad_max_sv": 0.6115798369050026, "grad_min_sv": 2.4986909905738708e-08, "grad_condition": 76361025.08562623, "lr": 0.00096093157579425, "time_sec": 15.486042737960815 }, { "epoch": 20, "train_loss": 1.2998398171234131, "train_acc": 0.62884, "test_loss": 1.9578068918228149, "test_acc": 0.499, "lyapunov": null, "grad_norm": 1.3044281680786607, "grad_max_sv": 0.5868817433714867, "grad_min_sv": 2.460346111539738e-08, "grad_condition": 1416469832.4203677, "lr": 0.0009567727288213001, "time_sec": 15.45453691482544 }, { "epoch": 21, "train_loss": 1.266195481147766, "train_acc": 0.63696, "test_loss": 2.05823407535553, "test_acc": 0.4838, "lyapunov": null, "grad_norm": 1.2726472953754493, "grad_max_sv": 0.5784675382077694, "grad_min_sv": 2.384093428370315e-08, "grad_condition": 156182020.27727562, "lr": 0.0009524135262330095, "time_sec": 15.506311893463135 }, { "epoch": 22, "train_loss": 1.2384513986587524, "train_acc": 0.64552, "test_loss": 1.9120031692504882, "test_acc": 0.5172, "lyapunov": null, "grad_norm": 1.252497757690001, "grad_max_sv": 0.5717031776905059, "grad_min_sv": 2.3619134396912768e-08, "grad_condition": 67519805.29707912, "lr": 0.0009478558801197061, "time_sec": 15.47418475151062 }, { "epoch": 23, "train_loss": 1.1993658528137208, "train_acc": 0.65306, "test_loss": 1.7887667993545533, "test_acc": 0.5382, "lyapunov": null, "grad_norm": 1.2275759420533918, "grad_max_sv": 0.5570299223065376, "grad_min_sv": 2.2936629940836784e-08, "grad_condition": 165671008.87666664, "lr": 0.000943101789615607, "time_sec": 15.476239204406738 }, { "epoch": 24, "train_loss": 1.1695793395996095, "train_acc": 0.66222, "test_loss": 1.9164223749160767, "test_acc": 0.5069, "lyapunov": null, "grad_norm": 1.19558806415952, "grad_max_sv": 0.5234090469777584, "grad_min_sv": 2.2025900239808215e-08, "grad_condition": 38525149.552328385, "lr": 0.0009381533400219313, "time_sec": 15.470394372940063 }, { "epoch": 25, "train_loss": 1.1371285773468018, "train_acc": 0.66864, "test_loss": 1.9049333578109742, "test_acc": 0.5198, "lyapunov": null, "grad_norm": 1.1691991255738516, "grad_max_sv": 0.5114153914153576, "grad_min_sv": 2.1633911190255262e-08, "grad_condition": 40420362.43580131, "lr": 0.0009330127018922189, "time_sec": 15.475921392440796 }, { "epoch": 26, "train_loss": 1.0984287197875977, "train_acc": 0.67622, "test_loss": 1.9236036626815796, "test_acc": 0.5105, "lyapunov": null, "grad_norm": 1.1491919288876447, "grad_max_sv": 0.5075508892536164, "grad_min_sv": 2.156528700753002e-08, "grad_condition": 52800149.44483626, "lr": 0.000927682130080253, "time_sec": 15.560164213180542 }, { "epoch": 27, "train_loss": 1.085814157333374, "train_acc": 0.68168, "test_loss": 1.854748671913147, "test_acc": 0.5303, "lyapunov": null, "grad_norm": 1.132642015283084, "grad_max_sv": 0.5079298578202724, "grad_min_sv": 2.0747377492413844e-08, "grad_condition": 40886114.03567152, "lr": 0.0009221639627510072, "time_sec": 15.515005350112915 }, { "epoch": 28, "train_loss": 1.0481378091812135, "train_acc": 0.6919, "test_loss": 1.787252332687378, "test_acc": 0.5447, "lyapunov": null, "grad_norm": 1.1084077878736969, "grad_max_sv": 0.48980700969696045, "grad_min_sv": 2.03924750370732e-08, "grad_condition": 144667188.87541157, "lr": 0.0009164606203550494, "time_sec": 15.477014064788818 }, { "epoch": 29, "train_loss": 1.0372727437210083, "train_acc": 0.6921, "test_loss": 1.8922377561569215, "test_acc": 0.5273, "lyapunov": null, "grad_norm": 1.0954714543743995, "grad_max_sv": 0.4976396970450878, "grad_min_sv": 2.0566780979669463e-08, "grad_condition": 42633949.37567282, "lr": 0.0009105746045668516, "time_sec": 15.492783546447754 }, { "epoch": 30, "train_loss": 0.9987185321426392, "train_acc": 0.70062, "test_loss": 1.8061668651580811, "test_acc": 0.5499, "lyapunov": null, "grad_norm": 1.0825800954246438, "grad_max_sv": 0.47690314128994943, "grad_min_sv": 2.0063227677488694e-08, "grad_condition": 114878509.5913475, "lr": 0.0009045084971874733, "time_sec": 15.465651512145996 }, { "epoch": 31, "train_loss": 0.9715755378532409, "train_acc": 0.71128, "test_loss": 2.5642683250427245, "test_acc": 0.434, "lyapunov": null, "grad_norm": 1.0638185111036047, "grad_max_sv": 0.46563360542058946, "grad_min_sv": 1.9753409723904936e-08, "grad_condition": 54475045.10178232, "lr": 0.0008982649590120977, "time_sec": 15.514770984649658 }, { "epoch": 32, "train_loss": 0.9588010568237305, "train_acc": 0.71496, "test_loss": 2.0556532321929932, "test_acc": 0.5074, "lyapunov": null, "grad_norm": 1.0445708403852423, "grad_max_sv": 0.4599720284342766, "grad_min_sv": 1.917516104857353e-08, "grad_condition": 71151837.22383483, "lr": 0.0008918467286629196, "time_sec": 15.503283977508545 }, { "epoch": 33, "train_loss": 0.93256760181427, "train_acc": 0.72162, "test_loss": 1.751899316596985, "test_acc": 0.5538, "lyapunov": null, "grad_norm": 1.0334590332592064, "grad_max_sv": 0.4484298422932625, "grad_min_sv": 1.938236048604214e-08, "grad_condition": 38422022.12695898, "lr": 0.0008852566213878943, "time_sec": 15.474556922912598 }, { "epoch": 34, "train_loss": 0.9141502959060669, "train_acc": 0.72538, "test_loss": 1.8125969528198242, "test_acc": 0.5461, "lyapunov": null, "grad_norm": 1.020200863648912, "grad_max_sv": 0.44143804982304574, "grad_min_sv": 1.856398942207127e-08, "grad_condition": 117935929.65389478, "lr": 0.000878497527825878, "time_sec": 15.485417366027832 }, { "epoch": 35, "train_loss": 0.8939477145385742, "train_acc": 0.72998, "test_loss": 1.8124234422683716, "test_acc": 0.5558, "lyapunov": null, "grad_norm": 1.0031609444634824, "grad_max_sv": 0.4364132799208164, "grad_min_sv": 1.819760966359496e-08, "grad_condition": 38733067.30472837, "lr": 0.000871572412738697, "time_sec": 15.474757432937622 }, { "epoch": 36, "train_loss": 0.8783849499893188, "train_acc": 0.7375, "test_loss": 2.0318579233169554, "test_acc": 0.5215, "lyapunov": null, "grad_norm": 0.993071712133669, "grad_max_sv": 0.4357504576444626, "grad_min_sv": 1.8338578772203463e-08, "grad_condition": 66584075.59983899, "lr": 0.0008644843137107055, "time_sec": 15.47328805923462 }, { "epoch": 37, "train_loss": 0.8544786010742188, "train_acc": 0.74252, "test_loss": 1.7350282289505006, "test_acc": 0.5703, "lyapunov": null, "grad_norm": 0.9779352878833807, "grad_max_sv": 0.42835590019822123, "grad_min_sv": 1.7869282904758865e-08, "grad_condition": 39240168.34852584, "lr": 0.0008572363398164014, "time_sec": 15.479693412780762 }, { "epoch": 38, "train_loss": 0.8369656467819214, "train_acc": 0.7451, "test_loss": 1.8668952745437621, "test_acc": 0.545, "lyapunov": null, "grad_norm": 0.9729051326605097, "grad_max_sv": 0.42709693908691404, "grad_min_sv": 1.8001504511339085e-08, "grad_condition": 69145831.04846993, "lr": 0.0008498316702566826, "time_sec": 15.467434167861938 }, { "epoch": 39, "train_loss": 0.8145392098999024, "train_acc": 0.75306, "test_loss": 1.8897558479309082, "test_acc": 0.5503, "lyapunov": null, "grad_norm": 0.9541931051989594, "grad_max_sv": 0.4177068963646889, "grad_min_sv": 1.733705095180449e-08, "grad_condition": 47970887.65811751, "lr": 0.0008422735529643442, "time_sec": 15.485415935516357 }, { "epoch": 40, "train_loss": 0.807158277015686, "train_acc": 0.75318, "test_loss": 1.9477338481903077, "test_acc": 0.5448, "lyapunov": null, "grad_norm": 0.954786311576214, "grad_max_sv": 0.4165697038173676, "grad_min_sv": 1.7467571476748044e-08, "grad_condition": 71184092.08959822, "lr": 0.0008345653031794289, "time_sec": 15.485467195510864 }, { "epoch": 41, "train_loss": 0.7800393992233277, "train_acc": 0.76146, "test_loss": 1.8521117683410644, "test_acc": 0.558, "lyapunov": null, "grad_norm": 0.9354361850547955, "grad_max_sv": 0.39634769782423973, "grad_min_sv": 1.7005577766619763e-08, "grad_condition": 138342469.93119007, "lr": 0.0008267103019950526, "time_sec": 15.47174334526062 }, { "epoch": 42, "train_loss": 0.7673079490661621, "train_acc": 0.76286, "test_loss": 1.7608818145751952, "test_acc": 0.577, "lyapunov": null, "grad_norm": 0.9379451954941195, "grad_max_sv": 0.4147824175655842, "grad_min_sv": 1.7161911683612197e-08, "grad_condition": 393263932.238869, "lr": 0.0008187119948743447, "time_sec": 15.480841875076294 }, { "epoch": 43, "train_loss": 0.7557721022987366, "train_acc": 0.76692, "test_loss": 1.8332683414459228, "test_acc": 0.5644, "lyapunov": null, "grad_norm": 0.9301101362040648, "grad_max_sv": 0.40277465879917146, "grad_min_sv": 1.665620945143914e-08, "grad_condition": 317094927.94089293, "lr": 0.000810573890139155, "time_sec": 15.466366291046143 }, { "epoch": 44, "train_loss": 0.7345015475463867, "train_acc": 0.77376, "test_loss": 2.0360315671920777, "test_acc": 0.5296, "lyapunov": null, "grad_norm": 0.9112815822240762, "grad_max_sv": 0.39828494787216184, "grad_min_sv": 1.6604482540208235e-08, "grad_condition": 1254182168.7542708, "lr": 0.0008022995574311873, "time_sec": 15.476161003112793 }, { "epoch": 45, "train_loss": 0.7160864910125733, "train_acc": 0.77798, "test_loss": 2.0404258838653564, "test_acc": 0.5382, "lyapunov": null, "grad_norm": 0.8941597810728247, "grad_max_sv": 0.397457180917263, "grad_min_sv": 1.6262863201943478e-08, "grad_condition": 84531533.80346392, "lr": 0.0007938926261462363, "time_sec": 15.475411176681519 }, { "epoch": 46, "train_loss": 0.6994082283973694, "train_acc": 0.78516, "test_loss": 1.8352840042114258, "test_acc": 0.5715, "lyapunov": null, "grad_norm": 0.8836953876364382, "grad_max_sv": 0.38196621984243395, "grad_min_sv": 1.585408843512992e-08, "grad_condition": 76847427.02204503, "lr": 0.0007853567838422158, "time_sec": 15.509245872497559 }, { "epoch": 47, "train_loss": 0.6929370341110229, "train_acc": 0.786, "test_loss": 1.7921090829849242, "test_acc": 0.5714, "lyapunov": null, "grad_norm": 0.8861845328251086, "grad_max_sv": 0.39072656705975534, "grad_min_sv": 1.5896329046182282e-08, "grad_condition": 600990537.5108824, "lr": 0.0007766957746216719, "time_sec": 15.538230895996094 }, { "epoch": 48, "train_loss": 0.6808394806671143, "train_acc": 0.79018, "test_loss": 1.8164992214202882, "test_acc": 0.5718, "lyapunov": null, "grad_norm": 0.8747589044293621, "grad_max_sv": 0.3651046365499496, "grad_min_sv": 1.5464912742416125e-08, "grad_condition": 108472217.28693132, "lr": 0.0007679133974894982, "time_sec": 15.491382360458374 }, { "epoch": 49, "train_loss": 0.6645313382148743, "train_acc": 0.79124, "test_loss": 1.9076677312850951, "test_acc": 0.5604, "lyapunov": null, "grad_norm": 0.8702547527458556, "grad_max_sv": 0.3733041428029537, "grad_min_sv": 1.552003626170695e-08, "grad_condition": 37206285.59276767, "lr": 0.000759013504686565, "time_sec": 15.492026090621948 }, { "epoch": 50, "train_loss": 0.6496543109512329, "train_acc": 0.79798, "test_loss": 1.7902040550231935, "test_acc": 0.577, "lyapunov": null, "grad_norm": 0.8583943232969492, "grad_max_sv": 0.3693894289433956, "grad_min_sv": 1.526528436018859e-08, "grad_condition": 167614304.3259273, "lr": 0.0007499999999999998, "time_sec": 15.511015892028809 }, { "epoch": 51, "train_loss": 0.6329201017856598, "train_acc": 0.8008, "test_loss": 1.8939409488677978, "test_acc": 0.5669, "lyapunov": null, "grad_norm": 0.8468251234327242, "grad_max_sv": 0.379767844825983, "grad_min_sv": 1.5527148693184055e-08, "grad_condition": 40445680.98758187, "lr": 0.0007408768370508575, "time_sec": 15.502861976623535 }, { "epoch": 52, "train_loss": 0.6156794411849975, "train_acc": 0.8076, "test_loss": 1.8557664161682128, "test_acc": 0.5669, "lyapunov": null, "grad_norm": 0.8409556426090318, "grad_max_sv": 0.3604695089161396, "grad_min_sv": 1.5232246320523447e-08, "grad_condition": 154891483.950261, "lr": 0.0007316480175599307, "time_sec": 15.50012731552124 }, { "epoch": 53, "train_loss": 0.6097512643051147, "train_acc": 0.80932, "test_loss": 1.9206684701919556, "test_acc": 0.5625, "lyapunov": null, "grad_norm": 0.8343400645564791, "grad_max_sv": 0.36483332961797715, "grad_min_sv": 1.4756883175842672e-08, "grad_condition": 60983068.9144889, "lr": 0.0007223175895924635, "time_sec": 15.473671436309814 }, { "epoch": 54, "train_loss": 0.5996515681266784, "train_acc": 0.81028, "test_loss": 1.813775136566162, "test_acc": 0.5799, "lyapunov": null, "grad_norm": 0.8292003009813924, "grad_max_sv": 0.3576398268342018, "grad_min_sv": 1.4879297414310821e-08, "grad_condition": 169462696.72509637, "lr": 0.0007128896457825361, "time_sec": 15.514740228652954 }, { "epoch": 55, "train_loss": 0.583572147731781, "train_acc": 0.81692, "test_loss": 2.1540262565612793, "test_acc": 0.5359, "lyapunov": null, "grad_norm": 0.8153888602407285, "grad_max_sv": 0.35695644542574884, "grad_min_sv": 1.4523149247103185e-08, "grad_condition": 121177173.48603642, "lr": 0.0007033683215378998, "time_sec": 15.494624614715576 }, { "epoch": 56, "train_loss": 0.5730211604690552, "train_acc": 0.81882, "test_loss": 1.9024797750473021, "test_acc": 0.5681, "lyapunov": null, "grad_norm": 0.8114470689653183, "grad_max_sv": 0.3512945234775543, "grad_min_sv": 1.4168293734420634e-08, "grad_condition": 1195593278.9067845, "lr": 0.0006937577932260512, "time_sec": 15.484891176223755 }, { "epoch": 57, "train_loss": 0.5623767246627808, "train_acc": 0.82144, "test_loss": 1.8823775342941285, "test_acc": 0.5727, "lyapunov": null, "grad_norm": 0.8082731215074979, "grad_max_sv": 0.348369175940752, "grad_min_sv": 1.429975417729934e-08, "grad_condition": 63927698.94124661, "lr": 0.0006840622763423388, "time_sec": 15.500881433486938 }, { "epoch": 58, "train_loss": 0.5483553691482544, "train_acc": 0.82696, "test_loss": 1.8506002332687377, "test_acc": 0.5809, "lyapunov": null, "grad_norm": 0.7992259508625827, "grad_max_sv": 0.341405463218689, "grad_min_sv": 1.3835257317573735e-08, "grad_condition": 33930048.946812846, "lr": 0.0006742860236609073, "time_sec": 15.480631589889526 }, { "epoch": 59, "train_loss": 0.5366774555110931, "train_acc": 0.8303, "test_loss": 1.825086770439148, "test_acc": 0.5833, "lyapunov": null, "grad_norm": 0.7819063927350494, "grad_max_sv": 0.3418069466948509, "grad_min_sv": 1.3836575564691103e-08, "grad_condition": 408216925.10828066, "lr": 0.0006644333233692913, "time_sec": 15.500194072723389 }, { "epoch": 60, "train_loss": 0.5336303442287446, "train_acc": 0.83014, "test_loss": 1.8931641094207763, "test_acc": 0.5815, "lyapunov": null, "grad_norm": 0.7872838454858564, "grad_max_sv": 0.3333701379597187, "grad_min_sv": 1.3876314406248771e-08, "grad_condition": 438039568.05699426, "lr": 0.0006545084971874734, "time_sec": 15.50975775718689 }, { "epoch": 61, "train_loss": 0.5172760334014893, "train_acc": 0.8346, "test_loss": 1.8987928335189819, "test_acc": 0.579, "lyapunov": null, "grad_norm": 0.7761151334812662, "grad_max_sv": 0.34407150372862816, "grad_min_sv": 1.3653881279773738e-08, "grad_condition": 74302812.53353639, "lr": 0.0006445158984722354, "time_sec": 15.496349096298218 }, { "epoch": 62, "train_loss": 0.5046570606422425, "train_acc": 0.83994, "test_loss": 1.8855070373535157, "test_acc": 0.5827, "lyapunov": null, "grad_norm": 0.7637023137146217, "grad_max_sv": 0.3265983276069164, "grad_min_sv": 1.3850480627165818e-08, "grad_condition": 140662163.06722394, "lr": 0.0006344599103076324, "time_sec": 15.499541997909546 }, { "epoch": 63, "train_loss": 0.5043497357273102, "train_acc": 0.8385, "test_loss": 1.9895195541381836, "test_acc": 0.5677, "lyapunov": null, "grad_norm": 0.7677478821534836, "grad_max_sv": 0.33033859431743623, "grad_min_sv": 1.32192005543319e-08, "grad_condition": 238327868.213135, "lr": 0.0006243449435824269, "time_sec": 15.487115621566772 }, { "epoch": 64, "train_loss": 0.4833570729255676, "train_acc": 0.84588, "test_loss": 1.8681790885925293, "test_acc": 0.586, "lyapunov": null, "grad_norm": 0.751862285796187, "grad_max_sv": 0.3356017153710127, "grad_min_sv": 1.374610183761324e-08, "grad_condition": 301923677.0958418, "lr": 0.0006141754350553275, "time_sec": 15.47073483467102 }, { "epoch": 65, "train_loss": 0.4746548810005188, "train_acc": 0.85036, "test_loss": 1.8871611476898194, "test_acc": 0.5849, "lyapunov": null, "grad_norm": 0.7470026047014822, "grad_max_sv": 0.3292991783469915, "grad_min_sv": 1.3641982613693537e-08, "grad_condition": 89497941.46737906, "lr": 0.0006039558454088793, "time_sec": 15.498655796051025 }, { "epoch": 66, "train_loss": 0.4682476936244965, "train_acc": 0.85176, "test_loss": 1.9322247032165527, "test_acc": 0.5781, "lyapunov": null, "grad_norm": 0.746205818915284, "grad_max_sv": 0.324980178847909, "grad_min_sv": 1.332827236268791e-08, "grad_condition": 515634785.2347584, "lr": 0.000593690657292862, "time_sec": 15.49347710609436 }, { "epoch": 67, "train_loss": 0.4535627157497406, "train_acc": 0.85524, "test_loss": 1.9315398765563965, "test_acc": 0.5792, "lyapunov": null, "grad_norm": 0.7351128594354965, "grad_max_sv": 0.32144386470317843, "grad_min_sv": 1.316271100388136e-08, "grad_condition": 198503645.63195387, "lr": 0.0005833843733580507, "time_sec": 15.485307216644287 }, { "epoch": 68, "train_loss": 0.44375179916381835, "train_acc": 0.85868, "test_loss": 1.9626713150024413, "test_acc": 0.5797, "lyapunov": null, "grad_norm": 0.7275082319568421, "grad_max_sv": 0.31693296767771245, "grad_min_sv": 1.2464710682147037e-08, "grad_condition": 448992015.43105906, "lr": 0.0005730415142812054, "time_sec": 15.502485990524292 }, { "epoch": 69, "train_loss": 0.4375394599914551, "train_acc": 0.8578, "test_loss": 1.933611646080017, "test_acc": 0.5841, "lyapunov": null, "grad_norm": 0.7285377709438317, "grad_max_sv": 0.3246665924787521, "grad_min_sv": 1.2657065806900847e-08, "grad_condition": 183352263.73309737, "lr": 0.0005626666167821517, "time_sec": 15.504365682601929 }, { "epoch": 70, "train_loss": 0.4293804252910614, "train_acc": 0.86176, "test_loss": 1.9648184246063232, "test_acc": 0.5803, "lyapunov": null, "grad_norm": 0.7201252438636403, "grad_max_sv": 0.32932178787887095, "grad_min_sv": 1.2632546332082274e-08, "grad_condition": 152515630.29556593, "lr": 0.0005522642316338265, "time_sec": 15.50436282157898 }, { "epoch": 71, "train_loss": 0.4283500701713562, "train_acc": 0.86214, "test_loss": 1.9075251319885254, "test_acc": 0.5925, "lyapunov": null, "grad_norm": 0.7191799969742115, "grad_max_sv": 0.31320683732628823, "grad_min_sv": 1.3020388655790583e-08, "grad_condition": 140157658.32034963, "lr": 0.0005418389216661573, "time_sec": 15.498285293579102 }, { "epoch": 72, "train_loss": 0.41739362247467043, "train_acc": 0.86518, "test_loss": 1.9817939153671265, "test_acc": 0.5787, "lyapunov": null, "grad_norm": 0.7089702462612528, "grad_max_sv": 0.31360611245036124, "grad_min_sv": 1.2536597712286407e-08, "grad_condition": 419598262.18900955, "lr": 0.0005313952597646563, "time_sec": 15.484673976898193 }, { "epoch": 73, "train_loss": 0.4100272283267975, "train_acc": 0.8682, "test_loss": 1.9430673105239868, "test_acc": 0.5896, "lyapunov": null, "grad_norm": 0.701251782999493, "grad_max_sv": 0.31041153334081173, "grad_min_sv": 1.2882357953384466e-08, "grad_condition": 168668664.161966, "lr": 0.0005209378268645994, "time_sec": 15.47413682937622 }, { "epoch": 74, "train_loss": 0.399578921251297, "train_acc": 0.87068, "test_loss": 1.9265120712280273, "test_acc": 0.5864, "lyapunov": null, "grad_norm": 0.6934025786184035, "grad_max_sv": 0.3066574942320585, "grad_min_sv": 1.2560646439098433e-08, "grad_condition": 129867930.4907889, "lr": 0.0005104712099416781, "time_sec": 15.502904891967773 }, { "epoch": 75, "train_loss": 0.38554568584918975, "train_acc": 0.87558, "test_loss": 1.9176615629196168, "test_acc": 0.5925, "lyapunov": null, "grad_norm": 0.6895198915282967, "grad_max_sv": 0.3080108392983675, "grad_min_sv": 1.229493239038532e-08, "grad_condition": 1984776951.5641804, "lr": 0.0004999999999999996, "time_sec": 15.504841089248657 }, { "epoch": 76, "train_loss": 0.3888973752117157, "train_acc": 0.87366, "test_loss": 1.9323603094100952, "test_acc": 0.5905, "lyapunov": null, "grad_norm": 0.689575361251709, "grad_max_sv": 0.30503964237868786, "grad_min_sv": 1.223273589129499e-08, "grad_condition": 592473189.0734928, "lr": 0.0004895287900583212, "time_sec": 15.488545894622803 }, { "epoch": 77, "train_loss": 0.375536418132782, "train_acc": 0.87906, "test_loss": 1.9612086307525636, "test_acc": 0.5896, "lyapunov": null, "grad_norm": 0.6799899173694914, "grad_max_sv": 0.28870479166507723, "grad_min_sv": 1.1852196383013713e-08, "grad_condition": 974539567.6482589, "lr": 0.0004790621731353997, "time_sec": 15.496360778808594 }, { "epoch": 78, "train_loss": 0.3633386760520935, "train_acc": 0.88388, "test_loss": 2.0136638622283938, "test_acc": 0.5813, "lyapunov": null, "grad_norm": 0.669468067176516, "grad_max_sv": 0.2999464552849531, "grad_min_sv": 1.1967348311804626e-08, "grad_condition": 336932159.827844, "lr": 0.000468604740235343, "time_sec": 15.49899435043335 }, { "epoch": 79, "train_loss": 0.3648362389755249, "train_acc": 0.88286, "test_loss": 1.962812972831726, "test_acc": 0.5878, "lyapunov": null, "grad_norm": 0.6712781124195144, "grad_max_sv": 0.3077389158308506, "grad_min_sv": 1.1902174327019233e-08, "grad_condition": 79151255.2676374, "lr": 0.00045816107833384175, "time_sec": 15.50163722038269 }, { "epoch": 80, "train_loss": 0.3587533256816864, "train_acc": 0.88438, "test_loss": 2.031941645812988, "test_acc": 0.5782, "lyapunov": null, "grad_norm": 0.6682785418366496, "grad_max_sv": 0.3066766869276762, "grad_min_sv": 1.2061256379237995e-08, "grad_condition": 166882222.61886424, "lr": 0.0004477357683661729, "time_sec": 15.493919610977173 }, { "epoch": 81, "train_loss": 0.3532279273414612, "train_acc": 0.88642, "test_loss": 1.9712375566482543, "test_acc": 0.5907, "lyapunov": null, "grad_norm": 0.6617439515766644, "grad_max_sv": 0.2908315297216177, "grad_min_sv": 1.1691992539419882e-08, "grad_condition": 159733352.26610285, "lr": 0.00043733338321784746, "time_sec": 15.49502420425415 }, { "epoch": 82, "train_loss": 0.337565802192688, "train_acc": 0.8912, "test_loss": 2.0504629846572877, "test_acc": 0.5809, "lyapunov": null, "grad_norm": 0.6468139784059553, "grad_max_sv": 0.29187568798661234, "grad_min_sv": 1.1621694805114122e-08, "grad_condition": 4917199791.496119, "lr": 0.0004269584857187939, "time_sec": 15.506073236465454 }, { "epoch": 83, "train_loss": 0.3370664621257782, "train_acc": 0.8903, "test_loss": 1.9356835838317872, "test_acc": 0.5944, "lyapunov": null, "grad_norm": 0.6494703611205956, "grad_max_sv": 0.29382526241242884, "grad_min_sv": 1.174881616096586e-08, "grad_condition": 730478169.7287635, "lr": 0.0004166156266419484, "time_sec": 15.50250792503357 }, { "epoch": 84, "train_loss": 0.329011485414505, "train_acc": 0.8946, "test_loss": 2.079398715400696, "test_acc": 0.5797, "lyapunov": null, "grad_norm": 0.643698144652478, "grad_max_sv": 0.29514241628348825, "grad_min_sv": 1.140666323123582e-08, "grad_condition": 487746924.1063552, "lr": 0.0004063093427071373, "time_sec": 15.505268812179565 }, { "epoch": 85, "train_loss": 0.3234008149909973, "train_acc": 0.89458, "test_loss": 1.9295039024353027, "test_acc": 0.5972, "lyapunov": null, "grad_norm": 0.6406406419682773, "grad_max_sv": 0.28015601113438604, "grad_min_sv": 1.1093708248907652e-08, "grad_condition": 168584514.79069662, "lr": 0.0003960441545911199, "time_sec": 15.517300128936768 }, { "epoch": 86, "train_loss": 0.3155531369972229, "train_acc": 0.89746, "test_loss": 1.9418060377120971, "test_acc": 0.5998, "lyapunov": null, "grad_norm": 0.6350703488704397, "grad_max_sv": 0.29371371641755106, "grad_min_sv": 1.1439264175315545e-08, "grad_condition": 137016772.41396585, "lr": 0.0003858245649446718, "time_sec": 15.547461986541748 }, { "epoch": 87, "train_loss": 0.3074404651927948, "train_acc": 0.90046, "test_loss": 1.9792525926589966, "test_acc": 0.5962, "lyapunov": null, "grad_norm": 0.6264501533131277, "grad_max_sv": 0.2842790149152279, "grad_min_sv": 1.0928390427257691e-08, "grad_condition": 1305488613.824437, "lr": 0.00037565505641757235, "time_sec": 15.51766037940979 }, { "epoch": 88, "train_loss": 0.30229676830768587, "train_acc": 0.90176, "test_loss": 1.976724716567993, "test_acc": 0.5936, "lyapunov": null, "grad_norm": 0.6211883734687677, "grad_max_sv": 0.2838983990252018, "grad_min_sv": 1.1175761286449232e-08, "grad_condition": 333355247.3488082, "lr": 0.00036554008969236695, "time_sec": 15.503639221191406 }, { "epoch": 89, "train_loss": 0.2988234822654724, "train_acc": 0.90424, "test_loss": 1.9976719675064087, "test_acc": 0.5967, "lyapunov": null, "grad_norm": 0.6213370027659331, "grad_max_sv": 0.28663169853389264, "grad_min_sv": 1.1367645391321956e-08, "grad_condition": 134336770.77173668, "lr": 0.0003554841015277638, "time_sec": 15.497193574905396 }, { "epoch": 90, "train_loss": 0.29101773542404175, "train_acc": 0.9066, "test_loss": 1.9723329444885254, "test_acc": 0.5984, "lyapunov": null, "grad_norm": 0.6117671492586956, "grad_max_sv": 0.2787142962217331, "grad_min_sv": 1.082959833688564e-08, "grad_condition": 693540712.1308935, "lr": 0.000345491502812526, "time_sec": 15.504314661026001 }, { "epoch": 91, "train_loss": 0.29135215978622436, "train_acc": 0.90466, "test_loss": 1.9791620111465453, "test_acc": 0.5971, "lyapunov": null, "grad_norm": 0.6144584827027046, "grad_max_sv": 0.2858317792415619, "grad_min_sv": 1.112117410219729e-08, "grad_condition": 533297710.9846781, "lr": 0.0003355666766307081, "time_sec": 15.508234977722168 }, { "epoch": 92, "train_loss": 0.28011693614006045, "train_acc": 0.90924, "test_loss": 1.9835497787475587, "test_acc": 0.5948, "lyapunov": null, "grad_norm": 0.6018450358334453, "grad_max_sv": 0.2840783912688494, "grad_min_sv": 1.073533659606829e-08, "grad_condition": 553082386.2675663, "lr": 0.00032571397633909225, "time_sec": 15.51693344116211 }, { "epoch": 93, "train_loss": 0.28014948011398316, "train_acc": 0.91044, "test_loss": 1.9525927974700927, "test_acc": 0.5988, "lyapunov": null, "grad_norm": 0.5970591995758349, "grad_max_sv": 0.27580611146986483, "grad_min_sv": 1.084302959390368e-08, "grad_condition": 267617873.38796434, "lr": 0.00031593772365766094, "time_sec": 15.507484197616577 }, { "epoch": 94, "train_loss": 0.2744602131557465, "train_acc": 0.90992, "test_loss": 1.9839596082687379, "test_acc": 0.5989, "lyapunov": null, "grad_norm": 0.5927553038661005, "grad_max_sv": 0.2760546799749136, "grad_min_sv": 1.0739196502950258e-08, "grad_condition": 394969307.85135096, "lr": 0.0003062422067739483, "time_sec": 15.516487121582031 }, { "epoch": 95, "train_loss": 0.2686861476325989, "train_acc": 0.91254, "test_loss": 1.977996702194214, "test_acc": 0.605, "lyapunov": null, "grad_norm": 0.5892956934064133, "grad_max_sv": 0.27805082462728026, "grad_min_sv": 1.052729135583158e-08, "grad_condition": 344387886.3070652, "lr": 0.00029663167846209965, "time_sec": 15.495723962783813 }, { "epoch": 96, "train_loss": 0.26172939152240754, "train_acc": 0.91622, "test_loss": 2.0434574504852296, "test_acc": 0.5946, "lyapunov": null, "grad_norm": 0.5805032172314536, "grad_max_sv": 0.2648235227912664, "grad_min_sv": 1.057376605411841e-08, "grad_condition": 771027815.348639, "lr": 0.00028711035421746345, "time_sec": 15.489963293075562 }, { "epoch": 97, "train_loss": 0.25184455102920533, "train_acc": 0.91832, "test_loss": 1.9518341100692749, "test_acc": 0.6097, "lyapunov": null, "grad_norm": 0.5774864526737941, "grad_max_sv": 0.26801337823271754, "grad_min_sv": 1.0317103195465332e-08, "grad_condition": 602185384.328079, "lr": 0.00027768241040753615, "time_sec": 15.513015985488892 }, { "epoch": 98, "train_loss": 0.24914393192768097, "train_acc": 0.91812, "test_loss": 1.983034141921997, "test_acc": 0.6073, "lyapunov": null, "grad_norm": 0.573198769045943, "grad_max_sv": 0.2713981341570616, "grad_min_sv": 1.03603865028723e-08, "grad_condition": 87200014.42748493, "lr": 0.00026835198244006903, "time_sec": 15.507933616638184 }, { "epoch": 99, "train_loss": 0.2450516757631302, "train_acc": 0.9213, "test_loss": 2.0576653924942017, "test_acc": 0.5987, "lyapunov": null, "grad_norm": 0.565340793701802, "grad_max_sv": 0.26787664406001566, "grad_min_sv": 1.0084340480113335e-08, "grad_condition": 993815528.2154503, "lr": 0.0002591231629491421, "time_sec": 15.498576164245605 }, { "epoch": 100, "train_loss": 0.2435112312412262, "train_acc": 0.92126, "test_loss": 1.9808508350372314, "test_acc": 0.6083, "lyapunov": null, "grad_norm": 0.5671331888797334, "grad_max_sv": 0.2718590907752514, "grad_min_sv": 1.0603882181613872e-08, "grad_condition": 515734941.7641746, "lr": 0.0002499999999999997, "time_sec": 15.509106874465942 }, { "epoch": 101, "train_loss": 0.23981757608413695, "train_acc": 0.92198, "test_loss": 1.9874406982421875, "test_acc": 0.6051, "lyapunov": null, "grad_norm": 0.5662694992474826, "grad_max_sv": 0.27430120259523394, "grad_min_sv": 1.0230437299217631e-08, "grad_condition": 552718981.9754595, "lr": 0.00024098649531343477, "time_sec": 15.50493860244751 }, { "epoch": 102, "train_loss": 0.23594800971031188, "train_acc": 0.92386, "test_loss": 2.0030108623504637, "test_acc": 0.6045, "lyapunov": null, "grad_norm": 0.557765074009711, "grad_max_sv": 0.25009447410702706, "grad_min_sv": 9.674274866248132e-09, "grad_condition": 671563833.1462272, "lr": 0.0002320866025105016, "time_sec": 15.537469863891602 }, { "epoch": 103, "train_loss": 0.22944483037471772, "train_acc": 0.9257, "test_loss": 1.997948205947876, "test_acc": 0.6021, "lyapunov": null, "grad_norm": 0.5530501913094669, "grad_max_sv": 0.25403534434735775, "grad_min_sv": 9.987440614811493e-09, "grad_condition": 64606423.56909867, "lr": 0.0002233042253783278, "time_sec": 15.524824619293213 }, { "epoch": 104, "train_loss": 0.2232392775917053, "train_acc": 0.92808, "test_loss": 1.916127438735962, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.5470142147101442, "grad_max_sv": 0.2518034357577562, "grad_min_sv": 9.64682456273784e-09, "grad_condition": 523753099.18247145, "lr": 0.000214643216157784, "time_sec": 15.519572973251343 }, { "epoch": 105, "train_loss": 0.21899011870384216, "train_acc": 0.93022, "test_loss": 1.9813644931793213, "test_acc": 0.6042, "lyapunov": null, "grad_norm": 0.540595572944098, "grad_max_sv": 0.25836079344153406, "grad_min_sv": 9.721760932390744e-09, "grad_condition": 149408798.18128103, "lr": 0.00020610737385376332, "time_sec": 15.511976957321167 }, { "epoch": 106, "train_loss": 0.22239319385528564, "train_acc": 0.9288, "test_loss": 2.019803592300415, "test_acc": 0.6062, "lyapunov": null, "grad_norm": 0.5444023817051111, "grad_max_sv": 0.2558960601687431, "grad_min_sv": 9.743871165522958e-09, "grad_condition": 421456811.7162399, "lr": 0.00019770044256881242, "time_sec": 15.492303371429443 }, { "epoch": 107, "train_loss": 0.21911219958305359, "train_acc": 0.92724, "test_loss": 1.9594658828735352, "test_acc": 0.6122, "lyapunov": null, "grad_norm": 0.5463060896750315, "grad_max_sv": 0.25181276090443133, "grad_min_sv": 9.477817535397808e-09, "grad_condition": 260599469.65846786, "lr": 0.0001894261098608447, "time_sec": 15.511865139007568 }, { "epoch": 108, "train_loss": 0.2136860816383362, "train_acc": 0.93128, "test_loss": 1.9913309350967408, "test_acc": 0.6093, "lyapunov": null, "grad_norm": 0.5352068921664158, "grad_max_sv": 0.2675321064889431, "grad_min_sv": 1.0163352071659035e-08, "grad_condition": 3452227132.4482284, "lr": 0.000181288005125655, "time_sec": 15.58255934715271 }, { "epoch": 109, "train_loss": 0.21131246563911438, "train_acc": 0.93124, "test_loss": 1.9869737873077393, "test_acc": 0.6101, "lyapunov": null, "grad_norm": 0.5344952417105377, "grad_max_sv": 0.2572028797119856, "grad_min_sv": 9.894322512259829e-09, "grad_condition": 825239604.2039155, "lr": 0.0001732896980049473, "time_sec": 15.527096509933472 }, { "epoch": 110, "train_loss": 0.20613145572185515, "train_acc": 0.93496, "test_loss": 1.9642673852920531, "test_acc": 0.6083, "lyapunov": null, "grad_norm": 0.5266562322432973, "grad_max_sv": 0.25352666079998015, "grad_min_sv": 9.363287075498869e-09, "grad_condition": 505733273.3952273, "lr": 0.00016543469682057076, "time_sec": 15.536001443862915 }, { "epoch": 111, "train_loss": 0.20270503174304963, "train_acc": 0.93508, "test_loss": 1.9903694719314575, "test_acc": 0.608, "lyapunov": null, "grad_norm": 0.5210342707384447, "grad_max_sv": 0.2542009174823761, "grad_min_sv": 9.446510174006967e-09, "grad_condition": 286370629.6135062, "lr": 0.00015772644703565552, "time_sec": 15.513093948364258 }, { "epoch": 112, "train_loss": 0.20146147197723388, "train_acc": 0.93366, "test_loss": 2.0144760524749756, "test_acc": 0.6097, "lyapunov": null, "grad_norm": 0.5269979725551543, "grad_max_sv": 0.26795426234602926, "grad_min_sv": 9.357044586204288e-09, "grad_condition": 370288038.01884973, "lr": 0.00015016832974331713, "time_sec": 15.502255916595459 }, { "epoch": 113, "train_loss": 0.19924361347198485, "train_acc": 0.93656, "test_loss": 2.037332961463928, "test_acc": 0.6045, "lyapunov": null, "grad_norm": 0.5185296845346113, "grad_max_sv": 0.2515675876289606, "grad_min_sv": 9.252139900398081e-09, "grad_condition": 112959773.59806451, "lr": 0.00014276366018359834, "time_sec": 15.511096477508545 }, { "epoch": 114, "train_loss": 0.1925122591304779, "train_acc": 0.9381, "test_loss": 2.001781312942505, "test_acc": 0.6067, "lyapunov": null, "grad_norm": 0.512080843138899, "grad_max_sv": 0.2638113047927618, "grad_min_sv": 9.222902344467079e-09, "grad_condition": 702867317.5417335, "lr": 0.00013551568628929425, "time_sec": 15.528293132781982 }, { "epoch": 115, "train_loss": 0.1863429721736908, "train_acc": 0.94024, "test_loss": 1.9896372226715089, "test_acc": 0.6147, "lyapunov": null, "grad_norm": 0.5052730414811996, "grad_max_sv": 0.239008704200387, "grad_min_sv": 8.86921835820207e-09, "grad_condition": 1285263365.3241801, "lr": 0.00012842758726130276, "time_sec": 15.514945983886719 }, { "epoch": 116, "train_loss": 0.18872571726799012, "train_acc": 0.93914, "test_loss": 2.0415555866241455, "test_acc": 0.6066, "lyapunov": null, "grad_norm": 0.5103345009623144, "grad_max_sv": 0.24828836917877198, "grad_min_sv": 9.405215367630503e-09, "grad_condition": 207294853.39805278, "lr": 0.0001215024721741218, "time_sec": 15.541447639465332 }, { "epoch": 117, "train_loss": 0.18968458090782164, "train_acc": 0.93852, "test_loss": 2.043529853057861, "test_acc": 0.6064, "lyapunov": null, "grad_norm": 0.5117797700108315, "grad_max_sv": 0.25188570134341715, "grad_min_sv": 9.368504555202357e-09, "grad_condition": 350583787.5469278, "lr": 0.00011474337861210538, "time_sec": 15.519954681396484 }, { "epoch": 118, "train_loss": 0.18446471235752104, "train_acc": 0.94032, "test_loss": 2.0161501600265503, "test_acc": 0.611, "lyapunov": null, "grad_norm": 0.5034586286350297, "grad_max_sv": 0.24743926264345645, "grad_min_sv": 9.410030827038682e-09, "grad_condition": 1867541501.3184059, "lr": 0.00010815327133708009, "time_sec": 15.52394437789917 }, { "epoch": 119, "train_loss": 0.18162137420654298, "train_acc": 0.94302, "test_loss": 2.045531623840332, "test_acc": 0.6089, "lyapunov": null, "grad_norm": 0.4988474494797281, "grad_max_sv": 0.2458579033613205, "grad_min_sv": 9.119631047809635e-09, "grad_condition": 646958702.124923, "lr": 0.00010173504098790182, "time_sec": 15.515710353851318 }, { "epoch": 120, "train_loss": 0.17938962819099427, "train_acc": 0.94308, "test_loss": 2.0503937309265137, "test_acc": 0.6077, "lyapunov": null, "grad_norm": 0.4989562559637299, "grad_max_sv": 0.2459786232560873, "grad_min_sv": 9.11741269214554e-09, "grad_condition": 412394597.02274954, "lr": 9.549150281252629e-05, "time_sec": 15.50988483428955 }, { "epoch": 121, "train_loss": 0.17874448727607728, "train_acc": 0.9433, "test_loss": 1.9961147312164307, "test_acc": 0.6151, "lyapunov": null, "grad_norm": 0.4935280058170082, "grad_max_sv": 0.24326966032385827, "grad_min_sv": 9.25761599965963e-09, "grad_condition": 299984759.10134274, "lr": 8.942539543314794e-05, "time_sec": 15.528467416763306 }, { "epoch": 122, "train_loss": 0.17431395033836364, "train_acc": 0.94446, "test_loss": 2.038390445327759, "test_acc": 0.613, "lyapunov": null, "grad_norm": 0.48926666642054484, "grad_max_sv": 0.23983839638531207, "grad_min_sv": 8.987133019505365e-09, "grad_condition": 372068253.35925686, "lr": 8.353937964495024e-05, "time_sec": 15.500731706619263 }, { "epoch": 123, "train_loss": 0.1746806291246414, "train_acc": 0.94498, "test_loss": 2.0120771438598632, "test_acc": 0.6099, "lyapunov": null, "grad_norm": 0.48962253985732923, "grad_max_sv": 0.23851457759737968, "grad_min_sv": 8.603977001459158e-09, "grad_condition": 1007854799.2213293, "lr": 7.783603724899243e-05, "time_sec": 15.516981840133667 }, { "epoch": 124, "train_loss": 0.17128678526878358, "train_acc": 0.94656, "test_loss": 2.0720390872955323, "test_acc": 0.6088, "lyapunov": null, "grad_norm": 0.4869814196810216, "grad_max_sv": 0.2417709030210972, "grad_min_sv": 9.009437708026868e-09, "grad_condition": 145836314.2500567, "lr": 7.231786991974666e-05, "time_sec": 15.496051549911499 }, { "epoch": 125, "train_loss": 0.17059236883163453, "train_acc": 0.94604, "test_loss": 2.0477584241867066, "test_acc": 0.6122, "lyapunov": null, "grad_norm": 0.4843155728593804, "grad_max_sv": 0.2388555094599724, "grad_min_sv": 8.632761457245953e-09, "grad_condition": 270912168.9760497, "lr": 6.698729810778072e-05, "time_sec": 15.507468223571777 }, { "epoch": 126, "train_loss": 0.1733051071071625, "train_acc": 0.94568, "test_loss": 2.0736024877548216, "test_acc": 0.6062, "lyapunov": null, "grad_norm": 0.4894754419923655, "grad_max_sv": 0.2332348022609949, "grad_min_sv": 8.863469305384064e-09, "grad_condition": 160444601.063775, "lr": 6.184665997806817e-05, "time_sec": 15.507078647613525 }, { "epoch": 127, "train_loss": 0.16721239070892335, "train_acc": 0.9461, "test_loss": 2.0207285331726075, "test_acc": 0.6115, "lyapunov": null, "grad_norm": 0.4795404458508196, "grad_max_sv": 0.23950408175587654, "grad_min_sv": 8.801710726718485e-09, "grad_condition": 1343442143.4331565, "lr": 5.6898210384392595e-05, "time_sec": 15.510753154754639 }, { "epoch": 128, "train_loss": 0.16301859991550446, "train_acc": 0.94872, "test_loss": 2.0851793113708497, "test_acc": 0.6103, "lyapunov": null, "grad_norm": 0.4714155804221718, "grad_max_sv": 0.23401366584002972, "grad_min_sv": 8.772188082482521e-09, "grad_condition": 704162454.9287102, "lr": 5.214411988029363e-05, "time_sec": 15.514019966125488 }, { "epoch": 129, "train_loss": 0.16865292779922486, "train_acc": 0.94554, "test_loss": 2.0298268291473387, "test_acc": 0.6124, "lyapunov": null, "grad_norm": 0.4834939277959604, "grad_max_sv": 0.23208196237683296, "grad_min_sv": 8.83715973165871e-09, "grad_condition": 657084742.2965086, "lr": 4.7586473766990294e-05, "time_sec": 15.501888990402222 }, { "epoch": 130, "train_loss": 0.16090039955615998, "train_acc": 0.94934, "test_loss": 2.003493827056885, "test_acc": 0.6146, "lyapunov": null, "grad_norm": 0.4705215229572171, "grad_max_sv": 0.23428524732589723, "grad_min_sv": 8.827295219608623e-09, "grad_condition": 132321813.8931369, "lr": 4.32272711786996e-05, "time_sec": 15.520491600036621 }, { "epoch": 131, "train_loss": 0.16265953367233277, "train_acc": 0.94782, "test_loss": 2.0326833637237547, "test_acc": 0.6098, "lyapunov": null, "grad_norm": 0.4733595950570731, "grad_max_sv": 0.2481051605194807, "grad_min_sv": 8.921660872021013e-09, "grad_condition": 1308927492.8875818, "lr": 3.906842420574966e-05, "time_sec": 15.518625020980835 }, { "epoch": 132, "train_loss": 0.16258932497501374, "train_acc": 0.94914, "test_loss": 2.0198348827362063, "test_acc": 0.6125, "lyapunov": null, "grad_norm": 0.4699519678045664, "grad_max_sv": 0.24516641050577165, "grad_min_sv": 9.013820106567064e-09, "grad_condition": 2740149017.6448007, "lr": 3.5111757055874305e-05, "time_sec": 15.513976335525513 }, { "epoch": 133, "train_loss": 0.16045542496204376, "train_acc": 0.9487, "test_loss": 2.0480993354797365, "test_acc": 0.6079, "lyapunov": null, "grad_norm": 0.47270172858917925, "grad_max_sv": 0.24782115481793882, "grad_min_sv": 8.897941883821703e-09, "grad_condition": 2462171077.7853346, "lr": 3.1359005254054254e-05, "time_sec": 15.518577098846436 }, { "epoch": 134, "train_loss": 0.1573088404560089, "train_acc": 0.95036, "test_loss": 1.996682660484314, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.467276051790063, "grad_max_sv": 0.23228747248649598, "grad_min_sv": 8.598132571376038e-09, "grad_condition": 260351989.2850774, "lr": 2.7811814881259484e-05, "time_sec": 15.509779214859009 }, { "epoch": 135, "train_loss": 0.15793343636512755, "train_acc": 0.94978, "test_loss": 2.078777936553955, "test_acc": 0.61, "lyapunov": null, "grad_norm": 0.46749496867126566, "grad_max_sv": 0.23898076675832272, "grad_min_sv": 8.952387563860784e-09, "grad_condition": 451518473.6951105, "lr": 2.4471741852423218e-05, "time_sec": 15.52340030670166 }, { "epoch": 136, "train_loss": 0.154298712348938, "train_acc": 0.9515, "test_loss": 1.9956215568542481, "test_acc": 0.6138, "lyapunov": null, "grad_norm": 0.4608054622581305, "grad_max_sv": 0.2408101461827755, "grad_min_sv": 8.805307293241817e-09, "grad_condition": 1102254676.5159357, "lr": 2.1340251233966362e-05, "time_sec": 15.507319211959839 }, { "epoch": 137, "train_loss": 0.15331442908525467, "train_acc": 0.95256, "test_loss": 2.0495632625579834, "test_acc": 0.6123, "lyapunov": null, "grad_norm": 0.4574770378660416, "grad_max_sv": 0.23036178909242153, "grad_min_sv": 8.661849632126891e-09, "grad_condition": 506789914.31804866, "lr": 1.8418716601170932e-05, "time_sec": 15.507285833358765 }, { "epoch": 138, "train_loss": 0.1548746111679077, "train_acc": 0.9515, "test_loss": 2.0342879112243653, "test_acc": 0.6092, "lyapunov": null, "grad_norm": 0.4633719984784024, "grad_max_sv": 0.23631713092327117, "grad_min_sv": 8.577337108357351e-09, "grad_condition": 2670530904.2886295, "lr": 1.570841943568445e-05, "time_sec": 15.521555662155151 }, { "epoch": 139, "train_loss": 0.15485820642471312, "train_acc": 0.95088, "test_loss": 2.107874339675903, "test_acc": 0.604, "lyapunov": null, "grad_norm": 0.4629261012072699, "grad_max_sv": 0.23058986626565456, "grad_min_sv": 8.546779077175937e-09, "grad_condition": 89370689.31677079, "lr": 1.3210548563419845e-05, "time_sec": 15.533792972564697 }, { "epoch": 140, "train_loss": 0.15574090136051177, "train_acc": 0.95052, "test_loss": 2.0240774383544924, "test_acc": 0.6098, "lyapunov": null, "grad_norm": 0.46494058002876526, "grad_max_sv": 0.23221574500203132, "grad_min_sv": 8.638921627709962e-09, "grad_condition": 80246168.02315111, "lr": 1.0926199633097203e-05, "time_sec": 15.512130975723267 }, { "epoch": 141, "train_loss": 0.1591239344215393, "train_acc": 0.94958, "test_loss": 2.024708453178406, "test_acc": 0.6149, "lyapunov": null, "grad_norm": 0.46462826011917274, "grad_max_sv": 0.23822997957468034, "grad_min_sv": 8.92720696771363e-09, "grad_condition": 4042860284.9715805, "lr": 8.856374635655688e-06, "time_sec": 15.50205683708191 }, { "epoch": 142, "train_loss": 0.1531704497528076, "train_acc": 0.95164, "test_loss": 2.019575048828125, "test_acc": 0.6145, "lyapunov": null, "grad_norm": 0.45691454501139306, "grad_max_sv": 0.2273581113666296, "grad_min_sv": 8.328775530700144e-09, "grad_condition": 1373651140.614626, "lr": 7.001981464747503e-06, "time_sec": 15.521899938583374 }, { "epoch": 143, "train_loss": 0.15698250900268554, "train_acc": 0.94968, "test_loss": 2.0042268390655518, "test_acc": 0.6097, "lyapunov": null, "grad_norm": 0.46686753330324193, "grad_max_sv": 0.23650417439639568, "grad_min_sv": 8.831455570535232e-09, "grad_condition": 482562028.10267067, "lr": 5.3638335185058295e-06, "time_sec": 15.537745237350464 }, { "epoch": 144, "train_loss": 0.15602278783798218, "train_acc": 0.95138, "test_loss": 2.042717301368713, "test_acc": 0.611, "lyapunov": null, "grad_norm": 0.46083256086412094, "grad_max_sv": 0.23666680604219437, "grad_min_sv": 8.818174148696178e-09, "grad_condition": 276670204.88561904, "lr": 3.942649342761114e-06, "time_sec": 15.521801948547363 }, { "epoch": 145, "train_loss": 0.15351612282276153, "train_acc": 0.95176, "test_loss": 2.0216105178833006, "test_acc": 0.6124, "lyapunov": null, "grad_norm": 0.4578762379981558, "grad_max_sv": 0.21950803697109222, "grad_min_sv": 8.404475567989662e-09, "grad_condition": 6256996699.314726, "lr": 2.7390523158633524e-06, "time_sec": 15.50935411453247 }, { "epoch": 146, "train_loss": 0.15463469685077666, "train_acc": 0.95138, "test_loss": 1.9923904767990113, "test_acc": 0.6146, "lyapunov": null, "grad_norm": 0.4604794709370396, "grad_max_sv": 0.23074053600430489, "grad_min_sv": 8.697518219221225e-09, "grad_condition": 857409957.1641747, "lr": 1.7535703752478133e-06, "time_sec": 15.525001287460327 }, { "epoch": 147, "train_loss": 0.15173500085830688, "train_acc": 0.95292, "test_loss": 2.0695271726608278, "test_acc": 0.6111, "lyapunov": null, "grad_norm": 0.4579307395851847, "grad_max_sv": 0.24183545261621475, "grad_min_sv": 8.57581264745045e-09, "grad_condition": 811599787.3349051, "lr": 9.866357858642196e-07, "time_sec": 15.52645206451416 }, { "epoch": 148, "train_loss": 0.15419637537956238, "train_acc": 0.95064, "test_loss": 2.059994563674927, "test_acc": 0.6067, "lyapunov": null, "grad_norm": 0.4599018124122232, "grad_max_sv": 0.23474312983453274, "grad_min_sv": 9.05704030905452e-09, "grad_condition": 153015326.96145612, "lr": 4.38584950570808e-07, "time_sec": 15.522296905517578 }, { "epoch": 149, "train_loss": 0.15387048045158386, "train_acc": 0.95202, "test_loss": 2.021223978805542, "test_acc": 0.6131, "lyapunov": null, "grad_norm": 0.45892673603732886, "grad_max_sv": 0.23917307555675507, "grad_min_sv": 8.54765248256041e-09, "grad_condition": 282516990.135565, "lr": 1.096582625772501e-07, "time_sec": 15.493387222290039 }, { "epoch": 150, "train_loss": 0.14960056081056594, "train_acc": 0.95382, "test_loss": 2.009403101348877, "test_acc": 0.6142, "lyapunov": null, "grad_norm": 0.4516160601649041, "grad_max_sv": 0.23220950104296206, "grad_min_sv": 8.634985401440986e-09, "grad_condition": 1119985917.5419166, "lr": 0.0, "time_sec": 15.502899169921875 } ], "8": [ { "epoch": 1, "train_loss": 4.612606842651367, "train_acc": 0.05934, "test_loss": 4.430249005126953, "test_acc": 0.0547, "lyapunov": null, "grad_norm": 6.270141227832012, "grad_max_sv": 5.356529116630554, "grad_min_sv": 1.0947098767893904e-07, "grad_condition": 215195113.11712712, "lr": 0.0009998903417374227, "time_sec": 32.60336875915527 }, { "epoch": 2, "train_loss": 3.9147449421691896, "train_acc": 0.11836, "test_loss": 4.028561441802979, "test_acc": 0.0982, "lyapunov": null, "grad_norm": 4.747243571853921, "grad_max_sv": 4.05106902718544, "grad_min_sv": 8.568258646965421e-08, "grad_condition": 545107965.2871394, "lr": 0.0009995614150494292, "time_sec": 32.505430459976196 }, { "epoch": 3, "train_loss": 3.5624093733215334, "train_acc": 0.16334, "test_loss": 3.77226120300293, "test_acc": 0.1374, "lyapunov": null, "grad_norm": 3.93250289804397, "grad_max_sv": 3.243712919950485, "grad_min_sv": 7.186751209697917e-08, "grad_condition": 88711185.58982365, "lr": 0.0009990133642141358, "time_sec": 32.51404023170471 }, { "epoch": 4, "train_loss": 3.3006829078674316, "train_acc": 0.20094, "test_loss": 3.4272261234283445, "test_acc": 0.1834, "lyapunov": null, "grad_norm": 3.319092979228889, "grad_max_sv": 2.5326511025428773, "grad_min_sv": 6.180275069489483e-08, "grad_condition": 54405947.77847425, "lr": 0.0009982464296247522, "time_sec": 32.52905559539795 }, { "epoch": 5, "train_loss": 3.0730740076446534, "train_acc": 0.24396, "test_loss": 3.2210192291259765, "test_acc": 0.2218, "lyapunov": null, "grad_norm": 2.8429187472839956, "grad_max_sv": 2.069159355759621, "grad_min_sv": 5.258070004746096e-08, "grad_condition": 221832198.05063334, "lr": 0.0009972609476841367, "time_sec": 32.5269730091095 }, { "epoch": 6, "train_loss": 2.8943703575897217, "train_acc": 0.27524, "test_loss": 3.2233618530273436, "test_acc": 0.2301, "lyapunov": null, "grad_norm": 2.489126623121483, "grad_max_sv": 1.7037211507558823, "grad_min_sv": 4.641174645991786e-08, "grad_condition": 69020973.60049818, "lr": 0.000996057350657239, "time_sec": 32.522809982299805 }, { "epoch": 7, "train_loss": 2.7278697608184816, "train_acc": 0.30568, "test_loss": 2.7846542739868165, "test_acc": 0.3021, "lyapunov": null, "grad_norm": 2.2145469317565336, "grad_max_sv": 1.4053084224462509, "grad_min_sv": 4.121676469709401e-08, "grad_condition": 74031008.12531385, "lr": 0.000994636166481494, "time_sec": 32.5133273601532 }, { "epoch": 8, "train_loss": 2.5846466691589356, "train_acc": 0.33468, "test_loss": 2.6393014106750488, "test_acc": 0.3355, "lyapunov": null, "grad_norm": 2.001252586211609, "grad_max_sv": 1.2068818539381028, "grad_min_sv": 3.724083600525896e-08, "grad_condition": 111617642.9828302, "lr": 0.0009929980185352525, "time_sec": 32.54776215553284 }, { "epoch": 9, "train_loss": 2.4496477169036863, "train_acc": 0.36334, "test_loss": 2.6101227111816407, "test_acc": 0.338, "lyapunov": null, "grad_norm": 1.8212885788905564, "grad_max_sv": 1.0235964789986611, "grad_min_sv": 3.432924873258969e-08, "grad_condition": 33560453.54798009, "lr": 0.0009911436253643444, "time_sec": 32.51866698265076 }, { "epoch": 10, "train_loss": 2.3403686044311525, "train_acc": 0.38794, "test_loss": 2.52991734085083, "test_acc": 0.3506, "lyapunov": null, "grad_norm": 1.6843997430422568, "grad_max_sv": 0.8722436726093292, "grad_min_sv": 3.162951408564041e-08, "grad_condition": 41826895.787083015, "lr": 0.0009890738003669028, "time_sec": 32.545666456222534 }, { "epoch": 11, "train_loss": 2.2328610494232177, "train_acc": 0.4093, "test_loss": 2.4910150177001955, "test_acc": 0.3614, "lyapunov": null, "grad_norm": 1.602309204488071, "grad_max_sv": 0.7984312251210213, "grad_min_sv": 3.0149957178093877e-08, "grad_condition": 42410766.28650923, "lr": 0.00098678945143658, "time_sec": 32.538198471069336 }, { "epoch": 12, "train_loss": 2.143996323623657, "train_acc": 0.42864, "test_loss": 2.4733912868499757, "test_acc": 0.371, "lyapunov": null, "grad_norm": 1.5058778232189263, "grad_max_sv": 0.7046674489974976, "grad_min_sv": 2.8541812209514905e-08, "grad_condition": 89676864.87927453, "lr": 0.0009842915805643154, "time_sec": 32.55523920059204 }, { "epoch": 13, "train_loss": 2.0627913328552245, "train_acc": 0.44824, "test_loss": 2.3573100704193117, "test_acc": 0.3883, "lyapunov": null, "grad_norm": 1.4381799734328438, "grad_max_sv": 0.657113502919674, "grad_min_sv": 2.6757648968755986e-08, "grad_condition": 44542952.01193309, "lr": 0.000981581283398829, "time_sec": 32.53194808959961 }, { "epoch": 14, "train_loss": 2.0010124866104126, "train_acc": 0.45794, "test_loss": 2.2445085243225096, "test_acc": 0.4153, "lyapunov": null, "grad_norm": 1.3839283952743018, "grad_max_sv": 0.6215245097875595, "grad_min_sv": 2.586353823885723e-08, "grad_condition": 32103062.13610636, "lr": 0.0009786597487660333, "time_sec": 32.547112703323364 }, { "epoch": 15, "train_loss": 1.9416577011489868, "train_acc": 0.47534, "test_loss": 2.2182875526428223, "test_acc": 0.4247, "lyapunov": null, "grad_norm": 1.3285678956385127, "grad_max_sv": 0.5932768613100052, "grad_min_sv": 2.5034504780308e-08, "grad_condition": 29217346.01697495, "lr": 0.0009755282581475766, "time_sec": 32.527819871902466 }, { "epoch": 16, "train_loss": 1.873101312637329, "train_acc": 0.48986, "test_loss": 2.2290160217285155, "test_acc": 0.4272, "lyapunov": null, "grad_norm": 1.2913331830478172, "grad_max_sv": 0.5665568478405476, "grad_min_sv": 2.474239251260002e-08, "grad_condition": 27395673.607036375, "lr": 0.0009721881851187403, "time_sec": 32.52952456474304 }, { "epoch": 17, "train_loss": 1.8097029363250732, "train_acc": 0.50292, "test_loss": 2.2615955074310303, "test_acc": 0.424, "lyapunov": null, "grad_norm": 1.252294761267169, "grad_max_sv": 0.5210624538362026, "grad_min_sv": 2.3697808424968936e-08, "grad_condition": 114051245.48515114, "lr": 0.0009686409947459456, "time_sec": 32.54529142379761 }, { "epoch": 18, "train_loss": 1.747176973838806, "train_acc": 0.51946, "test_loss": 2.2190833429336547, "test_acc": 0.4281, "lyapunov": null, "grad_norm": 1.213131360578199, "grad_max_sv": 0.5172027304768563, "grad_min_sv": 2.289411261818808e-08, "grad_condition": 51051175.59109087, "lr": 0.0009648882429441254, "time_sec": 32.51650047302246 }, { "epoch": 19, "train_loss": 1.694791968383789, "train_acc": 0.5301, "test_loss": 2.2439287574768065, "test_acc": 0.4362, "lyapunov": null, "grad_norm": 1.1797460355462452, "grad_max_sv": 0.4871015749871731, "grad_min_sv": 2.21617759829304e-08, "grad_condition": 166781679.9487027, "lr": 0.00096093157579425, "time_sec": 32.51687932014465 }, { "epoch": 20, "train_loss": 1.6451108572006226, "train_acc": 0.54392, "test_loss": 2.30450572013855, "test_acc": 0.4271, "lyapunov": null, "grad_norm": 1.1471849936044856, "grad_max_sv": 0.47273003607988356, "grad_min_sv": 2.1620291118518155e-08, "grad_condition": 25041556.16833921, "lr": 0.0009567727288213001, "time_sec": 32.532697916030884 }, { "epoch": 21, "train_loss": 1.6014679947662354, "train_acc": 0.55142, "test_loss": 2.1664475830078125, "test_acc": 0.4584, "lyapunov": null, "grad_norm": 1.1229957179757897, "grad_max_sv": 0.4562165729701519, "grad_min_sv": 2.1112780196341775e-08, "grad_condition": 26298334.51243094, "lr": 0.0009524135262330095, "time_sec": 32.53035640716553 }, { "epoch": 22, "train_loss": 1.5620909811401367, "train_acc": 0.5613, "test_loss": 2.162712843322754, "test_acc": 0.4535, "lyapunov": null, "grad_norm": 1.1030961025754331, "grad_max_sv": 0.4406334914267063, "grad_min_sv": 2.045089818741852e-08, "grad_condition": 43337785.20413343, "lr": 0.0009478558801197061, "time_sec": 32.51555895805359 }, { "epoch": 23, "train_loss": 1.5185724276351928, "train_acc": 0.56968, "test_loss": 2.1629050983428955, "test_acc": 0.4642, "lyapunov": null, "grad_norm": 1.0796470270409146, "grad_max_sv": 0.4365608513355255, "grad_min_sv": 2.0348640585379775e-08, "grad_condition": 199103454.04638118, "lr": 0.000943101789615607, "time_sec": 32.51700782775879 }, { "epoch": 24, "train_loss": 1.4762262714385985, "train_acc": 0.58122, "test_loss": 2.0623104194641115, "test_acc": 0.4808, "lyapunov": null, "grad_norm": 1.058223580636924, "grad_max_sv": 0.422040344029665, "grad_min_sv": 1.999172487554546e-08, "grad_condition": 26445060.697539486, "lr": 0.0009381533400219313, "time_sec": 32.54439735412598 }, { "epoch": 25, "train_loss": 1.4411011653900145, "train_acc": 0.58896, "test_loss": 2.168187129974365, "test_acc": 0.4692, "lyapunov": null, "grad_norm": 1.0360388595339232, "grad_max_sv": 0.4249138444662094, "grad_min_sv": 1.99582824841546e-08, "grad_condition": 246451377.91849524, "lr": 0.0009330127018922189, "time_sec": 32.548271894454956 }, { "epoch": 26, "train_loss": 1.4043142713928223, "train_acc": 0.59902, "test_loss": 2.0536590896606444, "test_acc": 0.4891, "lyapunov": null, "grad_norm": 1.0113140938455152, "grad_max_sv": 0.3988976672291756, "grad_min_sv": 1.8759028042047988e-08, "grad_condition": 37432251.439904764, "lr": 0.000927682130080253, "time_sec": 32.561890840530396 }, { "epoch": 27, "train_loss": 1.3714225146484376, "train_acc": 0.60766, "test_loss": 2.2935733531951903, "test_acc": 0.4525, "lyapunov": null, "grad_norm": 1.0021764966836944, "grad_max_sv": 0.3959275037050247, "grad_min_sv": 1.8507436513881537e-08, "grad_condition": 44956111.71393384, "lr": 0.0009221639627510072, "time_sec": 32.53670048713684 }, { "epoch": 28, "train_loss": 1.3370341487121582, "train_acc": 0.61666, "test_loss": 2.151699178314209, "test_acc": 0.4715, "lyapunov": null, "grad_norm": 0.9794476786709188, "grad_max_sv": 0.39209934026002885, "grad_min_sv": 1.867815887374169e-08, "grad_condition": 35054340.009755686, "lr": 0.0009164606203550494, "time_sec": 32.54069757461548 }, { "epoch": 29, "train_loss": 1.3072684922790527, "train_acc": 0.62288, "test_loss": 2.177260079193115, "test_acc": 0.4723, "lyapunov": null, "grad_norm": 0.9630039914022892, "grad_max_sv": 0.38177175372838973, "grad_min_sv": 1.8039237006939324e-08, "grad_condition": 32222597.95523299, "lr": 0.0009105746045668516, "time_sec": 32.513834953308105 }, { "epoch": 30, "train_loss": 1.2830923750686645, "train_acc": 0.63006, "test_loss": 2.2779099143981933, "test_acc": 0.4655, "lyapunov": null, "grad_norm": 0.9518974286811641, "grad_max_sv": 0.38100970312953, "grad_min_sv": 1.788316939428658e-08, "grad_condition": 99211564.21329594, "lr": 0.0009045084971874733, "time_sec": 32.5218071937561 }, { "epoch": 31, "train_loss": 1.244770231819153, "train_acc": 0.6375, "test_loss": 2.1691842304229736, "test_acc": 0.4808, "lyapunov": null, "grad_norm": 0.9340551179231076, "grad_max_sv": 0.36914008632302286, "grad_min_sv": 1.7114106357074555e-08, "grad_condition": 29377579.043874025, "lr": 0.0008982649590120977, "time_sec": 32.50562572479248 }, { "epoch": 32, "train_loss": 1.2236427535629273, "train_acc": 0.64292, "test_loss": 2.128678413200378, "test_acc": 0.4897, "lyapunov": null, "grad_norm": 0.9308816117267062, "grad_max_sv": 0.3699117600917816, "grad_min_sv": 1.7350169867480502e-08, "grad_condition": 29708594.41851766, "lr": 0.0008918467286629196, "time_sec": 32.53521537780762 }, { "epoch": 33, "train_loss": 1.1827713982772827, "train_acc": 0.65544, "test_loss": 2.1373632209777833, "test_acc": 0.5017, "lyapunov": null, "grad_norm": 0.9081423627717244, "grad_max_sv": 0.3551614835858345, "grad_min_sv": 1.6811319347286718e-08, "grad_condition": 306006053.9068912, "lr": 0.0008852566213878943, "time_sec": 32.57274842262268 }, { "epoch": 34, "train_loss": 1.1642235271072388, "train_acc": 0.65892, "test_loss": 2.1604542951583863, "test_acc": 0.4885, "lyapunov": null, "grad_norm": 0.9090398412926194, "grad_max_sv": 0.35307114869356154, "grad_min_sv": 1.6331064042404696e-08, "grad_condition": 75342806.75988543, "lr": 0.000878497527825878, "time_sec": 32.53737998008728 }, { "epoch": 35, "train_loss": 1.1387675298309325, "train_acc": 0.6667, "test_loss": 2.1841554317474365, "test_acc": 0.4875, "lyapunov": null, "grad_norm": 0.8905589789768327, "grad_max_sv": 0.34435485303401947, "grad_min_sv": 1.63940996583678e-08, "grad_condition": 31858813.754447132, "lr": 0.000871572412738697, "time_sec": 32.53908848762512 }, { "epoch": 36, "train_loss": 1.112549288597107, "train_acc": 0.6711, "test_loss": 2.1255173376083376, "test_acc": 0.4972, "lyapunov": null, "grad_norm": 0.888003290237527, "grad_max_sv": 0.3482539109885693, "grad_min_sv": 1.6459002988994388e-08, "grad_condition": 106865396.27418132, "lr": 0.0008644843137107055, "time_sec": 32.52313590049744 }, { "epoch": 37, "train_loss": 1.0873542625236512, "train_acc": 0.6763, "test_loss": 2.098120114517212, "test_acc": 0.5037, "lyapunov": null, "grad_norm": 0.8726919198419328, "grad_max_sv": 0.34534994438290595, "grad_min_sv": 1.612610790874269e-08, "grad_condition": 39535112.979377694, "lr": 0.0008572363398164014, "time_sec": 32.54535698890686 }, { "epoch": 38, "train_loss": 1.0494415398788453, "train_acc": 0.6891, "test_loss": 2.1943147089004515, "test_acc": 0.4975, "lyapunov": null, "grad_norm": 0.867993871250333, "grad_max_sv": 0.3474706750363111, "grad_min_sv": 1.6011337518329062e-08, "grad_condition": 53782583.5534817, "lr": 0.0008498316702566826, "time_sec": 32.5124135017395 }, { "epoch": 39, "train_loss": 1.0355109643936158, "train_acc": 0.69258, "test_loss": 2.145528812789917, "test_acc": 0.5015, "lyapunov": null, "grad_norm": 0.8555269464693561, "grad_max_sv": 0.3424593433737755, "grad_min_sv": 1.5947514456216004e-08, "grad_condition": 33880811.6761477, "lr": 0.0008422735529643442, "time_sec": 32.515289545059204 }, { "epoch": 40, "train_loss": 1.0165967633247375, "train_acc": 0.69846, "test_loss": 2.175649596786499, "test_acc": 0.5019, "lyapunov": null, "grad_norm": 0.8376771010486573, "grad_max_sv": 0.3215891238301992, "grad_min_sv": 1.5263620372837905e-08, "grad_condition": 85010303.02194887, "lr": 0.0008345653031794289, "time_sec": 32.54841685295105 }, { "epoch": 41, "train_loss": 0.9950240628051757, "train_acc": 0.70056, "test_loss": 2.2173702697753908, "test_acc": 0.5002, "lyapunov": null, "grad_norm": 0.8305965994955763, "grad_max_sv": 0.3256087012588978, "grad_min_sv": 1.5127571602671642e-08, "grad_condition": 137474843.23784915, "lr": 0.0008267103019950526, "time_sec": 32.57811760902405 }, { "epoch": 42, "train_loss": 0.9775527880096435, "train_acc": 0.70474, "test_loss": 2.1698096994400022, "test_acc": 0.5034, "lyapunov": null, "grad_norm": 0.8275704405899154, "grad_max_sv": 0.3146204575896263, "grad_min_sv": 1.4814988586950295e-08, "grad_condition": 63410761.569527075, "lr": 0.0008187119948743447, "time_sec": 32.52773356437683 }, { "epoch": 43, "train_loss": 0.9515444298553467, "train_acc": 0.7129, "test_loss": 2.284324015045166, "test_acc": 0.4919, "lyapunov": null, "grad_norm": 0.8256111526505941, "grad_max_sv": 0.3248642094433308, "grad_min_sv": 1.5077374472538542e-08, "grad_condition": 120729497.4258703, "lr": 0.000810573890139155, "time_sec": 32.54343295097351 }, { "epoch": 44, "train_loss": 0.932089543800354, "train_acc": 0.71794, "test_loss": 2.347640796661377, "test_acc": 0.4952, "lyapunov": null, "grad_norm": 0.8221551718061502, "grad_max_sv": 0.3309069760143757, "grad_min_sv": 1.531730618592464e-08, "grad_condition": 43621618.830579884, "lr": 0.0008022995574311873, "time_sec": 32.540892362594604 }, { "epoch": 45, "train_loss": 0.9129991551589965, "train_acc": 0.72538, "test_loss": 2.3257674713134766, "test_acc": 0.4986, "lyapunov": null, "grad_norm": 0.7995996108758867, "grad_max_sv": 0.3120440490543842, "grad_min_sv": 1.4420761846635487e-08, "grad_condition": 274280638.56129825, "lr": 0.0007938926261462363, "time_sec": 32.56113886833191 }, { "epoch": 46, "train_loss": 0.8904787008476257, "train_acc": 0.72998, "test_loss": 2.3609681858062745, "test_acc": 0.4974, "lyapunov": null, "grad_norm": 0.8006123840154866, "grad_max_sv": 0.3184788428246975, "grad_min_sv": 1.479064429370236e-08, "grad_condition": 82532558.79183207, "lr": 0.0007853567838422158, "time_sec": 32.55464220046997 }, { "epoch": 47, "train_loss": 0.8791391965866089, "train_acc": 0.73118, "test_loss": 2.3235943592071533, "test_acc": 0.5011, "lyapunov": null, "grad_norm": 0.7941774318900212, "grad_max_sv": 0.31571171544492244, "grad_min_sv": 1.4471256026826751e-08, "grad_condition": 31975325.9529503, "lr": 0.0007766957746216719, "time_sec": 32.531195402145386 }, { "epoch": 48, "train_loss": 0.8462872068786621, "train_acc": 0.74152, "test_loss": 2.2702061416625976, "test_acc": 0.5127, "lyapunov": null, "grad_norm": 0.7790110299262845, "grad_max_sv": 0.31310132145881653, "grad_min_sv": 1.4011670552635525e-08, "grad_condition": 69070584.021189, "lr": 0.0007679133974894982, "time_sec": 32.550259828567505 }, { "epoch": 49, "train_loss": 0.8320243933296204, "train_acc": 0.74518, "test_loss": 2.3156275840759277, "test_acc": 0.5109, "lyapunov": null, "grad_norm": 0.7829430590909012, "grad_max_sv": 0.3146356470882893, "grad_min_sv": 1.4089187793265428e-08, "grad_condition": 233080772.68985993, "lr": 0.000759013504686565, "time_sec": 32.55922746658325 }, { "epoch": 50, "train_loss": 0.8245939933776856, "train_acc": 0.74696, "test_loss": 2.265205925178528, "test_acc": 0.5189, "lyapunov": null, "grad_norm": 0.7672411895816676, "grad_max_sv": 0.3079528912901878, "grad_min_sv": 1.4155918948415697e-08, "grad_condition": 343933636.95908105, "lr": 0.0007499999999999998, "time_sec": 32.53189420700073 }, { "epoch": 51, "train_loss": 0.7894153217315674, "train_acc": 0.7565, "test_loss": 2.3188957998275757, "test_acc": 0.5074, "lyapunov": null, "grad_norm": 0.7639570769617415, "grad_max_sv": 0.30883320979774, "grad_min_sv": 1.3941536785438969e-08, "grad_condition": 58007269.384739935, "lr": 0.0007408768370508575, "time_sec": 32.537278175354004 }, { "epoch": 52, "train_loss": 0.7845482840156556, "train_acc": 0.75934, "test_loss": 2.3104104595184327, "test_acc": 0.5194, "lyapunov": null, "grad_norm": 0.758426806815466, "grad_max_sv": 0.3017439119517803, "grad_min_sv": 1.3761643591347906e-08, "grad_condition": 64403689.199135736, "lr": 0.0007316480175599307, "time_sec": 32.567556858062744 }, { "epoch": 53, "train_loss": 0.7678517831802368, "train_acc": 0.76302, "test_loss": 2.2519205989837645, "test_acc": 0.5187, "lyapunov": null, "grad_norm": 0.7525741359749043, "grad_max_sv": 0.3043193075805902, "grad_min_sv": 1.4057699764414428e-08, "grad_condition": 603144630.5655534, "lr": 0.0007223175895924635, "time_sec": 32.54323744773865 }, { "epoch": 54, "train_loss": 0.7441292473983765, "train_acc": 0.77002, "test_loss": 2.321862815093994, "test_acc": 0.5195, "lyapunov": null, "grad_norm": 0.7385816998340842, "grad_max_sv": 0.2950198922306299, "grad_min_sv": 1.3242542280800241e-08, "grad_condition": 47788499.822593346, "lr": 0.0007128896457825361, "time_sec": 32.546525955200195 }, { "epoch": 55, "train_loss": 0.7237247510147095, "train_acc": 0.77684, "test_loss": 2.443076996231079, "test_acc": 0.5105, "lyapunov": null, "grad_norm": 0.7236745133446179, "grad_max_sv": 0.2926642097532749, "grad_min_sv": 1.3385297276298502e-08, "grad_condition": 180910825.71869814, "lr": 0.0007033683215378998, "time_sec": 32.5228271484375 }, { "epoch": 56, "train_loss": 0.714698567867279, "train_acc": 0.77636, "test_loss": 2.4090746616363528, "test_acc": 0.5073, "lyapunov": null, "grad_norm": 0.7344734039694485, "grad_max_sv": 0.2945756554603577, "grad_min_sv": 1.3372697777163517e-08, "grad_condition": 191394798.44401574, "lr": 0.0006937577932260512, "time_sec": 32.53384256362915 }, { "epoch": 57, "train_loss": 0.701706619796753, "train_acc": 0.7817, "test_loss": 2.4898623809814455, "test_acc": 0.5061, "lyapunov": null, "grad_norm": 0.7242445850699529, "grad_max_sv": 0.29475805573165414, "grad_min_sv": 1.3282284945341504e-08, "grad_condition": 139859409.2511898, "lr": 0.0006840622763423388, "time_sec": 32.55175542831421 }, { "epoch": 58, "train_loss": 0.683065224571228, "train_acc": 0.78578, "test_loss": 2.40970786857605, "test_acc": 0.5161, "lyapunov": null, "grad_norm": 0.7133541403038509, "grad_max_sv": 0.28903776630759237, "grad_min_sv": 1.2887932776279449e-08, "grad_condition": 217157653.7481032, "lr": 0.0006742860236609073, "time_sec": 32.54868960380554 }, { "epoch": 59, "train_loss": 0.658868628025055, "train_acc": 0.79364, "test_loss": 2.4330540966033936, "test_acc": 0.512, "lyapunov": null, "grad_norm": 0.7071819631685043, "grad_max_sv": 0.28152512572705746, "grad_min_sv": 1.2446668359172852e-08, "grad_condition": 53600070.902513206, "lr": 0.0006644333233692913, "time_sec": 32.54175162315369 }, { "epoch": 60, "train_loss": 0.6470879960250855, "train_acc": 0.7992, "test_loss": 2.4595475191116334, "test_acc": 0.5146, "lyapunov": null, "grad_norm": 0.7011871838547499, "grad_max_sv": 0.2868143357336521, "grad_min_sv": 1.2911446190672082e-08, "grad_condition": 55527160.04901831, "lr": 0.0006545084971874734, "time_sec": 32.56122612953186 }, { "epoch": 61, "train_loss": 0.6354982923126221, "train_acc": 0.8022, "test_loss": 2.560771873855591, "test_acc": 0.5081, "lyapunov": null, "grad_norm": 0.6984352092808961, "grad_max_sv": 0.27748913019895555, "grad_min_sv": 1.239017393675143e-08, "grad_condition": 1468960068.2366312, "lr": 0.0006445158984722354, "time_sec": 32.540645360946655 }, { "epoch": 62, "train_loss": 0.616827200679779, "train_acc": 0.80592, "test_loss": 2.4981941551208497, "test_acc": 0.5168, "lyapunov": null, "grad_norm": 0.693034220707574, "grad_max_sv": 0.27250286303460597, "grad_min_sv": 1.2243235950146896e-08, "grad_condition": 346615785.32809913, "lr": 0.0006344599103076324, "time_sec": 32.55153822898865 }, { "epoch": 63, "train_loss": 0.6024868152618408, "train_acc": 0.81298, "test_loss": 2.4579322681427, "test_acc": 0.5197, "lyapunov": null, "grad_norm": 0.6859865381743082, "grad_max_sv": 0.2814170353114605, "grad_min_sv": 1.2453174788248922e-08, "grad_condition": 71845159.85056672, "lr": 0.0006243449435824269, "time_sec": 32.56982493400574 }, { "epoch": 64, "train_loss": 0.5879015256500244, "train_acc": 0.81586, "test_loss": 2.537950067138672, "test_acc": 0.5154, "lyapunov": null, "grad_norm": 0.6770827367834238, "grad_max_sv": 0.2760712094604969, "grad_min_sv": 1.2060245246827555e-08, "grad_condition": 242477478.97334537, "lr": 0.0006141754350553275, "time_sec": 32.555153369903564 }, { "epoch": 65, "train_loss": 0.5838800269126893, "train_acc": 0.8159, "test_loss": 2.5163471378326414, "test_acc": 0.5163, "lyapunov": null, "grad_norm": 0.6785242818211942, "grad_max_sv": 0.27877960838377475, "grad_min_sv": 1.2008392599738293e-08, "grad_condition": 40446768.53559095, "lr": 0.0006039558454088793, "time_sec": 32.543633460998535 }, { "epoch": 66, "train_loss": 0.577277703781128, "train_acc": 0.81916, "test_loss": 2.4027950271606446, "test_acc": 0.53, "lyapunov": null, "grad_norm": 0.6749900226760103, "grad_max_sv": 0.2747200779616833, "grad_min_sv": 1.2062701042203639e-08, "grad_condition": 32367967.36566303, "lr": 0.000593690657292862, "time_sec": 32.588738441467285 }, { "epoch": 67, "train_loss": 0.5638121318435669, "train_acc": 0.82124, "test_loss": 2.5093120254516603, "test_acc": 0.5143, "lyapunov": null, "grad_norm": 0.6756248898956171, "grad_max_sv": 0.2708110649138689, "grad_min_sv": 1.1944636340091575e-08, "grad_condition": 75752957.05132133, "lr": 0.0005833843733580507, "time_sec": 32.55442571640015 }, { "epoch": 68, "train_loss": 0.5368257042694092, "train_acc": 0.82994, "test_loss": 2.589290417480469, "test_acc": 0.5118, "lyapunov": null, "grad_norm": 0.6598937386660447, "grad_max_sv": 0.261281393840909, "grad_min_sv": 1.1725735699075201e-08, "grad_condition": 169472540.689181, "lr": 0.0005730415142812054, "time_sec": 32.52515912055969 }, { "epoch": 69, "train_loss": 0.5388207937431335, "train_acc": 0.82916, "test_loss": 2.563585631942749, "test_acc": 0.5202, "lyapunov": null, "grad_norm": 0.6573002747793157, "grad_max_sv": 0.2725424364209175, "grad_min_sv": 1.2047364596375065e-08, "grad_condition": 444347034.8797019, "lr": 0.0005626666167821517, "time_sec": 32.586650133132935 }, { "epoch": 70, "train_loss": 0.513670022392273, "train_acc": 0.83646, "test_loss": 2.5132864803314208, "test_acc": 0.5236, "lyapunov": null, "grad_norm": 0.6431550925781278, "grad_max_sv": 0.27632256150245665, "grad_min_sv": 1.1758005316261921e-08, "grad_condition": 110006576.71894233, "lr": 0.0005522642316338265, "time_sec": 32.577406883239746 }, { "epoch": 71, "train_loss": 0.5131872615623474, "train_acc": 0.83644, "test_loss": 2.5521981464385988, "test_acc": 0.5241, "lyapunov": null, "grad_norm": 0.6453851866055248, "grad_max_sv": 0.2702975060790777, "grad_min_sv": 1.1546318178521155e-08, "grad_condition": 1790962873.9237118, "lr": 0.0005418389216661573, "time_sec": 32.55422234535217 }, { "epoch": 72, "train_loss": 0.5012564387702942, "train_acc": 0.83844, "test_loss": 2.6108884536743164, "test_acc": 0.5145, "lyapunov": null, "grad_norm": 0.641535680347223, "grad_max_sv": 0.263116517290473, "grad_min_sv": 1.133218473052533e-08, "grad_condition": 97098064.25597176, "lr": 0.0005313952597646563, "time_sec": 32.55845665931702 }, { "epoch": 73, "train_loss": 0.4879260776901245, "train_acc": 0.84454, "test_loss": 2.5678638622283936, "test_acc": 0.5233, "lyapunov": null, "grad_norm": 0.6388994964495804, "grad_max_sv": 0.26682182475924493, "grad_min_sv": 1.1433825197054715e-08, "grad_condition": 115135062.42170426, "lr": 0.0005209378268645994, "time_sec": 32.551618576049805 }, { "epoch": 74, "train_loss": 0.47297955097198485, "train_acc": 0.84948, "test_loss": 2.5823446689605714, "test_acc": 0.5234, "lyapunov": null, "grad_norm": 0.625079210207, "grad_max_sv": 0.2719780694693327, "grad_min_sv": 1.1374299929472944e-08, "grad_condition": 1819913042.7712326, "lr": 0.0005104712099416781, "time_sec": 32.56480145454407 }, { "epoch": 75, "train_loss": 0.46812099950790403, "train_acc": 0.85034, "test_loss": 2.6528441036224364, "test_acc": 0.5183, "lyapunov": null, "grad_norm": 0.6231186463016253, "grad_max_sv": 0.25995977483689786, "grad_min_sv": 1.1211473876398311e-08, "grad_condition": 1535902619.2174218, "lr": 0.0004999999999999996, "time_sec": 32.557714223861694 }, { "epoch": 76, "train_loss": 0.4614518400478363, "train_acc": 0.85322, "test_loss": 2.722090990829468, "test_acc": 0.5123, "lyapunov": null, "grad_norm": 0.6189058016152714, "grad_max_sv": 0.26107010766863825, "grad_min_sv": 1.121603938145782e-08, "grad_condition": 156852744.39388055, "lr": 0.0004895287900583212, "time_sec": 32.57050681114197 }, { "epoch": 77, "train_loss": 0.4433125625228882, "train_acc": 0.85798, "test_loss": 2.683233337402344, "test_acc": 0.5176, "lyapunov": null, "grad_norm": 0.6092718322680238, "grad_max_sv": 0.26060184724628926, "grad_min_sv": 1.0807431153128655e-08, "grad_condition": 94720998.74768767, "lr": 0.0004790621731353997, "time_sec": 32.566901445388794 }, { "epoch": 78, "train_loss": 0.43715192074775694, "train_acc": 0.85892, "test_loss": 2.8140779514312744, "test_acc": 0.5126, "lyapunov": null, "grad_norm": 0.6093756219980636, "grad_max_sv": 0.25670241452753545, "grad_min_sv": 1.0911793120807477e-08, "grad_condition": 96322404.6795116, "lr": 0.000468604740235343, "time_sec": 32.57596945762634 }, { "epoch": 79, "train_loss": 0.4312542087650299, "train_acc": 0.86156, "test_loss": 2.688641630935669, "test_acc": 0.5206, "lyapunov": null, "grad_norm": 0.6073166568575497, "grad_max_sv": 0.25702770203351977, "grad_min_sv": 1.0958630206232833e-08, "grad_condition": 250707729.3021683, "lr": 0.00045816107833384175, "time_sec": 32.56645917892456 }, { "epoch": 80, "train_loss": 0.4118970446872711, "train_acc": 0.86894, "test_loss": 2.5730819744110107, "test_acc": 0.5337, "lyapunov": null, "grad_norm": 0.5969485138195714, "grad_max_sv": 0.244117346778512, "grad_min_sv": 1.0501346974639558e-08, "grad_condition": 268969770.6987619, "lr": 0.0004477357683661729, "time_sec": 32.55648875236511 }, { "epoch": 81, "train_loss": 0.40473406177520754, "train_acc": 0.8705, "test_loss": 2.768511548614502, "test_acc": 0.5175, "lyapunov": null, "grad_norm": 0.5946234097363065, "grad_max_sv": 0.25840370543301105, "grad_min_sv": 1.0675248116140834e-08, "grad_condition": 1433985790.1272235, "lr": 0.00043733338321784746, "time_sec": 32.56024956703186 }, { "epoch": 82, "train_loss": 0.39231891386032103, "train_acc": 0.87338, "test_loss": 2.6643074661254884, "test_acc": 0.5309, "lyapunov": null, "grad_norm": 0.5900838298376547, "grad_max_sv": 0.2576967000961304, "grad_min_sv": 1.0706646371176284e-08, "grad_condition": 410914403.2919628, "lr": 0.0004269584857187939, "time_sec": 32.52906775474548 }, { "epoch": 83, "train_loss": 0.38102890924453736, "train_acc": 0.87712, "test_loss": 2.746966218185425, "test_acc": 0.5212, "lyapunov": null, "grad_norm": 0.5804702132437124, "grad_max_sv": 0.24822848811745643, "grad_min_sv": 1.0360890155157107e-08, "grad_condition": 348582315.4871143, "lr": 0.0004166156266419484, "time_sec": 32.575536489486694 }, { "epoch": 84, "train_loss": 0.37733193599700926, "train_acc": 0.87564, "test_loss": 2.7224476852416992, "test_acc": 0.5248, "lyapunov": null, "grad_norm": 0.5836201032332736, "grad_max_sv": 0.2583346772938967, "grad_min_sv": 1.070241965142084e-08, "grad_condition": 801944412.6941237, "lr": 0.0004063093427071373, "time_sec": 32.56175231933594 }, { "epoch": 85, "train_loss": 0.3640913159942627, "train_acc": 0.88294, "test_loss": 2.758930994796753, "test_acc": 0.527, "lyapunov": null, "grad_norm": 0.5660514135717984, "grad_max_sv": 0.24142069853842257, "grad_min_sv": 1.0190759017463663e-08, "grad_condition": 1202285628.3006241, "lr": 0.0003960441545911199, "time_sec": 32.5456702709198 }, { "epoch": 86, "train_loss": 0.3523704248428345, "train_acc": 0.88546, "test_loss": 2.687824221420288, "test_acc": 0.5297, "lyapunov": null, "grad_norm": 0.5608649440048047, "grad_max_sv": 0.2463057145476341, "grad_min_sv": 1.0161699044372586e-08, "grad_condition": 82146942.52646025, "lr": 0.0003858245649446718, "time_sec": 32.53918766975403 }, { "epoch": 87, "train_loss": 0.35160433542251585, "train_acc": 0.8864, "test_loss": 2.7660649963378905, "test_acc": 0.5254, "lyapunov": null, "grad_norm": 0.5647074650828036, "grad_max_sv": 0.2515272866934538, "grad_min_sv": 1.0253057474568505e-08, "grad_condition": 106198876.53293958, "lr": 0.00037565505641757235, "time_sec": 32.57175302505493 }, { "epoch": 88, "train_loss": 0.34372631204605103, "train_acc": 0.8903, "test_loss": 2.7611888675689698, "test_acc": 0.5293, "lyapunov": null, "grad_norm": 0.5539379162644149, "grad_max_sv": 0.24760488532483577, "grad_min_sv": 1.0237206365037652e-08, "grad_condition": 268378740.40175262, "lr": 0.00036554008969236695, "time_sec": 32.61865496635437 }, { "epoch": 89, "train_loss": 0.3349831074714661, "train_acc": 0.89124, "test_loss": 2.852033778381348, "test_acc": 0.5246, "lyapunov": null, "grad_norm": 0.5543234221756905, "grad_max_sv": 0.2524993114173412, "grad_min_sv": 1.0068119724645358e-08, "grad_condition": 881390959.6058903, "lr": 0.0003554841015277638, "time_sec": 32.56809163093567 }, { "epoch": 90, "train_loss": 0.3192900574111939, "train_acc": 0.8978, "test_loss": 2.8204364456176756, "test_acc": 0.5277, "lyapunov": null, "grad_norm": 0.539170960935015, "grad_max_sv": 0.23871867544949055, "grad_min_sv": 9.515663445397448e-09, "grad_condition": 82474731.67522079, "lr": 0.000345491502812526, "time_sec": 32.549994468688965 }, { "epoch": 91, "train_loss": 0.3178176963233948, "train_acc": 0.8972, "test_loss": 2.860647204208374, "test_acc": 0.527, "lyapunov": null, "grad_norm": 0.5335824951523024, "grad_max_sv": 0.24524600319564344, "grad_min_sv": 9.955028348364314e-09, "grad_condition": 189160981.0331933, "lr": 0.0003355666766307081, "time_sec": 32.5523841381073 }, { "epoch": 92, "train_loss": 0.30979349758148195, "train_acc": 0.90114, "test_loss": 2.792916820526123, "test_acc": 0.5334, "lyapunov": null, "grad_norm": 0.536022212715003, "grad_max_sv": 0.2439738731831312, "grad_min_sv": 9.802463784257254e-09, "grad_condition": 392308745.7452389, "lr": 0.00032571397633909225, "time_sec": 32.534363746643066 }, { "epoch": 93, "train_loss": 0.29998136956214905, "train_acc": 0.90294, "test_loss": 2.8000693214416503, "test_acc": 0.5371, "lyapunov": null, "grad_norm": 0.526141212631399, "grad_max_sv": 0.2302109245210886, "grad_min_sv": 9.57197021107109e-09, "grad_condition": 990380151.1551683, "lr": 0.00031593772365766094, "time_sec": 32.5524480342865 }, { "epoch": 94, "train_loss": 0.2947264695549011, "train_acc": 0.90426, "test_loss": 2.8803435722351076, "test_acc": 0.5269, "lyapunov": null, "grad_norm": 0.5244681069551711, "grad_max_sv": 0.2267349176108837, "grad_min_sv": 9.39341851901969e-09, "grad_condition": 350481322.0522052, "lr": 0.0003062422067739483, "time_sec": 32.55219221115112 }, { "epoch": 95, "train_loss": 0.2886659768772125, "train_acc": 0.90604, "test_loss": 2.9347433059692385, "test_acc": 0.5258, "lyapunov": null, "grad_norm": 0.5214353080258765, "grad_max_sv": 0.2345777176320553, "grad_min_sv": 9.640483901365155e-09, "grad_condition": 720854220.3900421, "lr": 0.00029663167846209965, "time_sec": 32.557831048965454 }, { "epoch": 96, "train_loss": 0.27894444655418393, "train_acc": 0.90976, "test_loss": 2.9434762027740478, "test_acc": 0.5285, "lyapunov": null, "grad_norm": 0.5097107775143732, "grad_max_sv": 0.2310101106762886, "grad_min_sv": 9.385787539729386e-09, "grad_condition": 526341011.33289146, "lr": 0.00028711035421746345, "time_sec": 32.542834997177124 }, { "epoch": 97, "train_loss": 0.27359901790618896, "train_acc": 0.9111, "test_loss": 2.8853713760375976, "test_acc": 0.5255, "lyapunov": null, "grad_norm": 0.5155496576192513, "grad_max_sv": 0.2377286858856678, "grad_min_sv": 9.5194454921327e-09, "grad_condition": 3878284949.6481657, "lr": 0.00027768241040753615, "time_sec": 32.55704665184021 }, { "epoch": 98, "train_loss": 0.27738544737815857, "train_acc": 0.90926, "test_loss": 2.9445196617126466, "test_acc": 0.5299, "lyapunov": null, "grad_norm": 0.5179989785468311, "grad_max_sv": 0.22777627930045127, "grad_min_sv": 9.246968936957659e-09, "grad_condition": 960537397.7931906, "lr": 0.00026835198244006903, "time_sec": 32.64381694793701 }, { "epoch": 99, "train_loss": 0.26050106247901916, "train_acc": 0.91634, "test_loss": 2.9518425941467283, "test_acc": 0.5252, "lyapunov": null, "grad_norm": 0.5021876835039283, "grad_max_sv": 0.23347571939229966, "grad_min_sv": 9.252318778490976e-09, "grad_condition": 358829344.2311903, "lr": 0.0002591231629491421, "time_sec": 32.63876390457153 }, { "epoch": 100, "train_loss": 0.258883156375885, "train_acc": 0.91784, "test_loss": 2.9451918140411375, "test_acc": 0.5271, "lyapunov": null, "grad_norm": 0.49558170482534186, "grad_max_sv": 0.22932566255331038, "grad_min_sv": 8.960364150656374e-09, "grad_condition": 133402370.68097286, "lr": 0.0002499999999999997, "time_sec": 32.63405442237854 }, { "epoch": 101, "train_loss": 0.2544194602584839, "train_acc": 0.9178, "test_loss": 2.931644026184082, "test_acc": 0.5324, "lyapunov": null, "grad_norm": 0.49432462184183484, "grad_max_sv": 0.23283861316740512, "grad_min_sv": 9.245908496593666e-09, "grad_condition": 394496802.8033221, "lr": 0.00024098649531343477, "time_sec": 32.61276388168335 }, { "epoch": 102, "train_loss": 0.2480203760242462, "train_acc": 0.92056, "test_loss": 2.8568203742980955, "test_acc": 0.5384, "lyapunov": null, "grad_norm": 0.49038134461440325, "grad_max_sv": 0.21357116661965847, "grad_min_sv": 8.517364178338947e-09, "grad_condition": 517553648.95562804, "lr": 0.0002320866025105016, "time_sec": 32.561208724975586 }, { "epoch": 103, "train_loss": 0.24091191486358643, "train_acc": 0.92288, "test_loss": 2.921445244216919, "test_acc": 0.539, "lyapunov": null, "grad_norm": 0.48403203094337405, "grad_max_sv": 0.2229804780334234, "grad_min_sv": 8.76879201030037e-09, "grad_condition": 395225985.76028645, "lr": 0.0002233042253783278, "time_sec": 32.58884024620056 }, { "epoch": 104, "train_loss": 0.2340097396659851, "train_acc": 0.92426, "test_loss": 2.952641244506836, "test_acc": 0.5359, "lyapunov": null, "grad_norm": 0.47933424227822113, "grad_max_sv": 0.21846036985516548, "grad_min_sv": 8.535758917998377e-09, "grad_condition": 633016056.7145557, "lr": 0.000214643216157784, "time_sec": 32.56481146812439 }, { "epoch": 105, "train_loss": 0.2301298531961441, "train_acc": 0.92618, "test_loss": 3.0041401138305663, "test_acc": 0.5291, "lyapunov": null, "grad_norm": 0.4740683813989447, "grad_max_sv": 0.22231761552393436, "grad_min_sv": 8.433698867145923e-09, "grad_condition": 3779496448.19964, "lr": 0.00020610737385376332, "time_sec": 32.58962845802307 }, { "epoch": 106, "train_loss": 0.23071280053138732, "train_acc": 0.92596, "test_loss": 2.902844191741943, "test_acc": 0.5388, "lyapunov": null, "grad_norm": 0.4741615782059369, "grad_max_sv": 0.22535606250166892, "grad_min_sv": 8.869640872113949e-09, "grad_condition": 162288203.3742172, "lr": 0.00019770044256881242, "time_sec": 32.57167601585388 }, { "epoch": 107, "train_loss": 0.22119897150993348, "train_acc": 0.92908, "test_loss": 2.9124989013671874, "test_acc": 0.5401, "lyapunov": null, "grad_norm": 0.4665652562574251, "grad_max_sv": 0.22006149925291538, "grad_min_sv": 8.667695651325135e-09, "grad_condition": 151185833.18543836, "lr": 0.0001894261098608447, "time_sec": 32.57570242881775 }, { "epoch": 108, "train_loss": 0.2127019773054123, "train_acc": 0.93066, "test_loss": 2.880406095504761, "test_acc": 0.5451, "lyapunov": null, "grad_norm": 0.4590032433316164, "grad_max_sv": 0.2255195803940296, "grad_min_sv": 9.011924857207053e-09, "grad_condition": 814863477.0120376, "lr": 0.000181288005125655, "time_sec": 32.57649230957031 }, { "epoch": 109, "train_loss": 0.21624571283340455, "train_acc": 0.9307, "test_loss": 2.967872815322876, "test_acc": 0.5365, "lyapunov": null, "grad_norm": 0.46217449604521815, "grad_max_sv": 0.22467305175960064, "grad_min_sv": 8.434571406850528e-09, "grad_condition": 269913512.95570815, "lr": 0.0001732896980049473, "time_sec": 32.688621520996094 }, { "epoch": 110, "train_loss": 0.21068411350250243, "train_acc": 0.93312, "test_loss": 2.9756517448425295, "test_acc": 0.5417, "lyapunov": null, "grad_norm": 0.4560381046604994, "grad_max_sv": 0.2259811393916607, "grad_min_sv": 8.584292448838432e-09, "grad_condition": 247618387.92470437, "lr": 0.00016543469682057076, "time_sec": 32.61171579360962 }, { "epoch": 111, "train_loss": 0.20692597856521605, "train_acc": 0.93424, "test_loss": 2.9772758766174316, "test_acc": 0.5401, "lyapunov": null, "grad_norm": 0.4537336475301346, "grad_max_sv": 0.22052315585315227, "grad_min_sv": 8.457724332781163e-09, "grad_condition": 209643026.63441467, "lr": 0.00015772644703565552, "time_sec": 32.74080443382263 }, { "epoch": 112, "train_loss": 0.19982836018562317, "train_acc": 0.93464, "test_loss": 2.9877874111175537, "test_acc": 0.5374, "lyapunov": null, "grad_norm": 0.4502543545130326, "grad_max_sv": 0.21837349496781827, "grad_min_sv": 8.382589276531572e-09, "grad_condition": 190131911.5426251, "lr": 0.00015016832974331713, "time_sec": 32.61341071128845 }, { "epoch": 113, "train_loss": 0.19814088920593262, "train_acc": 0.93678, "test_loss": 3.0002061031341554, "test_acc": 0.5372, "lyapunov": null, "grad_norm": 0.4475396172239947, "grad_max_sv": 0.20673769935965539, "grad_min_sv": 8.026082756024642e-09, "grad_condition": 821010169.1913308, "lr": 0.00014276366018359834, "time_sec": 32.59360718727112 }, { "epoch": 114, "train_loss": 0.19049308371543885, "train_acc": 0.93866, "test_loss": 3.0283890243530274, "test_acc": 0.5348, "lyapunov": null, "grad_norm": 0.4406442112045554, "grad_max_sv": 0.21337005980312823, "grad_min_sv": 8.07762924176763e-09, "grad_condition": 667248655.8256387, "lr": 0.00013551568628929425, "time_sec": 32.58922576904297 }, { "epoch": 115, "train_loss": 0.18477844835281373, "train_acc": 0.9408, "test_loss": 2.979667907714844, "test_acc": 0.538, "lyapunov": null, "grad_norm": 0.4338873325468347, "grad_max_sv": 0.20222999081015586, "grad_min_sv": 7.837895723032327e-09, "grad_condition": 353434541.5259349, "lr": 0.00012842758726130276, "time_sec": 32.564921617507935 }, { "epoch": 116, "train_loss": 0.1859721972846985, "train_acc": 0.93958, "test_loss": 3.0662242183685304, "test_acc": 0.5393, "lyapunov": null, "grad_norm": 0.436884545053576, "grad_max_sv": 0.2168640349060297, "grad_min_sv": 8.084562923496817e-09, "grad_condition": 9428488559.560253, "lr": 0.0001215024721741218, "time_sec": 32.58519434928894 }, { "epoch": 117, "train_loss": 0.1802575473511219, "train_acc": 0.9417, "test_loss": 2.9826597057342528, "test_acc": 0.5406, "lyapunov": null, "grad_norm": 0.42742032333852065, "grad_max_sv": 0.2029492624104023, "grad_min_sv": 7.847825115431771e-09, "grad_condition": 1633268903.8573327, "lr": 0.00011474337861210538, "time_sec": 32.59012532234192 }, { "epoch": 118, "train_loss": 0.1823931166434288, "train_acc": 0.94122, "test_loss": 3.021400856399536, "test_acc": 0.5422, "lyapunov": null, "grad_norm": 0.43215599630315543, "grad_max_sv": 0.20591359175741672, "grad_min_sv": 8.091189306514043e-09, "grad_condition": 1689348599.2248282, "lr": 0.00010815327133708009, "time_sec": 32.5699896812439 }, { "epoch": 119, "train_loss": 0.17618105165958406, "train_acc": 0.94406, "test_loss": 3.000937869644165, "test_acc": 0.5384, "lyapunov": null, "grad_norm": 0.4237935060578588, "grad_max_sv": 0.20426486507058145, "grad_min_sv": 7.760857991326308e-09, "grad_condition": 126737655.38842675, "lr": 0.00010173504098790182, "time_sec": 32.55027508735657 }, { "epoch": 120, "train_loss": 0.17707269381523133, "train_acc": 0.9433, "test_loss": 3.0262657794952394, "test_acc": 0.5423, "lyapunov": null, "grad_norm": 0.4262563994652449, "grad_max_sv": 0.20858144126832484, "grad_min_sv": 7.881152512198563e-09, "grad_condition": 309539963.7397119, "lr": 9.549150281252629e-05, "time_sec": 32.56339383125305 }, { "epoch": 121, "train_loss": 0.17405739032268525, "train_acc": 0.94424, "test_loss": 3.066022943115234, "test_acc": 0.5357, "lyapunov": null, "grad_norm": 0.4209047902648977, "grad_max_sv": 0.208182505145669, "grad_min_sv": 7.926291366831817e-09, "grad_condition": 1481844022.098684, "lr": 8.942539543314794e-05, "time_sec": 32.55572319030762 }, { "epoch": 122, "train_loss": 0.1722756038427353, "train_acc": 0.94372, "test_loss": 2.9237624008178713, "test_acc": 0.5501, "lyapunov": null, "grad_norm": 0.42147984672159844, "grad_max_sv": 0.2044668670743704, "grad_min_sv": 7.998760296129494e-09, "grad_condition": 3201646284.8678083, "lr": 8.353937964495024e-05, "time_sec": 32.587459087371826 }, { "epoch": 123, "train_loss": 0.16738181323051451, "train_acc": 0.9461, "test_loss": 3.094963736343384, "test_acc": 0.5344, "lyapunov": null, "grad_norm": 0.41903231386737333, "grad_max_sv": 0.20275984779000283, "grad_min_sv": 7.716203944308116e-09, "grad_condition": 621612446.7663743, "lr": 7.783603724899243e-05, "time_sec": 32.584996461868286 }, { "epoch": 124, "train_loss": 0.16972655351161955, "train_acc": 0.94622, "test_loss": 3.0508366065979002, "test_acc": 0.5412, "lyapunov": null, "grad_norm": 0.4200695555516322, "grad_max_sv": 0.2031144231557846, "grad_min_sv": 7.729263715579261e-09, "grad_condition": 3217546779.4275866, "lr": 7.231786991974666e-05, "time_sec": 32.571866035461426 }, { "epoch": 125, "train_loss": 0.16630077925682069, "train_acc": 0.94662, "test_loss": 3.022613596343994, "test_acc": 0.5392, "lyapunov": null, "grad_norm": 0.41758178037006294, "grad_max_sv": 0.20861225724220275, "grad_min_sv": 7.841609751726292e-09, "grad_condition": 338985297.6185556, "lr": 6.698729810778072e-05, "time_sec": 32.5552761554718 }, { "epoch": 126, "train_loss": 0.15956245457649232, "train_acc": 0.94972, "test_loss": 3.0561922130584716, "test_acc": 0.5398, "lyapunov": null, "grad_norm": 0.40878054032118605, "grad_max_sv": 0.19741955921053886, "grad_min_sv": 7.37841599316065e-09, "grad_condition": 303424830.56526506, "lr": 6.184665997806817e-05, "time_sec": 32.54996180534363 }, { "epoch": 127, "train_loss": 0.15993500823020934, "train_acc": 0.9489, "test_loss": 3.026379292297363, "test_acc": 0.5441, "lyapunov": null, "grad_norm": 0.40620434130290156, "grad_max_sv": 0.20242127142846583, "grad_min_sv": 7.71886330243679e-09, "grad_condition": 171983926.969037, "lr": 5.6898210384392595e-05, "time_sec": 32.630762577056885 }, { "epoch": 128, "train_loss": 0.15721613983869553, "train_acc": 0.94976, "test_loss": 3.0123806335449217, "test_acc": 0.543, "lyapunov": null, "grad_norm": 0.40771760456255063, "grad_max_sv": 0.19883232600986958, "grad_min_sv": 7.65689685735399e-09, "grad_condition": 140452566.13847277, "lr": 5.214411988029363e-05, "time_sec": 32.56053280830383 }, { "epoch": 129, "train_loss": 0.15980393629074097, "train_acc": 0.9494, "test_loss": 3.0619752151489257, "test_acc": 0.5385, "lyapunov": null, "grad_norm": 0.40680055079987404, "grad_max_sv": 0.21151602938771247, "grad_min_sv": 7.960656847678569e-09, "grad_condition": 6835345348.5200405, "lr": 4.7586473766990294e-05, "time_sec": 32.56260585784912 }, { "epoch": 130, "train_loss": 0.1551200196647644, "train_acc": 0.95066, "test_loss": 3.0138941650390625, "test_acc": 0.5454, "lyapunov": null, "grad_norm": 0.4023235762601659, "grad_max_sv": 0.19708200730383396, "grad_min_sv": 7.800858144299192e-09, "grad_condition": 626827866.159754, "lr": 4.32272711786996e-05, "time_sec": 32.59095644950867 }, { "epoch": 131, "train_loss": 0.15415350935935973, "train_acc": 0.95194, "test_loss": 2.9972058124542236, "test_acc": 0.5443, "lyapunov": null, "grad_norm": 0.40269684147235807, "grad_max_sv": 0.20214904472231865, "grad_min_sv": 7.632781651861764e-09, "grad_condition": 3110137965.882431, "lr": 3.906842420574966e-05, "time_sec": 32.64683389663696 }, { "epoch": 132, "train_loss": 0.15071093450546263, "train_acc": 0.95362, "test_loss": 3.058548362350464, "test_acc": 0.5406, "lyapunov": null, "grad_norm": 0.3962388158117765, "grad_max_sv": 0.20194376222789287, "grad_min_sv": 7.476556948202151e-09, "grad_condition": 251161532.73020416, "lr": 3.5111757055874305e-05, "time_sec": 32.57603096961975 }, { "epoch": 133, "train_loss": 0.15083105179309844, "train_acc": 0.95186, "test_loss": 3.0908397106170655, "test_acc": 0.5372, "lyapunov": null, "grad_norm": 0.396089047457992, "grad_max_sv": 0.19243778996169567, "grad_min_sv": 7.3091202180313244e-09, "grad_condition": 798644628.4177251, "lr": 3.1359005254054254e-05, "time_sec": 32.73746132850647 }, { "epoch": 134, "train_loss": 0.14782890917301178, "train_acc": 0.95342, "test_loss": 3.050483916091919, "test_acc": 0.5423, "lyapunov": null, "grad_norm": 0.3935039829273189, "grad_max_sv": 0.1971876610070467, "grad_min_sv": 7.67425883595142e-09, "grad_condition": 2485965444.639862, "lr": 2.7811814881259484e-05, "time_sec": 32.72033095359802 }, { "epoch": 135, "train_loss": 0.1471274660015106, "train_acc": 0.95372, "test_loss": 2.9947123558044435, "test_acc": 0.5426, "lyapunov": null, "grad_norm": 0.3920191534951485, "grad_max_sv": 0.20197632759809495, "grad_min_sv": 7.500751369148018e-09, "grad_condition": 520365917.2206461, "lr": 2.4471741852423218e-05, "time_sec": 32.67989182472229 }, { "epoch": 136, "train_loss": 0.1491823548412323, "train_acc": 0.9526, "test_loss": 3.0622998500823972, "test_acc": 0.5417, "lyapunov": null, "grad_norm": 0.3958637689339096, "grad_max_sv": 0.1968228505924344, "grad_min_sv": 7.479480308540676e-09, "grad_condition": 707924605.8880411, "lr": 2.1340251233966362e-05, "time_sec": 32.66845107078552 }, { "epoch": 137, "train_loss": 0.1438249187850952, "train_acc": 0.95456, "test_loss": 3.0126154830932617, "test_acc": 0.5438, "lyapunov": null, "grad_norm": 0.3880549357238996, "grad_max_sv": 0.1975066963583231, "grad_min_sv": 7.686822375862525e-09, "grad_condition": 958291083.1124929, "lr": 1.8418716601170932e-05, "time_sec": 32.62222647666931 }, { "epoch": 138, "train_loss": 0.14332568585395813, "train_acc": 0.95562, "test_loss": 2.970457587814331, "test_acc": 0.5475, "lyapunov": null, "grad_norm": 0.387864370948264, "grad_max_sv": 0.19698900803923608, "grad_min_sv": 7.3030646496365096e-09, "grad_condition": 522257153.2510088, "lr": 1.570841943568445e-05, "time_sec": 32.588345527648926 }, { "epoch": 139, "train_loss": 0.14504710802555085, "train_acc": 0.95396, "test_loss": 3.0413112239837647, "test_acc": 0.5442, "lyapunov": null, "grad_norm": 0.39046406821011487, "grad_max_sv": 0.19658712521195412, "grad_min_sv": 7.706623579399608e-09, "grad_condition": 210757363.08798447, "lr": 1.3210548563419845e-05, "time_sec": 32.57579827308655 }, { "epoch": 140, "train_loss": 0.1440677634191513, "train_acc": 0.9551, "test_loss": 3.0336122520446778, "test_acc": 0.5421, "lyapunov": null, "grad_norm": 0.3879105148922517, "grad_max_sv": 0.20634672362357379, "grad_min_sv": 7.609137083592308e-09, "grad_condition": 799925132.5815533, "lr": 1.0926199633097203e-05, "time_sec": 32.56750822067261 }, { "epoch": 141, "train_loss": 0.1450736529636383, "train_acc": 0.9539, "test_loss": 3.0418475845336914, "test_acc": 0.542, "lyapunov": null, "grad_norm": 0.3893245206754723, "grad_max_sv": 0.19981114380061626, "grad_min_sv": 7.533249978951707e-09, "grad_condition": 1055093430.0963647, "lr": 8.856374635655688e-06, "time_sec": 32.5803439617157 }, { "epoch": 142, "train_loss": 0.14690097001075744, "train_acc": 0.9539, "test_loss": 3.085536852264404, "test_acc": 0.5402, "lyapunov": null, "grad_norm": 0.393962854701407, "grad_max_sv": 0.19642856512218715, "grad_min_sv": 7.33013154697107e-09, "grad_condition": 1287238710.5116677, "lr": 7.001981464747503e-06, "time_sec": 32.587260246276855 }, { "epoch": 143, "train_loss": 0.14333253172159194, "train_acc": 0.95502, "test_loss": 3.0491490406036377, "test_acc": 0.5422, "lyapunov": null, "grad_norm": 0.38524967986058734, "grad_max_sv": 0.1963527824729681, "grad_min_sv": 7.358908829112505e-09, "grad_condition": 554422862.0300386, "lr": 5.3638335185058295e-06, "time_sec": 32.558162450790405 }, { "epoch": 144, "train_loss": 0.14636923120975495, "train_acc": 0.95354, "test_loss": 3.061640990829468, "test_acc": 0.5427, "lyapunov": null, "grad_norm": 0.39405435868542676, "grad_max_sv": 0.20560368224978448, "grad_min_sv": 7.55005881126168e-09, "grad_condition": 511328197.16483086, "lr": 3.942649342761114e-06, "time_sec": 32.583282709121704 }, { "epoch": 145, "train_loss": 0.14265491032361985, "train_acc": 0.95596, "test_loss": 3.0034291164398192, "test_acc": 0.5447, "lyapunov": null, "grad_norm": 0.38473538959699044, "grad_max_sv": 0.20014677122235297, "grad_min_sv": 7.530181120709092e-09, "grad_condition": 337796403.57093, "lr": 2.7390523158633524e-06, "time_sec": 32.637805223464966 }, { "epoch": 146, "train_loss": 0.14478088060855865, "train_acc": 0.95472, "test_loss": 3.0147633277893067, "test_acc": 0.5419, "lyapunov": null, "grad_norm": 0.3885491395116739, "grad_max_sv": 0.19666519686579703, "grad_min_sv": 7.584344775216773e-09, "grad_condition": 547643565.9603722, "lr": 1.7535703752478133e-06, "time_sec": 32.652307748794556 }, { "epoch": 147, "train_loss": 0.14279501497268676, "train_acc": 0.9546, "test_loss": 3.0440410163879394, "test_acc": 0.541, "lyapunov": null, "grad_norm": 0.38669357310585645, "grad_max_sv": 0.21015651226043702, "grad_min_sv": 7.688521032247348e-09, "grad_condition": 469600192.5783922, "lr": 9.866357858642196e-07, "time_sec": 32.59567952156067 }, { "epoch": 148, "train_loss": 0.14565588755607606, "train_acc": 0.9541, "test_loss": 3.0802265747070314, "test_acc": 0.5416, "lyapunov": null, "grad_norm": 0.38859455199964604, "grad_max_sv": 0.19257190506905317, "grad_min_sv": 7.505198252591092e-09, "grad_condition": 881395202.1431038, "lr": 4.38584950570808e-07, "time_sec": 32.61454796791077 }, { "epoch": 149, "train_loss": 0.14538168624401093, "train_acc": 0.9543, "test_loss": 3.0341483921051027, "test_acc": 0.5461, "lyapunov": null, "grad_norm": 0.3912198061226822, "grad_max_sv": 0.19850266501307487, "grad_min_sv": 7.570504590619434e-09, "grad_condition": 1146760478.7303884, "lr": 1.096582625772501e-07, "time_sec": 32.57002377510071 }, { "epoch": 150, "train_loss": 0.14344769035339355, "train_acc": 0.95432, "test_loss": 3.151827312850952, "test_acc": 0.5351, "lyapunov": null, "grad_norm": 0.38700258459733883, "grad_max_sv": 0.19427692480385303, "grad_min_sv": 7.459068278141413e-09, "grad_condition": 795616674.0450132, "lr": 0.0, "time_sec": 32.58071160316467 } ], "12": [ { "epoch": 1, "train_loss": 4.869130941009521, "train_acc": 0.0299, "test_loss": 4.81726124420166, "test_acc": 0.0158, "lyapunov": null, "grad_norm": 5.958599870859213, "grad_max_sv": 5.32314133644104, "grad_min_sv": 1.0002176032419818e-07, "grad_condition": 117638897.02667244, "lr": 0.0009998903417374227, "time_sec": 49.630311012268066 }, { "epoch": 2, "train_loss": 4.33411005065918, "train_acc": 0.05812, "test_loss": 4.9022071792602535, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 4.4717426818192445, "grad_max_sv": 3.9425308763980866, "grad_min_sv": 7.707211335805653e-08, "grad_condition": 68733255.35507934, "lr": 0.0009995614150494292, "time_sec": 49.65966987609863 }, { "epoch": 3, "train_loss": 4.058719948577881, "train_acc": 0.08542, "test_loss": 4.564939413452149, "test_acc": 0.0316, "lyapunov": null, "grad_norm": 3.6062592227635153, "grad_max_sv": 3.0093896448612214, "grad_min_sv": 6.351203426790964e-08, "grad_condition": 159552980.8120403, "lr": 0.0009990133642141358, "time_sec": 49.6358323097229 }, { "epoch": 4, "train_loss": 3.8575441249084474, "train_acc": 0.11032, "test_loss": 4.524412051391602, "test_acc": 0.0409, "lyapunov": null, "grad_norm": 2.92902742157696, "grad_max_sv": 2.357221654057503, "grad_min_sv": 5.122935820833785e-08, "grad_condition": 93072427.1014817, "lr": 0.0009982464296247522, "time_sec": 49.63461923599243 }, { "epoch": 5, "train_loss": 3.6889766606140135, "train_acc": 0.13372, "test_loss": 4.625890071105957, "test_acc": 0.0423, "lyapunov": null, "grad_norm": 2.3880731569941602, "grad_max_sv": 1.768235558271408, "grad_min_sv": 4.081188793129964e-08, "grad_condition": 393314864.55004865, "lr": 0.0009972609476841367, "time_sec": 49.89368748664856 }, { "epoch": 6, "train_loss": 3.5618105076599123, "train_acc": 0.15236, "test_loss": 4.4743853515625, "test_acc": 0.0606, "lyapunov": null, "grad_norm": 1.9549034892194537, "grad_max_sv": 1.3601578801870347, "grad_min_sv": 3.461635420948239e-08, "grad_condition": 108039525.34253314, "lr": 0.000996057350657239, "time_sec": 49.63013410568237 }, { "epoch": 7, "train_loss": 3.449751102294922, "train_acc": 0.17348, "test_loss": 4.566000821304321, "test_acc": 0.0583, "lyapunov": null, "grad_norm": 1.6054375498086935, "grad_max_sv": 0.970761476457119, "grad_min_sv": 2.837226934226944e-08, "grad_condition": 97915375.34094961, "lr": 0.000994636166481494, "time_sec": 49.65112805366516 }, { "epoch": 8, "train_loss": 3.362903434448242, "train_acc": 0.18704, "test_loss": 5.157250576019287, "test_acc": 0.0509, "lyapunov": null, "grad_norm": 1.4122949125779343, "grad_max_sv": 0.7663216680288315, "grad_min_sv": 2.498295813726896e-08, "grad_condition": 819581329.8584878, "lr": 0.0009929980185352525, "time_sec": 49.64129614830017 }, { "epoch": 9, "train_loss": 3.2836685932922363, "train_acc": 0.20434, "test_loss": 4.776924538803101, "test_acc": 0.0722, "lyapunov": null, "grad_norm": 1.3022948327813888, "grad_max_sv": 0.6469943135976791, "grad_min_sv": 2.306396500451058e-08, "grad_condition": 39951536.65872553, "lr": 0.0009911436253643444, "time_sec": 49.625274658203125 }, { "epoch": 10, "train_loss": 3.2231285871887208, "train_acc": 0.21402, "test_loss": 4.61860969619751, "test_acc": 0.0698, "lyapunov": null, "grad_norm": 1.2196486517440839, "grad_max_sv": 0.5692647032439708, "grad_min_sv": 2.19049595906462e-08, "grad_condition": 33845479.69359137, "lr": 0.0009890738003669028, "time_sec": 49.660149335861206 }, { "epoch": 11, "train_loss": 3.1583662706756592, "train_acc": 0.22336, "test_loss": 4.968407231903076, "test_acc": 0.0756, "lyapunov": null, "grad_norm": 1.1538157456115983, "grad_max_sv": 0.5210241436958313, "grad_min_sv": 2.0956197309580926e-08, "grad_condition": 525394408.4356891, "lr": 0.00098678945143658, "time_sec": 49.65011477470398 }, { "epoch": 12, "train_loss": 3.109931953125, "train_acc": 0.23662, "test_loss": 4.948040252685547, "test_acc": 0.0649, "lyapunov": null, "grad_norm": 1.1104505996303506, "grad_max_sv": 0.49291609674692155, "grad_min_sv": 2.0293893665535024e-08, "grad_condition": 28415855.264934354, "lr": 0.0009842915805643154, "time_sec": 49.63184213638306 }, { "epoch": 13, "train_loss": 3.0547399656677245, "train_acc": 0.24656, "test_loss": 4.970808222198486, "test_acc": 0.071, "lyapunov": null, "grad_norm": 1.0601665770785784, "grad_max_sv": 0.43972166776657107, "grad_min_sv": 1.913768455791276e-08, "grad_condition": 43447965.04145826, "lr": 0.000981581283398829, "time_sec": 49.61093473434448 }, { "epoch": 14, "train_loss": 3.017925659484863, "train_acc": 0.25326, "test_loss": 4.814505133056641, "test_acc": 0.0837, "lyapunov": null, "grad_norm": 1.014870172987229, "grad_max_sv": 0.42207302525639534, "grad_min_sv": 1.853980992200244e-08, "grad_condition": 39195315.53960514, "lr": 0.0009786597487660333, "time_sec": 49.673532009124756 }, { "epoch": 15, "train_loss": 2.9702432484436034, "train_acc": 0.2631, "test_loss": 5.807154141235351, "test_acc": 0.063, "lyapunov": null, "grad_norm": 0.9937971972307359, "grad_max_sv": 0.4026923879981041, "grad_min_sv": 1.8250485112059068e-08, "grad_condition": 40167603.205859475, "lr": 0.0009755282581475766, "time_sec": 49.618321657180786 }, { "epoch": 16, "train_loss": 2.944736771850586, "train_acc": 0.26722, "test_loss": 5.26193563079834, "test_acc": 0.0679, "lyapunov": null, "grad_norm": 0.9522428456453783, "grad_max_sv": 0.38795666843652726, "grad_min_sv": 1.7932681539711838e-08, "grad_condition": 23883480.656060785, "lr": 0.0009721881851187403, "time_sec": 49.62830376625061 }, { "epoch": 17, "train_loss": 2.9034721049499512, "train_acc": 0.27602, "test_loss": 5.7925373001098635, "test_acc": 0.064, "lyapunov": null, "grad_norm": 0.9254531496563255, "grad_max_sv": 0.3589652024209499, "grad_min_sv": 1.6935554087902337e-08, "grad_condition": 1457602436.4631252, "lr": 0.0009686409947459456, "time_sec": 49.61351823806763 }, { "epoch": 18, "train_loss": 2.8702178131866454, "train_acc": 0.27916, "test_loss": 5.747376763916016, "test_acc": 0.0602, "lyapunov": null, "grad_norm": 0.886880691282622, "grad_max_sv": 0.35455706864595415, "grad_min_sv": 1.661939068586804e-08, "grad_condition": 37189913.97942409, "lr": 0.0009648882429441254, "time_sec": 49.602774143218994 }, { "epoch": 19, "train_loss": 2.8457236665344237, "train_acc": 0.28346, "test_loss": 5.225064262390137, "test_acc": 0.0742, "lyapunov": null, "grad_norm": 0.8745352102009426, "grad_max_sv": 0.33497569262981414, "grad_min_sv": 1.610201680879442e-08, "grad_condition": 37118382.124889985, "lr": 0.00096093157579425, "time_sec": 49.60137701034546 }, { "epoch": 20, "train_loss": 2.8215041007995607, "train_acc": 0.28872, "test_loss": 6.004126496887207, "test_acc": 0.0566, "lyapunov": null, "grad_norm": 0.8595248383665987, "grad_max_sv": 0.3317968972027302, "grad_min_sv": 1.6277641995410263e-08, "grad_condition": 25076117.492004953, "lr": 0.0009567727288213001, "time_sec": 49.606021881103516 }, { "epoch": 21, "train_loss": 2.7879924519348145, "train_acc": 0.296, "test_loss": 5.8324502685546875, "test_acc": 0.0713, "lyapunov": null, "grad_norm": 0.8282095227121367, "grad_max_sv": 0.3175826959311962, "grad_min_sv": 1.5523823382324054e-08, "grad_condition": 33473762.080522645, "lr": 0.0009524135262330095, "time_sec": 49.607139110565186 }, { "epoch": 22, "train_loss": 2.758204474105835, "train_acc": 0.30248, "test_loss": 6.578706220245361, "test_acc": 0.0618, "lyapunov": null, "grad_norm": 0.8257961231351345, "grad_max_sv": 0.30810598842799664, "grad_min_sv": 1.5302382311288555e-08, "grad_condition": 24529675.495205637, "lr": 0.0009478558801197061, "time_sec": 49.624640464782715 }, { "epoch": 23, "train_loss": 2.738676343231201, "train_acc": 0.30592, "test_loss": 5.4664344863891605, "test_acc": 0.0861, "lyapunov": null, "grad_norm": 0.8065233040737523, "grad_max_sv": 0.30156193524599073, "grad_min_sv": 1.49054265444204e-08, "grad_condition": 33421080.710955955, "lr": 0.000943101789615607, "time_sec": 49.63160300254822 }, { "epoch": 24, "train_loss": 2.716878635177612, "train_acc": 0.31244, "test_loss": 6.44300007019043, "test_acc": 0.0749, "lyapunov": null, "grad_norm": 0.786905827456602, "grad_max_sv": 0.30066613033413886, "grad_min_sv": 1.476351601525927e-08, "grad_condition": 22958316.6446944, "lr": 0.0009381533400219313, "time_sec": 49.617870569229126 }, { "epoch": 25, "train_loss": 2.694182593231201, "train_acc": 0.31604, "test_loss": 5.382769798278809, "test_acc": 0.0916, "lyapunov": null, "grad_norm": 0.7761045602879763, "grad_max_sv": 0.2905112482607365, "grad_min_sv": 1.4682144194866353e-08, "grad_condition": 23004874.738089267, "lr": 0.0009330127018922189, "time_sec": 49.63197326660156 }, { "epoch": 26, "train_loss": 2.665074285736084, "train_acc": 0.3195, "test_loss": 6.5514334884643555, "test_acc": 0.0798, "lyapunov": null, "grad_norm": 0.7692786817334373, "grad_max_sv": 0.28090294301509855, "grad_min_sv": 1.4502390317805425e-08, "grad_condition": 76981810.64111714, "lr": 0.000927682130080253, "time_sec": 49.62014698982239 }, { "epoch": 27, "train_loss": 2.6460686820983885, "train_acc": 0.32446, "test_loss": 5.83518740234375, "test_acc": 0.0812, "lyapunov": null, "grad_norm": 0.754398795054657, "grad_max_sv": 0.27323813289403914, "grad_min_sv": 1.4150497623655057e-08, "grad_condition": 21603221.75046044, "lr": 0.0009221639627510072, "time_sec": 49.62936043739319 }, { "epoch": 28, "train_loss": 2.6265927952575683, "train_acc": 0.32812, "test_loss": 6.598120281982422, "test_acc": 0.0812, "lyapunov": null, "grad_norm": 0.7495858584128283, "grad_max_sv": 0.2764635566622019, "grad_min_sv": 1.3928179298794419e-08, "grad_condition": 26592087.597849313, "lr": 0.0009164606203550494, "time_sec": 49.65487575531006 }, { "epoch": 29, "train_loss": 2.5989754135131835, "train_acc": 0.33438, "test_loss": 6.019640913391113, "test_acc": 0.0853, "lyapunov": null, "grad_norm": 0.7328457671272296, "grad_max_sv": 0.26275444217026234, "grad_min_sv": 1.3466245638027452e-08, "grad_condition": 27074823.030799665, "lr": 0.0009105746045668516, "time_sec": 49.61575961112976 }, { "epoch": 30, "train_loss": 2.569355689697266, "train_acc": 0.3403, "test_loss": 5.656453500366211, "test_acc": 0.1069, "lyapunov": null, "grad_norm": 0.7285247723431758, "grad_max_sv": 0.2620399072766304, "grad_min_sv": 1.3607302561113865e-08, "grad_condition": 36595154.18813526, "lr": 0.0009045084971874733, "time_sec": 49.61033368110657 }, { "epoch": 31, "train_loss": 2.5531623433685304, "train_acc": 0.34344, "test_loss": 5.512335840606689, "test_acc": 0.1014, "lyapunov": null, "grad_norm": 0.7271132291276766, "grad_max_sv": 0.2741693131625652, "grad_min_sv": 1.3862067549386126e-08, "grad_condition": 23784567.90840191, "lr": 0.0008982649590120977, "time_sec": 49.62810754776001 }, { "epoch": 32, "train_loss": 2.540181041793823, "train_acc": 0.3433, "test_loss": 6.18716075592041, "test_acc": 0.0672, "lyapunov": null, "grad_norm": 0.7235480377928197, "grad_max_sv": 0.2649095542728901, "grad_min_sv": 1.3458577613478795e-08, "grad_condition": 45957043.50585803, "lr": 0.0008918467286629196, "time_sec": 49.6074960231781 }, { "epoch": 33, "train_loss": 2.5191816319274905, "train_acc": 0.34908, "test_loss": 6.582100025939941, "test_acc": 0.0751, "lyapunov": null, "grad_norm": 0.7200938019415711, "grad_max_sv": 0.25730164162814617, "grad_min_sv": 1.3406257262649212e-08, "grad_condition": 31538992.96164729, "lr": 0.0008852566213878943, "time_sec": 49.61494970321655 }, { "epoch": 34, "train_loss": 2.496463624954224, "train_acc": 0.35388, "test_loss": 6.577035200500489, "test_acc": 0.0824, "lyapunov": null, "grad_norm": 0.7056443924011199, "grad_max_sv": 0.2493937097489834, "grad_min_sv": 1.2909361921803475e-08, "grad_condition": 45513498.69422473, "lr": 0.000878497527825878, "time_sec": 49.61423134803772 }, { "epoch": 35, "train_loss": 2.476149175262451, "train_acc": 0.3577, "test_loss": 6.60574702758789, "test_acc": 0.0683, "lyapunov": null, "grad_norm": 0.7081960767237655, "grad_max_sv": 0.2570201367139816, "grad_min_sv": 1.3318109846893745e-08, "grad_condition": 40942846.386733145, "lr": 0.000871572412738697, "time_sec": 49.627204179763794 }, { "epoch": 36, "train_loss": 2.4584676556396485, "train_acc": 0.36174, "test_loss": 6.376377404785156, "test_acc": 0.1036, "lyapunov": null, "grad_norm": 0.7033365437967071, "grad_max_sv": 0.25586923360824587, "grad_min_sv": 1.3038588915492699e-08, "grad_condition": 29808789.927535187, "lr": 0.0008644843137107055, "time_sec": 49.658987283706665 }, { "epoch": 37, "train_loss": 2.437811667022705, "train_acc": 0.36606, "test_loss": 5.828952204895019, "test_acc": 0.1031, "lyapunov": null, "grad_norm": 0.6944168249360962, "grad_max_sv": 0.24849907420575618, "grad_min_sv": 1.295541044166182e-08, "grad_condition": 25181358.80101443, "lr": 0.0008572363398164014, "time_sec": 49.69488453865051 }, { "epoch": 38, "train_loss": 2.428686420135498, "train_acc": 0.36772, "test_loss": 5.761842573547363, "test_acc": 0.1089, "lyapunov": null, "grad_norm": 0.6926211199497188, "grad_max_sv": 0.24097422771155835, "grad_min_sv": 1.2852728982493122e-08, "grad_condition": 34221857.55107718, "lr": 0.0008498316702566826, "time_sec": 49.65219521522522 }, { "epoch": 39, "train_loss": 2.403228950653076, "train_acc": 0.37238, "test_loss": 6.327913746643066, "test_acc": 0.0717, "lyapunov": null, "grad_norm": 0.6898323608739025, "grad_max_sv": 0.24370794370770454, "grad_min_sv": 1.2873074178160193e-08, "grad_condition": 57305083.56976622, "lr": 0.0008422735529643442, "time_sec": 49.67387104034424 }, { "epoch": 40, "train_loss": 2.4002745401000976, "train_acc": 0.37394, "test_loss": 6.5177731010437014, "test_acc": 0.083, "lyapunov": null, "grad_norm": 0.6833298006535204, "grad_max_sv": 0.2354185614734888, "grad_min_sv": 1.2765965198835438e-08, "grad_condition": 21504088.72491734, "lr": 0.0008345653031794289, "time_sec": 49.617934226989746 }, { "epoch": 41, "train_loss": 2.375027209320068, "train_acc": 0.37838, "test_loss": 5.745588743591308, "test_acc": 0.0906, "lyapunov": null, "grad_norm": 0.6828029580415041, "grad_max_sv": 0.2435049433261156, "grad_min_sv": 1.2850220883556252e-08, "grad_condition": 81583325.51254459, "lr": 0.0008267103019950526, "time_sec": 49.618937492370605 }, { "epoch": 42, "train_loss": 2.3483433491516115, "train_acc": 0.38482, "test_loss": 6.884811988830567, "test_acc": 0.0781, "lyapunov": null, "grad_norm": 0.6754176682521642, "grad_max_sv": 0.23814460188150405, "grad_min_sv": 1.2720279750355611e-08, "grad_condition": 59300475.89689113, "lr": 0.0008187119948743447, "time_sec": 49.61317276954651 }, { "epoch": 43, "train_loss": 2.3344376317596436, "train_acc": 0.38764, "test_loss": 6.61351337890625, "test_acc": 0.0969, "lyapunov": null, "grad_norm": 0.6769988439891311, "grad_max_sv": 0.23613341376185418, "grad_min_sv": 1.2639965266819653e-08, "grad_condition": 52119429.92492165, "lr": 0.000810573890139155, "time_sec": 49.61902713775635 }, { "epoch": 44, "train_loss": 2.3136163584899903, "train_acc": 0.39148, "test_loss": 6.608843360137939, "test_acc": 0.0931, "lyapunov": null, "grad_norm": 0.6707039764412329, "grad_max_sv": 0.23947011977434157, "grad_min_sv": 1.2690825271916007e-08, "grad_condition": 66659408.04853566, "lr": 0.0008022995574311873, "time_sec": 49.651583671569824 }, { "epoch": 45, "train_loss": 2.303262007751465, "train_acc": 0.3968, "test_loss": 7.3357599853515625, "test_acc": 0.0763, "lyapunov": null, "grad_norm": 0.6720641219214196, "grad_max_sv": 0.2344801113009453, "grad_min_sv": 1.2468999964487804e-08, "grad_condition": 28252178.039376438, "lr": 0.0007938926261462363, "time_sec": 49.6513557434082 }, { "epoch": 46, "train_loss": 2.294885206298828, "train_acc": 0.39602, "test_loss": 7.143599510192871, "test_acc": 0.0808, "lyapunov": null, "grad_norm": 0.6723751960213503, "grad_max_sv": 0.23659461848437785, "grad_min_sv": 1.2819257341756262e-08, "grad_condition": 24273419.96656149, "lr": 0.0007853567838422158, "time_sec": 49.67392659187317 }, { "epoch": 47, "train_loss": 2.2797239797973634, "train_acc": 0.39734, "test_loss": 7.214380073547363, "test_acc": 0.0775, "lyapunov": null, "grad_norm": 0.6804834576699708, "grad_max_sv": 0.23809269666671753, "grad_min_sv": 1.2608010335757313e-08, "grad_condition": 25254183.290313803, "lr": 0.0007766957746216719, "time_sec": 49.69322681427002 }, { "epoch": 48, "train_loss": 2.265524502334595, "train_acc": 0.40104, "test_loss": 7.091396580505371, "test_acc": 0.0731, "lyapunov": null, "grad_norm": 0.667046368857113, "grad_max_sv": 0.23234264142811298, "grad_min_sv": 1.2433218019025638e-08, "grad_condition": 22653859.281439293, "lr": 0.0007679133974894982, "time_sec": 49.65531873703003 }, { "epoch": 49, "train_loss": 2.2435117234802244, "train_acc": 0.40428, "test_loss": 7.294827133178711, "test_acc": 0.0737, "lyapunov": null, "grad_norm": 0.6646443647443216, "grad_max_sv": 0.23331840261816977, "grad_min_sv": 1.2566753440634847e-08, "grad_condition": 29559825.642532967, "lr": 0.000759013504686565, "time_sec": 49.66777467727661 }, { "epoch": 50, "train_loss": 2.2254374363708496, "train_acc": 0.4097, "test_loss": 8.604184033203126, "test_acc": 0.0731, "lyapunov": null, "grad_norm": 0.6690954918149841, "grad_max_sv": 0.22841170839965344, "grad_min_sv": 1.2475536101397288e-08, "grad_condition": 21723914.29311887, "lr": 0.0007499999999999998, "time_sec": 49.67113780975342 }, { "epoch": 51, "train_loss": 2.2072127560424804, "train_acc": 0.41446, "test_loss": 6.9883695976257325, "test_acc": 0.0803, "lyapunov": null, "grad_norm": 0.6607736738937507, "grad_max_sv": 0.2331558234989643, "grad_min_sv": 1.243218040875016e-08, "grad_condition": 27632939.34803492, "lr": 0.0007408768370508575, "time_sec": 49.65227961540222 }, { "epoch": 52, "train_loss": 2.1981446758270264, "train_acc": 0.41588, "test_loss": 8.058159327697753, "test_acc": 0.0799, "lyapunov": null, "grad_norm": 0.6648453996346088, "grad_max_sv": 0.2446960099041462, "grad_min_sv": 1.2652686252889733e-08, "grad_condition": 41197472.85285741, "lr": 0.0007316480175599307, "time_sec": 49.61691617965698 }, { "epoch": 53, "train_loss": 2.174496583709717, "train_acc": 0.42132, "test_loss": 7.289675385284424, "test_acc": 0.0877, "lyapunov": null, "grad_norm": 0.6618427859375565, "grad_max_sv": 0.2312875609844923, "grad_min_sv": 1.239080896497935e-08, "grad_condition": 23822848.628154784, "lr": 0.0007223175895924635, "time_sec": 49.65499806404114 }, { "epoch": 54, "train_loss": 2.16634906211853, "train_acc": 0.42064, "test_loss": 7.236015202331543, "test_acc": 0.0958, "lyapunov": null, "grad_norm": 0.6619124781918282, "grad_max_sv": 0.2310062251985073, "grad_min_sv": 1.2317981715193049e-08, "grad_condition": 26820300.581125747, "lr": 0.0007128896457825361, "time_sec": 49.61980724334717 }, { "epoch": 55, "train_loss": 2.14550412109375, "train_acc": 0.4265, "test_loss": 6.8394420608520505, "test_acc": 0.0943, "lyapunov": null, "grad_norm": 0.6625916025346076, "grad_max_sv": 0.23202612698078157, "grad_min_sv": 1.2528317372417775e-08, "grad_condition": 25612000.25663858, "lr": 0.0007033683215378998, "time_sec": 49.674599170684814 }, { "epoch": 56, "train_loss": 2.1276820320892336, "train_acc": 0.42994, "test_loss": 6.964908208465576, "test_acc": 0.0954, "lyapunov": null, "grad_norm": 0.6554659738718382, "grad_max_sv": 0.2207026917487383, "grad_min_sv": 1.2088878859062292e-08, "grad_condition": 21085232.116952278, "lr": 0.0006937577932260512, "time_sec": 49.67076587677002 }, { "epoch": 57, "train_loss": 2.1337597509765627, "train_acc": 0.42926, "test_loss": 8.229502785491944, "test_acc": 0.0862, "lyapunov": null, "grad_norm": 0.65752559961672, "grad_max_sv": 0.2246583230793476, "grad_min_sv": 1.2207756456758534e-08, "grad_condition": 64230626.47705172, "lr": 0.0006840622763423388, "time_sec": 49.64063334465027 }, { "epoch": 58, "train_loss": 2.1041818314361573, "train_acc": 0.43524, "test_loss": 6.589992712402344, "test_acc": 0.1085, "lyapunov": null, "grad_norm": 0.6598697025296996, "grad_max_sv": 0.23252296969294547, "grad_min_sv": 1.2361365446522666e-08, "grad_condition": 30301917.129872173, "lr": 0.0006742860236609073, "time_sec": 49.61933445930481 }, { "epoch": 59, "train_loss": 2.096152271270752, "train_acc": 0.4375, "test_loss": 6.983989217376709, "test_acc": 0.0982, "lyapunov": null, "grad_norm": 0.6560896741871133, "grad_max_sv": 0.23231945298612117, "grad_min_sv": 1.251871321050757e-08, "grad_condition": 22362788.103550732, "lr": 0.0006644333233692913, "time_sec": 49.61751055717468 }, { "epoch": 60, "train_loss": 2.081830069847107, "train_acc": 0.43602, "test_loss": 7.386634468841553, "test_acc": 0.1014, "lyapunov": null, "grad_norm": 0.6536599782236483, "grad_max_sv": 0.22322102561593055, "grad_min_sv": 1.2262779891525356e-08, "grad_condition": 23489422.867959693, "lr": 0.0006545084971874734, "time_sec": 49.620344161987305 }, { "epoch": 61, "train_loss": 2.0558355644226074, "train_acc": 0.44474, "test_loss": 7.227272665405273, "test_acc": 0.1013, "lyapunov": null, "grad_norm": 0.6572328158390935, "grad_max_sv": 0.22376591265201567, "grad_min_sv": 1.238219781984906e-08, "grad_condition": 31021778.17636667, "lr": 0.0006445158984722354, "time_sec": 49.6348340511322 }, { "epoch": 62, "train_loss": 2.0572922328948975, "train_acc": 0.44566, "test_loss": 7.505316355133057, "test_acc": 0.0927, "lyapunov": null, "grad_norm": 0.656923815023976, "grad_max_sv": 0.23445738479495049, "grad_min_sv": 1.2478020391688133e-08, "grad_condition": 262812298.93435702, "lr": 0.0006344599103076324, "time_sec": 49.62543535232544 }, { "epoch": 63, "train_loss": 2.0413633464813232, "train_acc": 0.44668, "test_loss": 7.251725723266602, "test_acc": 0.0991, "lyapunov": null, "grad_norm": 0.6568909181034195, "grad_max_sv": 0.2302928999066353, "grad_min_sv": 1.2521502933821038e-08, "grad_condition": 42011077.53000567, "lr": 0.0006243449435824269, "time_sec": 49.68104648590088 }, { "epoch": 64, "train_loss": 2.0206649338531495, "train_acc": 0.4545, "test_loss": 7.670287243652344, "test_acc": 0.0929, "lyapunov": null, "grad_norm": 0.6597611249894066, "grad_max_sv": 0.2243791937828064, "grad_min_sv": 1.2141039159446754e-08, "grad_condition": 44929605.00249899, "lr": 0.0006141754350553275, "time_sec": 49.63578200340271 }, { "epoch": 65, "train_loss": 2.005788911895752, "train_acc": 0.45556, "test_loss": 8.490129399871826, "test_acc": 0.0881, "lyapunov": null, "grad_norm": 0.6550260718391842, "grad_max_sv": 0.2345993619412184, "grad_min_sv": 1.2238496998467907e-08, "grad_condition": 51372022.47833033, "lr": 0.0006039558454088793, "time_sec": 49.70135450363159 }, { "epoch": 66, "train_loss": 1.9908720332336425, "train_acc": 0.45934, "test_loss": 7.83362244720459, "test_acc": 0.086, "lyapunov": null, "grad_norm": 0.6563592700125107, "grad_max_sv": 0.22401900850236417, "grad_min_sv": 1.2119369038193772e-08, "grad_condition": 33434586.35249608, "lr": 0.000593690657292862, "time_sec": 49.64280724525452 }, { "epoch": 67, "train_loss": 1.9691172955703735, "train_acc": 0.46306, "test_loss": 7.884465830230713, "test_acc": 0.0818, "lyapunov": null, "grad_norm": 0.6567132328483392, "grad_max_sv": 0.231986141204834, "grad_min_sv": 1.2402723173488006e-08, "grad_condition": 25823647.646229025, "lr": 0.0005833843733580507, "time_sec": 49.62420701980591 }, { "epoch": 68, "train_loss": 1.9622927265167236, "train_acc": 0.46458, "test_loss": 8.4931605758667, "test_acc": 0.0703, "lyapunov": null, "grad_norm": 0.6522693664046653, "grad_max_sv": 0.2248720645904541, "grad_min_sv": 1.232144753449127e-08, "grad_condition": 20661085.738957692, "lr": 0.0005730415142812054, "time_sec": 49.61964273452759 }, { "epoch": 69, "train_loss": 1.936687505493164, "train_acc": 0.47236, "test_loss": 8.64132734375, "test_acc": 0.0679, "lyapunov": null, "grad_norm": 0.6510309265124044, "grad_max_sv": 0.21742373295128345, "grad_min_sv": 1.1974758069681346e-08, "grad_condition": 304726416.82408583, "lr": 0.0005626666167821517, "time_sec": 49.644230365753174 }, { "epoch": 70, "train_loss": 1.9254214583587645, "train_acc": 0.47336, "test_loss": 7.787073600769043, "test_acc": 0.0873, "lyapunov": null, "grad_norm": 0.6550976880903316, "grad_max_sv": 0.23343021050095558, "grad_min_sv": 1.22054698495919e-08, "grad_condition": 998661796.8752277, "lr": 0.0005522642316338265, "time_sec": 49.61548924446106 }, { "epoch": 71, "train_loss": 1.916664266433716, "train_acc": 0.47384, "test_loss": 8.817724546051025, "test_acc": 0.0687, "lyapunov": null, "grad_norm": 0.6548099516468633, "grad_max_sv": 0.21803590469062328, "grad_min_sv": 1.2030009292202104e-08, "grad_condition": 43118102.26962634, "lr": 0.0005418389216661573, "time_sec": 49.63275456428528 }, { "epoch": 72, "train_loss": 1.907302893638611, "train_acc": 0.47762, "test_loss": 9.211192407989502, "test_acc": 0.0704, "lyapunov": null, "grad_norm": 0.6550135667381578, "grad_max_sv": 0.22547000497579575, "grad_min_sv": 1.232130381889629e-08, "grad_condition": 21984085.02642382, "lr": 0.0005313952597646563, "time_sec": 49.6118586063385 }, { "epoch": 73, "train_loss": 1.877649710121155, "train_acc": 0.4827, "test_loss": 9.066388426208496, "test_acc": 0.0801, "lyapunov": null, "grad_norm": 0.6600796471066996, "grad_max_sv": 0.23919763825833798, "grad_min_sv": 1.2670018244287374e-08, "grad_condition": 42742098.34257165, "lr": 0.0005209378268645994, "time_sec": 49.67570900917053 }, { "epoch": 74, "train_loss": 1.8662859315490723, "train_acc": 0.48722, "test_loss": 9.122249521636963, "test_acc": 0.0675, "lyapunov": null, "grad_norm": 0.6547425237687021, "grad_max_sv": 0.22284357100725175, "grad_min_sv": 1.2111998770603094e-08, "grad_condition": 21063233.798650313, "lr": 0.0005104712099416781, "time_sec": 49.62467122077942 }, { "epoch": 75, "train_loss": 1.8634462587738037, "train_acc": 0.48572, "test_loss": 8.603226243591308, "test_acc": 0.07, "lyapunov": null, "grad_norm": 0.6594891408678691, "grad_max_sv": 0.2292952246963978, "grad_min_sv": 1.216953539884269e-08, "grad_condition": 23304533.995393943, "lr": 0.0004999999999999996, "time_sec": 49.6065719127655 }, { "epoch": 76, "train_loss": 1.8428347550964355, "train_acc": 0.49222, "test_loss": 9.348575830841064, "test_acc": 0.0716, "lyapunov": null, "grad_norm": 0.6514940871880716, "grad_max_sv": 0.2246335681527853, "grad_min_sv": 1.197331944077784e-08, "grad_condition": 79775997.36608414, "lr": 0.0004895287900583212, "time_sec": 49.633445262908936 }, { "epoch": 77, "train_loss": 1.8474174691390992, "train_acc": 0.49038, "test_loss": 9.063310955810547, "test_acc": 0.0749, "lyapunov": null, "grad_norm": 0.6555213730500407, "grad_max_sv": 0.22386705875396729, "grad_min_sv": 1.1975305359845923e-08, "grad_condition": 30024891.493045498, "lr": 0.0004790621731353997, "time_sec": 49.6582727432251 }, { "epoch": 78, "train_loss": 1.8240000118255615, "train_acc": 0.496, "test_loss": 7.937534573364258, "test_acc": 0.1042, "lyapunov": null, "grad_norm": 0.6578278625054611, "grad_max_sv": 0.22472502514719964, "grad_min_sv": 1.2227204815307146e-08, "grad_condition": 24809414.276176114, "lr": 0.000468604740235343, "time_sec": 49.60278058052063 }, { "epoch": 79, "train_loss": 1.7988454669952392, "train_acc": 0.50146, "test_loss": 7.830693682098389, "test_acc": 0.0946, "lyapunov": null, "grad_norm": 0.6564839484635767, "grad_max_sv": 0.23010910004377366, "grad_min_sv": 1.2367765268861408e-08, "grad_condition": 34528993.96450578, "lr": 0.00045816107833384175, "time_sec": 49.63169765472412 }, { "epoch": 80, "train_loss": 1.7962154034423827, "train_acc": 0.50466, "test_loss": 7.877956019592285, "test_acc": 0.0834, "lyapunov": null, "grad_norm": 0.6560300351960439, "grad_max_sv": 0.22126091420650482, "grad_min_sv": 1.2213627020862816e-08, "grad_condition": 21445784.707883697, "lr": 0.0004477357683661729, "time_sec": 49.672850131988525 }, { "epoch": 81, "train_loss": 1.7689838317871094, "train_acc": 0.5108, "test_loss": 8.936191275024415, "test_acc": 0.073, "lyapunov": null, "grad_norm": 0.6546524429638407, "grad_max_sv": 0.22751210294663907, "grad_min_sv": 1.2090203325293424e-08, "grad_condition": 37126500.828596935, "lr": 0.00043733338321784746, "time_sec": 49.6825795173645 }, { "epoch": 82, "train_loss": 1.7687132528686524, "train_acc": 0.50962, "test_loss": 8.322722315979004, "test_acc": 0.0867, "lyapunov": null, "grad_norm": 0.657879277273411, "grad_max_sv": 0.23299325592815875, "grad_min_sv": 1.2289513051655376e-08, "grad_condition": 29654551.548070945, "lr": 0.0004269584857187939, "time_sec": 49.77833390235901 }, { "epoch": 83, "train_loss": 1.7514041207885742, "train_acc": 0.51362, "test_loss": 7.874627603149414, "test_acc": 0.095, "lyapunov": null, "grad_norm": 0.65464844079956, "grad_max_sv": 0.22664147801697254, "grad_min_sv": 1.2152483562510863e-08, "grad_condition": 25844246.169428695, "lr": 0.0004166156266419484, "time_sec": 49.665401220321655 }, { "epoch": 84, "train_loss": 1.7470465963745117, "train_acc": 0.5132, "test_loss": 8.254433164978026, "test_acc": 0.0915, "lyapunov": null, "grad_norm": 0.6562560461399737, "grad_max_sv": 0.22655668184161187, "grad_min_sv": 1.2271174511246929e-08, "grad_condition": 46640276.774946496, "lr": 0.0004063093427071373, "time_sec": 49.66734290122986 }, { "epoch": 85, "train_loss": 1.7298235196685792, "train_acc": 0.51892, "test_loss": 8.706323757171631, "test_acc": 0.0911, "lyapunov": null, "grad_norm": 0.6550616576389223, "grad_max_sv": 0.23714832365512847, "grad_min_sv": 1.223523634630297e-08, "grad_condition": 29585164.78334018, "lr": 0.0003960441545911199, "time_sec": 49.640406370162964 }, { "epoch": 86, "train_loss": 1.724207964477539, "train_acc": 0.51926, "test_loss": 8.765803309631348, "test_acc": 0.0835, "lyapunov": null, "grad_norm": 0.6508855742051911, "grad_max_sv": 0.2245300356298685, "grad_min_sv": 1.2214838868152e-08, "grad_condition": 20628200.471479602, "lr": 0.0003858245649446718, "time_sec": 49.63991856575012 }, { "epoch": 87, "train_loss": 1.7018416146087647, "train_acc": 0.52598, "test_loss": 8.139996655273437, "test_acc": 0.096, "lyapunov": null, "grad_norm": 0.6595894571592862, "grad_max_sv": 0.2325576465576887, "grad_min_sv": 1.2264047567420167e-08, "grad_condition": 62109028.98086828, "lr": 0.00037565505641757235, "time_sec": 49.62706279754639 }, { "epoch": 88, "train_loss": 1.690174805984497, "train_acc": 0.52992, "test_loss": 8.284830725860596, "test_acc": 0.0946, "lyapunov": null, "grad_norm": 0.6523549145137596, "grad_max_sv": 0.22278686761856079, "grad_min_sv": 1.2230143851127417e-08, "grad_condition": 41887788.39074431, "lr": 0.00036554008969236695, "time_sec": 49.6299991607666 }, { "epoch": 89, "train_loss": 1.6808083280181885, "train_acc": 0.5298, "test_loss": 8.205404133605956, "test_acc": 0.0955, "lyapunov": null, "grad_norm": 0.6525447581270152, "grad_max_sv": 0.22465928830206394, "grad_min_sv": 1.2332067528264546e-08, "grad_condition": 23009318.737796, "lr": 0.0003554841015277638, "time_sec": 49.66408705711365 }, { "epoch": 90, "train_loss": 1.6637053575134277, "train_acc": 0.5337, "test_loss": 8.177736569213867, "test_acc": 0.0899, "lyapunov": null, "grad_norm": 0.6537473055068921, "grad_max_sv": 0.22377123720943928, "grad_min_sv": 1.2110254177244429e-08, "grad_condition": 25938015.098525234, "lr": 0.000345491502812526, "time_sec": 49.63126850128174 }, { "epoch": 91, "train_loss": 1.6554726396942139, "train_acc": 0.5354, "test_loss": 8.995069329833985, "test_acc": 0.08, "lyapunov": null, "grad_norm": 0.6575477667608048, "grad_max_sv": 0.23422496095299722, "grad_min_sv": 1.246219855713382e-08, "grad_condition": 41932891.920117736, "lr": 0.0003355666766307081, "time_sec": 49.63232660293579 }, { "epoch": 92, "train_loss": 1.6413372038269043, "train_acc": 0.54098, "test_loss": 9.550636445617675, "test_acc": 0.0761, "lyapunov": null, "grad_norm": 0.6610051290863374, "grad_max_sv": 0.23229929022490978, "grad_min_sv": 1.2352718607028245e-08, "grad_condition": 41078160.523768075, "lr": 0.00032571397633909225, "time_sec": 49.653891801834106 }, { "epoch": 93, "train_loss": 1.6310989672470093, "train_acc": 0.54374, "test_loss": 9.458463846588135, "test_acc": 0.0736, "lyapunov": null, "grad_norm": 0.6572216683080783, "grad_max_sv": 0.23672427460551262, "grad_min_sv": 1.2539241084352782e-08, "grad_condition": 23064462.944409598, "lr": 0.00031593772365766094, "time_sec": 49.65013003349304 }, { "epoch": 94, "train_loss": 1.6185439474868775, "train_acc": 0.5456, "test_loss": 9.447592375946044, "test_acc": 0.0781, "lyapunov": null, "grad_norm": 0.6543172085287396, "grad_max_sv": 0.2255704291164875, "grad_min_sv": 1.1963030848924361e-08, "grad_condition": 48501470.614931956, "lr": 0.0003062422067739483, "time_sec": 49.68069577217102 }, { "epoch": 95, "train_loss": 1.6036190982055665, "train_acc": 0.54806, "test_loss": 9.521705908203124, "test_acc": 0.0835, "lyapunov": null, "grad_norm": 0.6561083866637782, "grad_max_sv": 0.23088240325450898, "grad_min_sv": 1.2247599834314115e-08, "grad_condition": 26484829.628142, "lr": 0.00029663167846209965, "time_sec": 49.62816071510315 }, { "epoch": 96, "train_loss": 1.6020113516998291, "train_acc": 0.54904, "test_loss": 9.115081603240967, "test_acc": 0.0889, "lyapunov": null, "grad_norm": 0.6572025699230744, "grad_max_sv": 0.22745007649064064, "grad_min_sv": 1.2209962416132036e-08, "grad_condition": 32247618.106625605, "lr": 0.00028711035421746345, "time_sec": 49.61973428726196 }, { "epoch": 97, "train_loss": 1.589581788368225, "train_acc": 0.55386, "test_loss": 9.091486672973632, "test_acc": 0.0752, "lyapunov": null, "grad_norm": 0.6480214804623958, "grad_max_sv": 0.22622964382171631, "grad_min_sv": 1.213211238138001e-08, "grad_condition": 23427245.234249383, "lr": 0.00027768241040753615, "time_sec": 49.67304968833923 }, { "epoch": 98, "train_loss": 1.5766529482269287, "train_acc": 0.55484, "test_loss": 8.739159268188477, "test_acc": 0.0912, "lyapunov": null, "grad_norm": 0.6545216229967632, "grad_max_sv": 0.22466104663908482, "grad_min_sv": 1.2034743685634952e-08, "grad_condition": 37920262.92732872, "lr": 0.00026835198244006903, "time_sec": 49.6529438495636 }, { "epoch": 99, "train_loss": 1.5610430017852783, "train_acc": 0.55952, "test_loss": 9.326904290771484, "test_acc": 0.0857, "lyapunov": null, "grad_norm": 0.6510280187361254, "grad_max_sv": 0.22991822883486748, "grad_min_sv": 1.2031296814374315e-08, "grad_condition": 33021222.855397005, "lr": 0.0002591231629491421, "time_sec": 49.64146590232849 }, { "epoch": 100, "train_loss": 1.5503544171142578, "train_acc": 0.56096, "test_loss": 8.863075296783448, "test_acc": 0.0956, "lyapunov": null, "grad_norm": 0.6587934740560508, "grad_max_sv": 0.22904604896903039, "grad_min_sv": 1.2335589709942807e-08, "grad_condition": 85131461.34992474, "lr": 0.0002499999999999997, "time_sec": 49.6390540599823 }, { "epoch": 101, "train_loss": 1.5390491861343383, "train_acc": 0.56416, "test_loss": 8.707357301330566, "test_acc": 0.1024, "lyapunov": null, "grad_norm": 0.662018499627777, "grad_max_sv": 0.23979119583964348, "grad_min_sv": 1.238348213417062e-08, "grad_condition": 33906848.52058145, "lr": 0.00024098649531343477, "time_sec": 49.63421368598938 }, { "epoch": 102, "train_loss": 1.5312192189788818, "train_acc": 0.56726, "test_loss": 9.40553295135498, "test_acc": 0.0875, "lyapunov": null, "grad_norm": 0.6540742670514875, "grad_max_sv": 0.23145525828003882, "grad_min_sv": 1.2288377408686824e-08, "grad_condition": 37958642.13054756, "lr": 0.0002320866025105016, "time_sec": 49.65552067756653 }, { "epoch": 103, "train_loss": 1.5286355770111084, "train_acc": 0.56548, "test_loss": 9.07997163925171, "test_acc": 0.1043, "lyapunov": null, "grad_norm": 0.6557756421519878, "grad_max_sv": 0.24100108593702316, "grad_min_sv": 1.2461116480344537e-08, "grad_condition": 25662204.639090188, "lr": 0.0002233042253783278, "time_sec": 49.6308536529541 }, { "epoch": 104, "train_loss": 1.5213085984420776, "train_acc": 0.56866, "test_loss": 9.145785698699951, "test_acc": 0.0859, "lyapunov": null, "grad_norm": 0.6504666354250909, "grad_max_sv": 0.2253209725022316, "grad_min_sv": 1.1966959748144212e-08, "grad_condition": 54876833.04192768, "lr": 0.000214643216157784, "time_sec": 49.63847613334656 }, { "epoch": 105, "train_loss": 1.5079352280044556, "train_acc": 0.5695, "test_loss": 8.336384162902831, "test_acc": 0.1061, "lyapunov": null, "grad_norm": 0.6571653396229992, "grad_max_sv": 0.23069135881960393, "grad_min_sv": 1.2210977743190576e-08, "grad_condition": 88846977.18417618, "lr": 0.00020610737385376332, "time_sec": 49.627315044403076 }, { "epoch": 106, "train_loss": 1.4935028577423095, "train_acc": 0.57654, "test_loss": 9.006987256622315, "test_acc": 0.0957, "lyapunov": null, "grad_norm": 0.651656183779343, "grad_max_sv": 0.22712415568530558, "grad_min_sv": 1.2032355989344268e-08, "grad_condition": 25049163.560516536, "lr": 0.00019770044256881242, "time_sec": 49.62053084373474 }, { "epoch": 107, "train_loss": 1.4878737406158447, "train_acc": 0.57426, "test_loss": 10.11307799987793, "test_acc": 0.075, "lyapunov": null, "grad_norm": 0.6524830728325739, "grad_max_sv": 0.22892994433641434, "grad_min_sv": 1.2128688251650255e-08, "grad_condition": 43366733.79550102, "lr": 0.0001894261098608447, "time_sec": 49.60416531562805 }, { "epoch": 108, "train_loss": 1.4871094806671143, "train_acc": 0.57634, "test_loss": 9.736641611480714, "test_acc": 0.0847, "lyapunov": null, "grad_norm": 0.6526478556992521, "grad_max_sv": 0.2283865675330162, "grad_min_sv": 1.2084086392638583e-08, "grad_condition": 30684405.14241614, "lr": 0.000181288005125655, "time_sec": 49.599942207336426 }, { "epoch": 109, "train_loss": 1.4713194018936158, "train_acc": 0.5814, "test_loss": 9.849570913696288, "test_acc": 0.0735, "lyapunov": null, "grad_norm": 0.6520669107663062, "grad_max_sv": 0.22863508015871048, "grad_min_sv": 1.206205209880462e-08, "grad_condition": 22397938.389471006, "lr": 0.0001732896980049473, "time_sec": 49.610928773880005 }, { "epoch": 110, "train_loss": 1.463755881729126, "train_acc": 0.58362, "test_loss": 10.715107778930664, "test_acc": 0.0741, "lyapunov": null, "grad_norm": 0.6526504347541894, "grad_max_sv": 0.2301381327211857, "grad_min_sv": 1.2070842162273388e-08, "grad_condition": 58529848.61276511, "lr": 0.00016543469682057076, "time_sec": 49.607982873916626 }, { "epoch": 111, "train_loss": 1.458272280807495, "train_acc": 0.58544, "test_loss": 9.91223872833252, "test_acc": 0.0829, "lyapunov": null, "grad_norm": 0.657140008872575, "grad_max_sv": 0.23369005173444748, "grad_min_sv": 1.2170888367274423e-08, "grad_condition": 42634071.92220701, "lr": 0.00015772644703565552, "time_sec": 49.6121985912323 }, { "epoch": 112, "train_loss": 1.4423779841613769, "train_acc": 0.58982, "test_loss": 10.218679902648926, "test_acc": 0.0785, "lyapunov": null, "grad_norm": 0.6570457541981778, "grad_max_sv": 0.2342597097158432, "grad_min_sv": 1.2216584609550663e-08, "grad_condition": 64070619.26224355, "lr": 0.00015016832974331713, "time_sec": 49.62796497344971 }, { "epoch": 113, "train_loss": 1.4301787731170654, "train_acc": 0.58978, "test_loss": 9.96994764251709, "test_acc": 0.0848, "lyapunov": null, "grad_norm": 0.6545785705102263, "grad_max_sv": 0.23776416704058648, "grad_min_sv": 1.2195284053440059e-08, "grad_condition": 29429303.691607207, "lr": 0.00014276366018359834, "time_sec": 49.63600516319275 }, { "epoch": 114, "train_loss": 1.431484651260376, "train_acc": 0.59188, "test_loss": 9.352456809234619, "test_acc": 0.0912, "lyapunov": null, "grad_norm": 0.6560872782233574, "grad_max_sv": 0.23789514154195784, "grad_min_sv": 1.2277434646712493e-08, "grad_condition": 29643562.652553707, "lr": 0.00013551568628929425, "time_sec": 49.64847278594971 }, { "epoch": 115, "train_loss": 1.4156108039093018, "train_acc": 0.59466, "test_loss": 9.393049124145508, "test_acc": 0.0902, "lyapunov": null, "grad_norm": 0.6560202611490502, "grad_max_sv": 0.23022275194525718, "grad_min_sv": 1.211471579581902e-08, "grad_condition": 29752416.717853196, "lr": 0.00012842758726130276, "time_sec": 49.646286725997925 }, { "epoch": 116, "train_loss": 1.419507451171875, "train_acc": 0.59538, "test_loss": 9.898611540222168, "test_acc": 0.0823, "lyapunov": null, "grad_norm": 0.6554438751866899, "grad_max_sv": 0.23169372119009496, "grad_min_sv": 1.2254989865956301e-08, "grad_condition": 32739963.172941543, "lr": 0.0001215024721741218, "time_sec": 49.66101384162903 }, { "epoch": 117, "train_loss": 1.4052832598495484, "train_acc": 0.59742, "test_loss": 9.80786139831543, "test_acc": 0.0746, "lyapunov": null, "grad_norm": 0.6502624050693765, "grad_max_sv": 0.23535267189145087, "grad_min_sv": 1.2210560307313046e-08, "grad_condition": 34512756.66701891, "lr": 0.00011474337861210538, "time_sec": 49.635112285614014 }, { "epoch": 118, "train_loss": 1.407028383216858, "train_acc": 0.59456, "test_loss": 9.323918186950683, "test_acc": 0.0923, "lyapunov": null, "grad_norm": 0.6532731757355527, "grad_max_sv": 0.23146636895835399, "grad_min_sv": 1.2073984001492733e-08, "grad_condition": 27415450.93514964, "lr": 0.00010815327133708009, "time_sec": 49.67300295829773 }, { "epoch": 119, "train_loss": 1.3942961041641235, "train_acc": 0.60004, "test_loss": 9.392257122802734, "test_acc": 0.0923, "lyapunov": null, "grad_norm": 0.6512526041128694, "grad_max_sv": 0.2304602511227131, "grad_min_sv": 1.196873851000424e-08, "grad_condition": 27052501.627034713, "lr": 0.00010173504098790182, "time_sec": 49.66038250923157 }, { "epoch": 120, "train_loss": 1.3861536862182617, "train_acc": 0.60168, "test_loss": 9.79215132522583, "test_acc": 0.0883, "lyapunov": null, "grad_norm": 0.6546312963164914, "grad_max_sv": 0.23524674400687218, "grad_min_sv": 1.2223635334485117e-08, "grad_condition": 23146281.84709592, "lr": 9.549150281252629e-05, "time_sec": 49.64855408668518 }, { "epoch": 121, "train_loss": 1.382921607093811, "train_acc": 0.60466, "test_loss": 9.083266135406495, "test_acc": 0.1, "lyapunov": null, "grad_norm": 0.6533990071886453, "grad_max_sv": 0.22603939548134805, "grad_min_sv": 1.2147275964269344e-08, "grad_condition": 31306417.63450122, "lr": 8.942539543314794e-05, "time_sec": 49.62118649482727 }, { "epoch": 122, "train_loss": 1.3776706603240967, "train_acc": 0.60552, "test_loss": 10.107886312866212, "test_acc": 0.0771, "lyapunov": null, "grad_norm": 0.650347981554726, "grad_max_sv": 0.22755396254360677, "grad_min_sv": 1.200875722057182e-08, "grad_condition": 26822439.671770982, "lr": 8.353937964495024e-05, "time_sec": 49.625091552734375 }, { "epoch": 123, "train_loss": 1.3719213924789428, "train_acc": 0.60596, "test_loss": 9.897831336212159, "test_acc": 0.0827, "lyapunov": null, "grad_norm": 0.6494680388920978, "grad_max_sv": 0.23135662637650967, "grad_min_sv": 1.2129681067896137e-08, "grad_condition": 24324265.536500372, "lr": 7.783603724899243e-05, "time_sec": 49.683146476745605 }, { "epoch": 124, "train_loss": 1.372097077255249, "train_acc": 0.60532, "test_loss": 9.392827641296387, "test_acc": 0.091, "lyapunov": null, "grad_norm": 0.650191030859608, "grad_max_sv": 0.2314681064337492, "grad_min_sv": 1.2054343853651339e-08, "grad_condition": 27641091.69673177, "lr": 7.231786991974666e-05, "time_sec": 49.71274280548096 }, { "epoch": 125, "train_loss": 1.370953790550232, "train_acc": 0.6058, "test_loss": 9.41628999938965, "test_acc": 0.0969, "lyapunov": null, "grad_norm": 0.6479408268968022, "grad_max_sv": 0.22912745289504527, "grad_min_sv": 1.1926550955165816e-08, "grad_condition": 38383449.24679903, "lr": 6.698729810778072e-05, "time_sec": 49.61937499046326 }, { "epoch": 126, "train_loss": 1.35777675239563, "train_acc": 0.61084, "test_loss": 9.729599977111816, "test_acc": 0.084, "lyapunov": null, "grad_norm": 0.6511889017989357, "grad_max_sv": 0.23615461364388465, "grad_min_sv": 1.21181827100747e-08, "grad_condition": 23269107.95301483, "lr": 6.184665997806817e-05, "time_sec": 49.616145610809326 }, { "epoch": 127, "train_loss": 1.3525141822052003, "train_acc": 0.60988, "test_loss": 9.375829245758057, "test_acc": 0.0908, "lyapunov": null, "grad_norm": 0.6536840306066181, "grad_max_sv": 0.23197561018168927, "grad_min_sv": 1.2315820041575164e-08, "grad_condition": 24883789.486126114, "lr": 5.6898210384392595e-05, "time_sec": 49.629499435424805 }, { "epoch": 128, "train_loss": 1.3482640004730224, "train_acc": 0.61222, "test_loss": 9.813197325134277, "test_acc": 0.0856, "lyapunov": null, "grad_norm": 0.6514039873738223, "grad_max_sv": 0.23501852825284003, "grad_min_sv": 1.2142686500737909e-08, "grad_condition": 25266297.201565318, "lr": 5.214411988029363e-05, "time_sec": 49.605358600616455 }, { "epoch": 129, "train_loss": 1.3569378799057006, "train_acc": 0.60816, "test_loss": 9.541576918029785, "test_acc": 0.0874, "lyapunov": null, "grad_norm": 0.6517316484787671, "grad_max_sv": 0.23406252562999724, "grad_min_sv": 1.2258221140926118e-08, "grad_condition": 29626662.60122323, "lr": 4.7586473766990294e-05, "time_sec": 49.625590085983276 }, { "epoch": 130, "train_loss": 1.3529891060638428, "train_acc": 0.60898, "test_loss": 9.487888061523437, "test_acc": 0.0929, "lyapunov": null, "grad_norm": 0.6538198266172623, "grad_max_sv": 0.23005600720643998, "grad_min_sv": 1.201972722117417e-08, "grad_condition": 37209362.20372974, "lr": 4.32272711786996e-05, "time_sec": 49.65739893913269 }, { "epoch": 131, "train_loss": 1.3454697626495362, "train_acc": 0.61572, "test_loss": 9.924783717346191, "test_acc": 0.0811, "lyapunov": null, "grad_norm": 0.6551713288471978, "grad_max_sv": 0.240146154910326, "grad_min_sv": 1.2333497152738903e-08, "grad_condition": 66623015.95467502, "lr": 3.906842420574966e-05, "time_sec": 49.62453866004944 }, { "epoch": 132, "train_loss": 1.3360938589859008, "train_acc": 0.61616, "test_loss": 9.586818018341065, "test_acc": 0.0889, "lyapunov": null, "grad_norm": 0.6504956714032589, "grad_max_sv": 0.23334665820002556, "grad_min_sv": 1.2104059498446728e-08, "grad_condition": 52369707.49757277, "lr": 3.5111757055874305e-05, "time_sec": 49.62921142578125 }, { "epoch": 133, "train_loss": 1.339883793449402, "train_acc": 0.61552, "test_loss": 9.673538793945312, "test_acc": 0.0929, "lyapunov": null, "grad_norm": 0.6476453899351778, "grad_max_sv": 0.23297516368329524, "grad_min_sv": 1.2124888488021512e-08, "grad_condition": 68199072.30592722, "lr": 3.1359005254054254e-05, "time_sec": 49.593669414520264 }, { "epoch": 134, "train_loss": 1.3361684355545045, "train_acc": 0.61882, "test_loss": 9.66245351715088, "test_acc": 0.0778, "lyapunov": null, "grad_norm": 0.6491838850685481, "grad_max_sv": 0.23596667721867562, "grad_min_sv": 1.1881547391789926e-08, "grad_condition": 40898877.174065895, "lr": 2.7811814881259484e-05, "time_sec": 49.60944747924805 }, { "epoch": 135, "train_loss": 1.3277960977554322, "train_acc": 0.61818, "test_loss": 9.974994463348388, "test_acc": 0.0794, "lyapunov": null, "grad_norm": 0.6475029366208067, "grad_max_sv": 0.2263253577053547, "grad_min_sv": 1.206646519577581e-08, "grad_condition": 59123509.407670066, "lr": 2.4471741852423218e-05, "time_sec": 49.63754081726074 }, { "epoch": 136, "train_loss": 1.3390293844604493, "train_acc": 0.6147, "test_loss": 9.827523893737792, "test_acc": 0.0857, "lyapunov": null, "grad_norm": 0.6539959690699623, "grad_max_sv": 0.2373226772993803, "grad_min_sv": 1.2036285343408615e-08, "grad_condition": 24295457.361463245, "lr": 2.1340251233966362e-05, "time_sec": 49.649282455444336 }, { "epoch": 137, "train_loss": 1.320917113571167, "train_acc": 0.62042, "test_loss": 10.049297039031982, "test_acc": 0.0816, "lyapunov": null, "grad_norm": 0.6470381085306396, "grad_max_sv": 0.22178312465548516, "grad_min_sv": 1.1698476365396004e-08, "grad_condition": 21323664.731712654, "lr": 1.8418716601170932e-05, "time_sec": 49.63605809211731 }, { "epoch": 138, "train_loss": 1.3167627235412598, "train_acc": 0.6236, "test_loss": 9.956857801055909, "test_acc": 0.0836, "lyapunov": null, "grad_norm": 0.6460826791518621, "grad_max_sv": 0.23469048999249936, "grad_min_sv": 1.2084183138643886e-08, "grad_condition": 303408536.5105225, "lr": 1.570841943568445e-05, "time_sec": 49.59550142288208 }, { "epoch": 139, "train_loss": 1.3184237383270263, "train_acc": 0.6197, "test_loss": 10.09333883972168, "test_acc": 0.0839, "lyapunov": null, "grad_norm": 0.6477507203630667, "grad_max_sv": 0.2281213853508234, "grad_min_sv": 1.203405910962796e-08, "grad_condition": 39837437.01020629, "lr": 1.3210548563419845e-05, "time_sec": 49.6094229221344 }, { "epoch": 140, "train_loss": 1.3220056551361083, "train_acc": 0.61976, "test_loss": 9.424947094726562, "test_acc": 0.0942, "lyapunov": null, "grad_norm": 0.644643549451068, "grad_max_sv": 0.22695489414036274, "grad_min_sv": 1.1866805089966182e-08, "grad_condition": 49710189.62801478, "lr": 1.0926199633097203e-05, "time_sec": 49.65405297279358 }, { "epoch": 141, "train_loss": 1.3249128121566773, "train_acc": 0.61924, "test_loss": 10.150922741699219, "test_acc": 0.0839, "lyapunov": null, "grad_norm": 0.6496616529807254, "grad_max_sv": 0.23303747363388538, "grad_min_sv": 1.2297343177092301e-08, "grad_condition": 32251173.502706695, "lr": 8.856374635655688e-06, "time_sec": 49.62998151779175 }, { "epoch": 142, "train_loss": 1.3221977783966063, "train_acc": 0.61854, "test_loss": 9.545345922851563, "test_acc": 0.0896, "lyapunov": null, "grad_norm": 0.6498976979178819, "grad_max_sv": 0.23321284241974355, "grad_min_sv": 1.2192657036780297e-08, "grad_condition": 38327958.94438372, "lr": 7.001981464747503e-06, "time_sec": 49.62353038787842 }, { "epoch": 143, "train_loss": 1.3161465112304687, "train_acc": 0.62108, "test_loss": 9.518995339202881, "test_acc": 0.0904, "lyapunov": null, "grad_norm": 0.65049671322247, "grad_max_sv": 0.2355397418141365, "grad_min_sv": 1.2113919437006793e-08, "grad_condition": 34055758.838127285, "lr": 5.3638335185058295e-06, "time_sec": 49.636550426483154 }, { "epoch": 144, "train_loss": 1.3199945546722411, "train_acc": 0.61928, "test_loss": 9.653044511413574, "test_acc": 0.0889, "lyapunov": null, "grad_norm": 0.6510219033687272, "grad_max_sv": 0.23736767545342446, "grad_min_sv": 1.2120116818503668e-08, "grad_condition": 26653772.592295133, "lr": 3.942649342761114e-06, "time_sec": 49.64809012413025 }, { "epoch": 145, "train_loss": 1.310637080039978, "train_acc": 0.62316, "test_loss": 10.082862811279297, "test_acc": 0.0865, "lyapunov": null, "grad_norm": 0.6486131550644274, "grad_max_sv": 0.23344326205551624, "grad_min_sv": 1.1724270552321281e-08, "grad_condition": 226542482.35064834, "lr": 2.7390523158633524e-06, "time_sec": 49.61792755126953 }, { "epoch": 146, "train_loss": 1.3224388639450073, "train_acc": 0.62, "test_loss": 10.004590126037598, "test_acc": 0.083, "lyapunov": null, "grad_norm": 0.6514083277071326, "grad_max_sv": 0.23273181915283203, "grad_min_sv": 1.1958840047718951e-08, "grad_condition": 1281589470.9369996, "lr": 1.7535703752478133e-06, "time_sec": 49.663915157318115 }, { "epoch": 147, "train_loss": 1.3165813917160034, "train_acc": 0.62328, "test_loss": 9.630343141174317, "test_acc": 0.0889, "lyapunov": null, "grad_norm": 0.6474798234673506, "grad_max_sv": 0.22821973785758018, "grad_min_sv": 1.1936759166872312e-08, "grad_condition": 467313215.8090695, "lr": 9.866357858642196e-07, "time_sec": 49.623547077178955 }, { "epoch": 148, "train_loss": 1.3181095361328126, "train_acc": 0.61742, "test_loss": 10.228155642700195, "test_acc": 0.0788, "lyapunov": null, "grad_norm": 0.6510409626330189, "grad_max_sv": 0.23130737692117692, "grad_min_sv": 1.1935725464928826e-08, "grad_condition": 55668871.204657175, "lr": 4.38584950570808e-07, "time_sec": 49.621832609176636 }, { "epoch": 149, "train_loss": 1.31113261013031, "train_acc": 0.6221, "test_loss": 9.91230221786499, "test_acc": 0.0822, "lyapunov": null, "grad_norm": 0.6472982694090295, "grad_max_sv": 0.2277739927172661, "grad_min_sv": 1.1845563784029788e-08, "grad_condition": 25904808.412874807, "lr": 1.096582625772501e-07, "time_sec": 49.62464380264282 }, { "epoch": 150, "train_loss": 1.3088498344039916, "train_acc": 0.62396, "test_loss": 9.814052784729004, "test_acc": 0.0858, "lyapunov": null, "grad_norm": 0.6471687901699209, "grad_max_sv": 0.23137033209204674, "grad_min_sv": 1.2163310093502022e-08, "grad_condition": 48891964.404683754, "lr": 0.0, "time_sec": 49.660566329956055 } ], "16": [ { "epoch": 1, "train_loss": 5.089254416656495, "train_acc": 0.01344, "test_loss": 4.870831555175781, "test_acc": 0.01, "lyapunov": null, "grad_norm": 5.582063459208639, "grad_max_sv": 5.0306542873382565, "grad_min_sv": 8.441757832766683e-08, "grad_condition": 74707534.78681344, "lr": 0.0009998903417374227, "time_sec": 66.70783400535583 }, { "epoch": 2, "train_loss": 4.736304296569824, "train_acc": 0.02172, "test_loss": 4.92340059890747, "test_acc": 0.01, "lyapunov": null, "grad_norm": 4.087296772772229, "grad_max_sv": 3.672157108783722, "grad_min_sv": 6.109624839933935e-08, "grad_condition": 230714811.36310124, "lr": 0.0009995614150494292, "time_sec": 66.69390416145325 }, { "epoch": 3, "train_loss": 4.52685978515625, "train_acc": 0.03204, "test_loss": 5.045831031799317, "test_acc": 0.0094, "lyapunov": null, "grad_norm": 3.1470044543912175, "grad_max_sv": 2.6447540044784548, "grad_min_sv": 4.639755384339139e-08, "grad_condition": 65625701.84585605, "lr": 0.0009990133642141358, "time_sec": 66.70076084136963 }, { "epoch": 4, "train_loss": 4.371717319641113, "train_acc": 0.04112, "test_loss": 4.993129699707032, "test_acc": 0.0115, "lyapunov": null, "grad_norm": 2.5123688948843395, "grad_max_sv": 2.1027904629707335, "grad_min_sv": 3.615837387664633e-08, "grad_condition": 418817692.03399765, "lr": 0.0009982464296247522, "time_sec": 66.71976566314697 }, { "epoch": 5, "train_loss": 4.27407361251831, "train_acc": 0.0488, "test_loss": 5.161634465789795, "test_acc": 0.0119, "lyapunov": null, "grad_norm": 1.9573801826064445, "grad_max_sv": 1.613087645173073, "grad_min_sv": 2.8529539808364034e-08, "grad_condition": 62747668.20627429, "lr": 0.0009972609476841367, "time_sec": 66.74850869178772 }, { "epoch": 6, "train_loss": 4.183251854553222, "train_acc": 0.05812, "test_loss": 5.447854755401611, "test_acc": 0.0093, "lyapunov": null, "grad_norm": 1.436449079599314, "grad_max_sv": 1.0459295481443405, "grad_min_sv": 2.0654144772258576e-08, "grad_condition": 94732574.16372415, "lr": 0.000996057350657239, "time_sec": 66.69263577461243 }, { "epoch": 7, "train_loss": 4.103355536193848, "train_acc": 0.06872, "test_loss": 5.544150679016114, "test_acc": 0.0124, "lyapunov": null, "grad_norm": 1.082624040556548, "grad_max_sv": 0.678101472556591, "grad_min_sv": 1.6660088839048904e-08, "grad_condition": 49338508.46283151, "lr": 0.000994636166481494, "time_sec": 66.69370245933533 }, { "epoch": 8, "train_loss": 4.040529095458984, "train_acc": 0.07876, "test_loss": 5.577163777160645, "test_acc": 0.0172, "lyapunov": null, "grad_norm": 0.963869121683512, "grad_max_sv": 0.5578698106110096, "grad_min_sv": 1.4817374840991882e-08, "grad_condition": 46172185.25999212, "lr": 0.0009929980185352525, "time_sec": 66.70931386947632 }, { "epoch": 9, "train_loss": 3.999490645446777, "train_acc": 0.0856, "test_loss": 5.472281336975097, "test_acc": 0.0116, "lyapunov": null, "grad_norm": 0.9198022107734598, "grad_max_sv": 0.5003849364817142, "grad_min_sv": 1.3862486752946878e-08, "grad_condition": 137028895.09887612, "lr": 0.0009911436253643444, "time_sec": 66.70475840568542 }, { "epoch": 10, "train_loss": 3.9641557629394533, "train_acc": 0.09124, "test_loss": 5.43024553604126, "test_acc": 0.0112, "lyapunov": null, "grad_norm": 0.8539816540258655, "grad_max_sv": 0.4397390566766262, "grad_min_sv": 1.3177782898221579e-08, "grad_condition": 50953468.3517745, "lr": 0.0009890738003669028, "time_sec": 66.75189590454102 }, { "epoch": 11, "train_loss": 3.912582547149658, "train_acc": 0.09724, "test_loss": 5.977069612121582, "test_acc": 0.0115, "lyapunov": null, "grad_norm": 0.8304366482521061, "grad_max_sv": 0.4253105387091637, "grad_min_sv": 1.2851445623657253e-08, "grad_condition": 192581837.7575304, "lr": 0.00098678945143658, "time_sec": 66.72230935096741 }, { "epoch": 12, "train_loss": 3.885940095291138, "train_acc": 0.10388, "test_loss": 5.707202329254151, "test_acc": 0.0161, "lyapunov": null, "grad_norm": 0.7930567752358824, "grad_max_sv": 0.3784016497433186, "grad_min_sv": 1.2496499026196095e-08, "grad_condition": 121475679.84002523, "lr": 0.0009842915805643154, "time_sec": 66.80430769920349 }, { "epoch": 13, "train_loss": 3.848949595184326, "train_acc": 0.10982, "test_loss": 5.604932201385498, "test_acc": 0.0138, "lyapunov": null, "grad_norm": 0.7694655756397059, "grad_max_sv": 0.36012797653675077, "grad_min_sv": 1.2309415998654205e-08, "grad_condition": 96913763.80192877, "lr": 0.000981581283398829, "time_sec": 66.77498316764832 }, { "epoch": 14, "train_loss": 3.822469270477295, "train_acc": 0.11176, "test_loss": 5.5594536964416505, "test_acc": 0.0144, "lyapunov": null, "grad_norm": 0.751737952115685, "grad_max_sv": 0.34815125875175, "grad_min_sv": 1.1860258068707719e-08, "grad_condition": 63821387.65591574, "lr": 0.0009786597487660333, "time_sec": 66.78450131416321 }, { "epoch": 15, "train_loss": 3.8008637019348144, "train_acc": 0.11732, "test_loss": 5.8510744079589845, "test_acc": 0.0165, "lyapunov": null, "grad_norm": 0.7274896957635634, "grad_max_sv": 0.3341310672461987, "grad_min_sv": 1.185839371142805e-08, "grad_condition": 51068114.03076443, "lr": 0.0009755282581475766, "time_sec": 66.75975847244263 }, { "epoch": 16, "train_loss": 3.7793116706085206, "train_acc": 0.12078, "test_loss": 6.094802139282226, "test_acc": 0.0135, "lyapunov": null, "grad_norm": 0.7029997372387793, "grad_max_sv": 0.31635181941092017, "grad_min_sv": 1.1313535006052256e-08, "grad_condition": 34061221.316739336, "lr": 0.0009721881851187403, "time_sec": 66.70034837722778 }, { "epoch": 17, "train_loss": 3.756349168548584, "train_acc": 0.12318, "test_loss": 6.524116158294678, "test_acc": 0.0149, "lyapunov": null, "grad_norm": 0.6891476510098721, "grad_max_sv": 0.30746029056608676, "grad_min_sv": 1.1205093228272567e-08, "grad_condition": 55101632.74828547, "lr": 0.0009686409947459456, "time_sec": 66.70887970924377 }, { "epoch": 18, "train_loss": 3.736860103225708, "train_acc": 0.12666, "test_loss": 6.334092637634277, "test_acc": 0.0151, "lyapunov": null, "grad_norm": 0.6735913591792417, "grad_max_sv": 0.3038469754159451, "grad_min_sv": 1.1184529693109707e-08, "grad_condition": 266599149.22808576, "lr": 0.0009648882429441254, "time_sec": 66.7028694152832 }, { "epoch": 19, "train_loss": 3.721009854812622, "train_acc": 0.13104, "test_loss": 6.503785885620117, "test_acc": 0.0158, "lyapunov": null, "grad_norm": 0.6543898752326373, "grad_max_sv": 0.2952485930174589, "grad_min_sv": 1.0702305973386839e-08, "grad_condition": 36178987.94815246, "lr": 0.00096093157579425, "time_sec": 66.91662836074829 }, { "epoch": 20, "train_loss": 3.6978233711242674, "train_acc": 0.13484, "test_loss": 7.133095213317871, "test_acc": 0.014, "lyapunov": null, "grad_norm": 0.6416047326169007, "grad_max_sv": 0.2835653819143772, "grad_min_sv": 1.061290202941656e-08, "grad_condition": 29580333.508830875, "lr": 0.0009567727288213001, "time_sec": 66.7187888622284 }, { "epoch": 21, "train_loss": 3.678186371612549, "train_acc": 0.13804, "test_loss": 6.526899772644043, "test_acc": 0.0165, "lyapunov": null, "grad_norm": 0.6346445495636812, "grad_max_sv": 0.2758004698902369, "grad_min_sv": 1.0650165743059103e-08, "grad_condition": 50339413.533409506, "lr": 0.0009524135262330095, "time_sec": 66.77347826957703 }, { "epoch": 22, "train_loss": 3.6615531184387207, "train_acc": 0.13652, "test_loss": 7.463528224182129, "test_acc": 0.0149, "lyapunov": null, "grad_norm": 0.6211761686754148, "grad_max_sv": 0.2590024430304766, "grad_min_sv": 1.0093259970866963e-08, "grad_condition": 54350139.527433194, "lr": 0.0009478558801197061, "time_sec": 66.74172306060791 }, { "epoch": 23, "train_loss": 3.646244419708252, "train_acc": 0.14018, "test_loss": 7.247557836151123, "test_acc": 0.0133, "lyapunov": null, "grad_norm": 0.6087560504487702, "grad_max_sv": 0.26471212282776835, "grad_min_sv": 1.0175153231789525e-08, "grad_condition": 76037868.51400027, "lr": 0.000943101789615607, "time_sec": 66.74379682540894 }, { "epoch": 24, "train_loss": 3.6286012983703615, "train_acc": 0.14502, "test_loss": 7.168135193634034, "test_acc": 0.0191, "lyapunov": null, "grad_norm": 0.5998778506859267, "grad_max_sv": 0.24980814158916473, "grad_min_sv": 1.0037150326158706e-08, "grad_condition": 32920800.60529256, "lr": 0.0009381533400219313, "time_sec": 66.68860864639282 }, { "epoch": 25, "train_loss": 3.6192829264831543, "train_acc": 0.14634, "test_loss": 7.535636337280273, "test_acc": 0.0161, "lyapunov": null, "grad_norm": 0.5983012708829252, "grad_max_sv": 0.2530865453183651, "grad_min_sv": 9.982956203358206e-09, "grad_condition": 29219670.862144046, "lr": 0.0009330127018922189, "time_sec": 66.75418090820312 }, { "epoch": 26, "train_loss": 3.6001767744445803, "train_acc": 0.1487, "test_loss": 6.850593623352051, "test_acc": 0.0151, "lyapunov": null, "grad_norm": 0.5947140415117098, "grad_max_sv": 0.24490244090557098, "grad_min_sv": 9.946103620567249e-09, "grad_condition": 94915701.68580723, "lr": 0.000927682130080253, "time_sec": 66.72897815704346 }, { "epoch": 27, "train_loss": 3.5885346211242677, "train_acc": 0.15218, "test_loss": 7.121657147216797, "test_acc": 0.0175, "lyapunov": null, "grad_norm": 0.5825348653665754, "grad_max_sv": 0.2360658310353756, "grad_min_sv": 9.758478072829923e-09, "grad_condition": 28325624.288454544, "lr": 0.0009221639627510072, "time_sec": 66.82140755653381 }, { "epoch": 28, "train_loss": 3.5699786253356933, "train_acc": 0.15318, "test_loss": 7.339261558532715, "test_acc": 0.0157, "lyapunov": null, "grad_norm": 0.5731165313342855, "grad_max_sv": 0.23213129304349422, "grad_min_sv": 9.869128861361709e-09, "grad_condition": 27851276.279406942, "lr": 0.0009164606203550494, "time_sec": 66.72496843338013 }, { "epoch": 29, "train_loss": 3.562197733078003, "train_acc": 0.15604, "test_loss": 7.580322309875489, "test_acc": 0.0165, "lyapunov": null, "grad_norm": 0.5656101207986921, "grad_max_sv": 0.21968504451215268, "grad_min_sv": 9.579083420918621e-09, "grad_condition": 25012099.962059125, "lr": 0.0009105746045668516, "time_sec": 66.69681811332703 }, { "epoch": 30, "train_loss": 3.560017660369873, "train_acc": 0.15662, "test_loss": 7.44054066619873, "test_acc": 0.0173, "lyapunov": null, "grad_norm": 0.5599580597173339, "grad_max_sv": 0.2209590796381235, "grad_min_sv": 9.39374856998021e-09, "grad_condition": 61658396.11314602, "lr": 0.0009045084971874733, "time_sec": 66.69601655006409 }, { "epoch": 31, "train_loss": 3.5422336725616455, "train_acc": 0.1599, "test_loss": 7.076059481048584, "test_acc": 0.0198, "lyapunov": null, "grad_norm": 0.5515859229373342, "grad_max_sv": 0.21789075396955013, "grad_min_sv": 9.395337015327687e-09, "grad_condition": 33141907.468724538, "lr": 0.0008982649590120977, "time_sec": 66.75024151802063 }, { "epoch": 32, "train_loss": 3.529042202835083, "train_acc": 0.15972, "test_loss": 7.7532018966674805, "test_acc": 0.0155, "lyapunov": null, "grad_norm": 0.5497951397745081, "grad_max_sv": 0.20885453820228578, "grad_min_sv": 9.25596560404085e-09, "grad_condition": 82473516.26766083, "lr": 0.0008918467286629196, "time_sec": 66.80956888198853 }, { "epoch": 33, "train_loss": 3.51621552734375, "train_acc": 0.1644, "test_loss": 6.8358760055542, "test_acc": 0.0194, "lyapunov": null, "grad_norm": 0.5469890700179638, "grad_max_sv": 0.21847443841397762, "grad_min_sv": 9.440127946014343e-09, "grad_condition": 25421324.334352963, "lr": 0.0008852566213878943, "time_sec": 66.7693350315094 }, { "epoch": 34, "train_loss": 3.5162335932922364, "train_acc": 0.16484, "test_loss": 6.398185224914551, "test_acc": 0.0185, "lyapunov": null, "grad_norm": 0.5383581492940669, "grad_max_sv": 0.20689108446240426, "grad_min_sv": 9.233877815151281e-09, "grad_condition": 27064375.409329318, "lr": 0.000878497527825878, "time_sec": 66.79785513877869 }, { "epoch": 35, "train_loss": 3.5035785108184814, "train_acc": 0.16536, "test_loss": 7.335230517578125, "test_acc": 0.0195, "lyapunov": null, "grad_norm": 0.5402027402758915, "grad_max_sv": 0.20682688914239405, "grad_min_sv": 9.348574800394082e-09, "grad_condition": 28438563.468850803, "lr": 0.000871572412738697, "time_sec": 66.81045579910278 }, { "epoch": 36, "train_loss": 3.493286726074219, "train_acc": 0.16834, "test_loss": 6.502911682128906, "test_acc": 0.0259, "lyapunov": null, "grad_norm": 0.5280034242832364, "grad_max_sv": 0.19797059781849385, "grad_min_sv": 9.105119513908022e-09, "grad_condition": 25415325.485806335, "lr": 0.0008644843137107055, "time_sec": 66.76097869873047 }, { "epoch": 37, "train_loss": 3.4780256481933596, "train_acc": 0.1702, "test_loss": 7.499637036132812, "test_acc": 0.0188, "lyapunov": null, "grad_norm": 0.5321877448382957, "grad_max_sv": 0.19945566728711128, "grad_min_sv": 9.11805770470453e-09, "grad_condition": 72290792.90222318, "lr": 0.0008572363398164014, "time_sec": 66.87902355194092 }, { "epoch": 38, "train_loss": 3.4674857460021973, "train_acc": 0.17068, "test_loss": 6.972921762847901, "test_acc": 0.0224, "lyapunov": null, "grad_norm": 0.5289491654487876, "grad_max_sv": 0.19467646181583403, "grad_min_sv": 9.052938640397023e-09, "grad_condition": 27977910.49401158, "lr": 0.0008498316702566826, "time_sec": 66.71038794517517 }, { "epoch": 39, "train_loss": 3.456567892379761, "train_acc": 0.1718, "test_loss": 7.583123879241944, "test_acc": 0.0204, "lyapunov": null, "grad_norm": 0.5257287769620685, "grad_max_sv": 0.19668871462345122, "grad_min_sv": 9.095625710942024e-09, "grad_condition": 27660923.67992892, "lr": 0.0008422735529643442, "time_sec": 66.70259189605713 }, { "epoch": 40, "train_loss": 3.439600283050537, "train_acc": 0.17702, "test_loss": 7.07623366394043, "test_acc": 0.0194, "lyapunov": null, "grad_norm": 0.5218212705616453, "grad_max_sv": 0.19257443137466906, "grad_min_sv": 8.974160192742886e-09, "grad_condition": 24645717.0349477, "lr": 0.0008345653031794289, "time_sec": 66.69467544555664 }, { "epoch": 41, "train_loss": 3.441303518218994, "train_acc": 0.17488, "test_loss": 7.0255078727722164, "test_acc": 0.0229, "lyapunov": null, "grad_norm": 0.51868028277477, "grad_max_sv": 0.19331826008856295, "grad_min_sv": 9.044294972671008e-09, "grad_condition": 26826321.000719573, "lr": 0.0008267103019950526, "time_sec": 66.69299244880676 }, { "epoch": 42, "train_loss": 3.4292957513427735, "train_acc": 0.17452, "test_loss": 7.204381840515136, "test_acc": 0.0259, "lyapunov": null, "grad_norm": 0.5253643254473546, "grad_max_sv": 0.19751012995839118, "grad_min_sv": 9.221263796987956e-09, "grad_condition": 24125885.16929126, "lr": 0.0008187119948743447, "time_sec": 66.71035814285278 }, { "epoch": 43, "train_loss": 3.4281089696502685, "train_acc": 0.17694, "test_loss": 7.537664138793946, "test_acc": 0.0211, "lyapunov": null, "grad_norm": 0.5194108534896916, "grad_max_sv": 0.2011748518794775, "grad_min_sv": 9.108393971002382e-09, "grad_condition": 44095500.51692389, "lr": 0.000810573890139155, "time_sec": 66.8431122303009 }, { "epoch": 44, "train_loss": 3.4221175812530515, "train_acc": 0.1796, "test_loss": 7.407726572418213, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.5178702018876962, "grad_max_sv": 0.19308201856911184, "grad_min_sv": 9.019754657058065e-09, "grad_condition": 26647196.819321267, "lr": 0.0008022995574311873, "time_sec": 66.78941011428833 }, { "epoch": 45, "train_loss": 3.400263899459839, "train_acc": 0.18424, "test_loss": 6.749155438232422, "test_acc": 0.0251, "lyapunov": null, "grad_norm": 0.518187566195941, "grad_max_sv": 0.18997054174542427, "grad_min_sv": 8.950063522597528e-09, "grad_condition": 64164305.6683145, "lr": 0.0007938926261462363, "time_sec": 66.72000646591187 }, { "epoch": 46, "train_loss": 3.395167677078247, "train_acc": 0.18308, "test_loss": 6.933445383453369, "test_acc": 0.0219, "lyapunov": null, "grad_norm": 0.5105878399725617, "grad_max_sv": 0.18559869714081287, "grad_min_sv": 8.806649112215459e-09, "grad_condition": 120544633.7455566, "lr": 0.0007853567838422158, "time_sec": 66.71739363670349 }, { "epoch": 47, "train_loss": 3.3893753800964355, "train_acc": 0.18392, "test_loss": 7.526408071899414, "test_acc": 0.0222, "lyapunov": null, "grad_norm": 0.5062040296706847, "grad_max_sv": 0.18082244805991649, "grad_min_sv": 8.976306442587401e-09, "grad_condition": 29608816.90495221, "lr": 0.0007766957746216719, "time_sec": 66.72174620628357 }, { "epoch": 48, "train_loss": 3.3721413567352294, "train_acc": 0.18658, "test_loss": 6.825230180358886, "test_acc": 0.0242, "lyapunov": null, "grad_norm": 0.5095470173179549, "grad_max_sv": 0.18853078819811345, "grad_min_sv": 8.948983057366356e-09, "grad_condition": 26865035.338588893, "lr": 0.0007679133974894982, "time_sec": 66.80622148513794 }, { "epoch": 49, "train_loss": 3.3716752050018313, "train_acc": 0.18754, "test_loss": 7.223709740447998, "test_acc": 0.0303, "lyapunov": null, "grad_norm": 0.5066211171288654, "grad_max_sv": 0.1869507610797882, "grad_min_sv": 8.992035052668434e-09, "grad_condition": 23283441.10076283, "lr": 0.000759013504686565, "time_sec": 66.81845688819885 }, { "epoch": 50, "train_loss": 3.3587275280761717, "train_acc": 0.19086, "test_loss": 6.7569826782226565, "test_acc": 0.0243, "lyapunov": null, "grad_norm": 0.506317038211902, "grad_max_sv": 0.18107994161546231, "grad_min_sv": 8.999141074342299e-09, "grad_condition": 200538246.60999444, "lr": 0.0007499999999999998, "time_sec": 66.70761036872864 }, { "epoch": 51, "train_loss": 3.3526639527130127, "train_acc": 0.19188, "test_loss": 6.670795946502685, "test_acc": 0.0283, "lyapunov": null, "grad_norm": 0.5023637852793532, "grad_max_sv": 0.1799766130745411, "grad_min_sv": 9.005793131719453e-09, "grad_condition": 60303250.12300022, "lr": 0.0007408768370508575, "time_sec": 66.8078305721283 }, { "epoch": 52, "train_loss": 3.3506644287872316, "train_acc": 0.19068, "test_loss": 7.382517870330811, "test_acc": 0.022, "lyapunov": null, "grad_norm": 0.49959851459507565, "grad_max_sv": 0.17121989093720913, "grad_min_sv": 8.849344752120958e-09, "grad_condition": 34334249.77637265, "lr": 0.0007316480175599307, "time_sec": 66.78811454772949 }, { "epoch": 53, "train_loss": 3.3417568744659425, "train_acc": 0.19254, "test_loss": 8.142177056884766, "test_acc": 0.0233, "lyapunov": null, "grad_norm": 0.4981274188163727, "grad_max_sv": 0.17399160973727704, "grad_min_sv": 8.837567241903877e-09, "grad_condition": 24739202.69426199, "lr": 0.0007223175895924635, "time_sec": 66.85724830627441 }, { "epoch": 54, "train_loss": 3.3355814123535157, "train_acc": 0.1957, "test_loss": 6.92948182220459, "test_acc": 0.0248, "lyapunov": null, "grad_norm": 0.49764414817443375, "grad_max_sv": 0.17371546551585199, "grad_min_sv": 8.84867411088744e-09, "grad_condition": 150304225.8365222, "lr": 0.0007128896457825361, "time_sec": 66.71973633766174 }, { "epoch": 55, "train_loss": 3.326216081542969, "train_acc": 0.19418, "test_loss": 7.809853678131104, "test_acc": 0.023, "lyapunov": null, "grad_norm": 0.4993878218606792, "grad_max_sv": 0.17109079472720623, "grad_min_sv": 8.849828239676505e-09, "grad_condition": 22057140.335132368, "lr": 0.0007033683215378998, "time_sec": 66.97141337394714 }, { "epoch": 56, "train_loss": 3.319088702545166, "train_acc": 0.19614, "test_loss": 7.596286960601807, "test_acc": 0.0212, "lyapunov": null, "grad_norm": 0.49667047439168693, "grad_max_sv": 0.16795397438108922, "grad_min_sv": 8.856667624290716e-09, "grad_condition": 21032117.189596005, "lr": 0.0006937577932260512, "time_sec": 66.70526051521301 }, { "epoch": 57, "train_loss": 3.303804122848511, "train_acc": 0.19878, "test_loss": 7.291678775024414, "test_acc": 0.02, "lyapunov": null, "grad_norm": 0.499572780086862, "grad_max_sv": 0.17316541597247123, "grad_min_sv": 8.944026716473098e-09, "grad_condition": 23580602.560242586, "lr": 0.0006840622763423388, "time_sec": 66.72219276428223 }, { "epoch": 58, "train_loss": 3.2961739293670655, "train_acc": 0.20036, "test_loss": 7.379423007202148, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.49780422530713136, "grad_max_sv": 0.17306868806481362, "grad_min_sv": 8.897491003689862e-09, "grad_condition": 33645085.03834008, "lr": 0.0006742860236609073, "time_sec": 66.7072229385376 }, { "epoch": 59, "train_loss": 3.292852275466919, "train_acc": 0.20314, "test_loss": 6.699318830871582, "test_acc": 0.0262, "lyapunov": null, "grad_norm": 0.49686323718116887, "grad_max_sv": 0.17558623403310775, "grad_min_sv": 8.761962172476601e-09, "grad_condition": 38386994.848281495, "lr": 0.0006644333233692913, "time_sec": 66.72137403488159 }, { "epoch": 60, "train_loss": 3.2881739818573, "train_acc": 0.20208, "test_loss": 6.617448914337158, "test_acc": 0.0235, "lyapunov": null, "grad_norm": 0.4972800368236651, "grad_max_sv": 0.17418485544621945, "grad_min_sv": 8.887109359534406e-09, "grad_condition": 23772781.473704576, "lr": 0.0006545084971874734, "time_sec": 66.76340699195862 }, { "epoch": 61, "train_loss": 3.2832211613464355, "train_acc": 0.20396, "test_loss": 7.8168681640625, "test_acc": 0.0196, "lyapunov": null, "grad_norm": 0.49347264852603, "grad_max_sv": 0.16998312883079053, "grad_min_sv": 8.87461152343505e-09, "grad_condition": 22196538.972435523, "lr": 0.0006445158984722354, "time_sec": 66.69128584861755 }, { "epoch": 62, "train_loss": 3.267657317352295, "train_acc": 0.20602, "test_loss": 6.787965573120117, "test_acc": 0.0226, "lyapunov": null, "grad_norm": 0.4942819436191628, "grad_max_sv": 0.1665095403790474, "grad_min_sv": 8.805719026172553e-09, "grad_condition": 21888086.61137065, "lr": 0.0006344599103076324, "time_sec": 66.72603845596313 }, { "epoch": 63, "train_loss": 3.264744351043701, "train_acc": 0.20522, "test_loss": 7.947964939117432, "test_acc": 0.0218, "lyapunov": null, "grad_norm": 0.49153660537625127, "grad_max_sv": 0.16237439326941966, "grad_min_sv": 8.742884187451505e-09, "grad_condition": 23911997.384101003, "lr": 0.0006243449435824269, "time_sec": 66.6943769454956 }, { "epoch": 64, "train_loss": 3.2640425563812254, "train_acc": 0.20452, "test_loss": 7.12151423034668, "test_acc": 0.0256, "lyapunov": null, "grad_norm": 0.49384434943361655, "grad_max_sv": 0.168024880066514, "grad_min_sv": 8.758979427869739e-09, "grad_condition": 21739668.66096285, "lr": 0.0006141754350553275, "time_sec": 66.69389152526855 }, { "epoch": 65, "train_loss": 3.244006223831177, "train_acc": 0.21052, "test_loss": 7.017924461364746, "test_acc": 0.0234, "lyapunov": null, "grad_norm": 0.49421653603545956, "grad_max_sv": 0.1682070516049862, "grad_min_sv": 8.867816919666538e-09, "grad_condition": 33570918.978102654, "lr": 0.0006039558454088793, "time_sec": 66.70642900466919 }, { "epoch": 66, "train_loss": 3.2429666870880127, "train_acc": 0.2095, "test_loss": 7.507377795410156, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.4920675755358138, "grad_max_sv": 0.16653703041374684, "grad_min_sv": 8.782905018545061e-09, "grad_condition": 33037433.310028076, "lr": 0.000593690657292862, "time_sec": 66.69945740699768 }, { "epoch": 67, "train_loss": 3.235812818222046, "train_acc": 0.21004, "test_loss": 8.179235096740722, "test_acc": 0.0199, "lyapunov": null, "grad_norm": 0.49143560072681164, "grad_max_sv": 0.16453767009079456, "grad_min_sv": 8.906316832646422e-09, "grad_condition": 24459655.594651837, "lr": 0.0005833843733580507, "time_sec": 66.68722915649414 }, { "epoch": 68, "train_loss": 3.2230448572540285, "train_acc": 0.21154, "test_loss": 7.499305305480957, "test_acc": 0.0213, "lyapunov": null, "grad_norm": 0.49248528868620167, "grad_max_sv": 0.16838400289416314, "grad_min_sv": 8.870841536334773e-09, "grad_condition": 21419108.58487917, "lr": 0.0005730415142812054, "time_sec": 66.70680451393127 }, { "epoch": 69, "train_loss": 3.2205778658294677, "train_acc": 0.21464, "test_loss": 7.50203574142456, "test_acc": 0.0244, "lyapunov": null, "grad_norm": 0.4909914070718711, "grad_max_sv": 0.1646382961422205, "grad_min_sv": 8.7063952491917e-09, "grad_condition": 22220196.366961446, "lr": 0.0005626666167821517, "time_sec": 66.76639890670776 }, { "epoch": 70, "train_loss": 3.207180488128662, "train_acc": 0.21516, "test_loss": 7.001610806274414, "test_acc": 0.0258, "lyapunov": null, "grad_norm": 0.495424727651562, "grad_max_sv": 0.16553561352193355, "grad_min_sv": 8.972080669383819e-09, "grad_condition": 47422658.54318248, "lr": 0.0005522642316338265, "time_sec": 66.70834302902222 }, { "epoch": 71, "train_loss": 3.2062013800048828, "train_acc": 0.21612, "test_loss": 6.927703591156006, "test_acc": 0.0308, "lyapunov": null, "grad_norm": 0.49114896439763267, "grad_max_sv": 0.16479650065302848, "grad_min_sv": 8.813466856327778e-09, "grad_condition": 43207807.33314108, "lr": 0.0005418389216661573, "time_sec": 66.71610283851624 }, { "epoch": 72, "train_loss": 3.1919854682922364, "train_acc": 0.21694, "test_loss": 6.498612490844726, "test_acc": 0.0294, "lyapunov": null, "grad_norm": 0.49506236999909303, "grad_max_sv": 0.16502842903137208, "grad_min_sv": 8.951233382292757e-09, "grad_condition": 20833946.329851203, "lr": 0.0005313952597646563, "time_sec": 66.70564031600952 }, { "epoch": 73, "train_loss": 3.19263421005249, "train_acc": 0.22014, "test_loss": 7.917480190277099, "test_acc": 0.0215, "lyapunov": null, "grad_norm": 0.4934923943021254, "grad_max_sv": 0.1658387891948223, "grad_min_sv": 8.915270069409509e-09, "grad_condition": 23230788.976801574, "lr": 0.0005209378268645994, "time_sec": 66.77329587936401 }, { "epoch": 74, "train_loss": 3.185640338821411, "train_acc": 0.21906, "test_loss": 7.357819847106933, "test_acc": 0.0252, "lyapunov": null, "grad_norm": 0.4911097758269761, "grad_max_sv": 0.16611208710819483, "grad_min_sv": 8.851672780169073e-09, "grad_condition": 58442839.12499788, "lr": 0.0005104712099416781, "time_sec": 66.684730052948 }, { "epoch": 75, "train_loss": 3.1690349718475344, "train_acc": 0.2239, "test_loss": 7.2397661224365235, "test_acc": 0.0256, "lyapunov": null, "grad_norm": 0.4906690124125115, "grad_max_sv": 0.16415953114628792, "grad_min_sv": 8.816434821090625e-09, "grad_condition": 20409708.15696338, "lr": 0.0004999999999999996, "time_sec": 66.71101260185242 }, { "epoch": 76, "train_loss": 3.1630740728759767, "train_acc": 0.2228, "test_loss": 7.3856810913085935, "test_acc": 0.0247, "lyapunov": null, "grad_norm": 0.4942494495158576, "grad_max_sv": 0.16416314020752906, "grad_min_sv": 8.881746908773192e-09, "grad_condition": 22916920.692442246, "lr": 0.0004895287900583212, "time_sec": 66.72276592254639 }, { "epoch": 77, "train_loss": 3.157883042678833, "train_acc": 0.2226, "test_loss": 7.461940403747558, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.48944835890506283, "grad_max_sv": 0.16295542381703854, "grad_min_sv": 8.790652895884766e-09, "grad_condition": 25190467.13440006, "lr": 0.0004790621731353997, "time_sec": 66.73238253593445 }, { "epoch": 78, "train_loss": 3.15415998550415, "train_acc": 0.2232, "test_loss": 7.546776051330567, "test_acc": 0.027, "lyapunov": null, "grad_norm": 0.48925024138964845, "grad_max_sv": 0.1628365319222212, "grad_min_sv": 8.811498453109578e-09, "grad_condition": 23075857.06663191, "lr": 0.000468604740235343, "time_sec": 66.73092246055603 }, { "epoch": 79, "train_loss": 3.1458859318542483, "train_acc": 0.22802, "test_loss": 7.108101511383056, "test_acc": 0.0285, "lyapunov": null, "grad_norm": 0.495366871838511, "grad_max_sv": 0.1650368317961693, "grad_min_sv": 9.025954333247154e-09, "grad_condition": 38457801.29496137, "lr": 0.00045816107833384175, "time_sec": 66.74371480941772 }, { "epoch": 80, "train_loss": 3.140154826583862, "train_acc": 0.2266, "test_loss": 7.284811801147461, "test_acc": 0.0302, "lyapunov": null, "grad_norm": 0.4914271153786783, "grad_max_sv": 0.16505839116871357, "grad_min_sv": 8.893962011443865e-09, "grad_condition": 369021517.7075845, "lr": 0.0004477357683661729, "time_sec": 66.69183111190796 }, { "epoch": 81, "train_loss": 3.1333287098693847, "train_acc": 0.22694, "test_loss": 7.571458190917968, "test_acc": 0.0209, "lyapunov": null, "grad_norm": 0.494073529942036, "grad_max_sv": 0.1608546230942011, "grad_min_sv": 9.091243879932875e-09, "grad_condition": 20891716.667523753, "lr": 0.00043733338321784746, "time_sec": 66.71526265144348 }, { "epoch": 82, "train_loss": 3.1283695087432863, "train_acc": 0.23006, "test_loss": 7.788016625976563, "test_acc": 0.024, "lyapunov": null, "grad_norm": 0.49129892073668435, "grad_max_sv": 0.16086806021630765, "grad_min_sv": 8.920912475049448e-09, "grad_condition": 47898591.96295839, "lr": 0.0004269584857187939, "time_sec": 66.69153666496277 }, { "epoch": 83, "train_loss": 3.130916413574219, "train_acc": 0.23138, "test_loss": 7.913901668548584, "test_acc": 0.0261, "lyapunov": null, "grad_norm": 0.48912391484879925, "grad_max_sv": 0.16135921962559224, "grad_min_sv": 9.076431696855569e-09, "grad_condition": 50854672.26653309, "lr": 0.0004166156266419484, "time_sec": 66.75194883346558 }, { "epoch": 84, "train_loss": 3.116759624481201, "train_acc": 0.22928, "test_loss": 7.443206707763672, "test_acc": 0.0267, "lyapunov": null, "grad_norm": 0.49216768079497325, "grad_max_sv": 0.16190627813339234, "grad_min_sv": 9.013408105995602e-09, "grad_condition": 22062192.06550083, "lr": 0.0004063093427071373, "time_sec": 66.76291751861572 }, { "epoch": 85, "train_loss": 3.1119228192138673, "train_acc": 0.23272, "test_loss": 7.789751325988769, "test_acc": 0.028, "lyapunov": null, "grad_norm": 0.4906237938270759, "grad_max_sv": 0.16028195321559907, "grad_min_sv": 8.904607010085108e-09, "grad_condition": 21362215.652891032, "lr": 0.0003960441545911199, "time_sec": 66.72702622413635 }, { "epoch": 86, "train_loss": 3.095892171173096, "train_acc": 0.23322, "test_loss": 7.520130683135986, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.49558582555905584, "grad_max_sv": 0.15913640297949314, "grad_min_sv": 9.008386794850943e-09, "grad_condition": 19711267.83894111, "lr": 0.0003858245649446718, "time_sec": 66.69949555397034 }, { "epoch": 87, "train_loss": 3.0982225965118406, "train_acc": 0.23538, "test_loss": 7.958539725494385, "test_acc": 0.0227, "lyapunov": null, "grad_norm": 0.4928264723148802, "grad_max_sv": 0.16157768219709395, "grad_min_sv": 9.009624502009927e-09, "grad_condition": 22513594.923468076, "lr": 0.00037565505641757235, "time_sec": 66.7021861076355 }, { "epoch": 88, "train_loss": 3.0881566471099853, "train_acc": 0.23704, "test_loss": 7.651519326782227, "test_acc": 0.0317, "lyapunov": null, "grad_norm": 0.4925350840337203, "grad_max_sv": 0.16133950129151345, "grad_min_sv": 8.917141037720344e-09, "grad_condition": 46990788.85548556, "lr": 0.00036554008969236695, "time_sec": 66.71680331230164 }, { "epoch": 89, "train_loss": 3.0752701135253906, "train_acc": 0.24002, "test_loss": 8.03997054977417, "test_acc": 0.0266, "lyapunov": null, "grad_norm": 0.49191590245060596, "grad_max_sv": 0.16232036016881465, "grad_min_sv": 8.918097575694173e-09, "grad_condition": 40862815.39075501, "lr": 0.0003554841015277638, "time_sec": 66.69313955307007 }, { "epoch": 90, "train_loss": 3.078908212738037, "train_acc": 0.24046, "test_loss": 7.6376062118530275, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.4911817237537404, "grad_max_sv": 0.1551229476928711, "grad_min_sv": 8.927438248373943e-09, "grad_condition": 22037340.73214477, "lr": 0.000345491502812526, "time_sec": 66.69833588600159 }, { "epoch": 91, "train_loss": 3.068959038543701, "train_acc": 0.23882, "test_loss": 8.130451618957519, "test_acc": 0.0246, "lyapunov": null, "grad_norm": 0.4906750851127587, "grad_max_sv": 0.15804662480950354, "grad_min_sv": 8.945024668194357e-09, "grad_condition": 20238836.161220632, "lr": 0.0003355666766307081, "time_sec": 66.82877826690674 }, { "epoch": 92, "train_loss": 3.0708934452819823, "train_acc": 0.23938, "test_loss": 7.4464682083129885, "test_acc": 0.0273, "lyapunov": null, "grad_norm": 0.49334078113347807, "grad_max_sv": 0.16077993027865886, "grad_min_sv": 9.145524822347373e-09, "grad_condition": 187037203.19992697, "lr": 0.00032571397633909225, "time_sec": 66.74011158943176 }, { "epoch": 93, "train_loss": 3.0600284594726563, "train_acc": 0.24034, "test_loss": 7.877293493652344, "test_acc": 0.024, "lyapunov": null, "grad_norm": 0.4935640341843895, "grad_max_sv": 0.1569301776587963, "grad_min_sv": 9.054515949513675e-09, "grad_condition": 27829600.056863032, "lr": 0.00031593772365766094, "time_sec": 66.81489491462708 }, { "epoch": 94, "train_loss": 3.051695512161255, "train_acc": 0.23988, "test_loss": 7.893620376586914, "test_acc": 0.026, "lyapunov": null, "grad_norm": 0.49337091451194337, "grad_max_sv": 0.15855305679142476, "grad_min_sv": 8.944794831905467e-09, "grad_condition": 38859308.23023894, "lr": 0.0003062422067739483, "time_sec": 66.7299313545227 }, { "epoch": 95, "train_loss": 3.0489727338409423, "train_acc": 0.2417, "test_loss": 8.291682899475097, "test_acc": 0.0277, "lyapunov": null, "grad_norm": 0.49538404769918437, "grad_max_sv": 0.1582469828426838, "grad_min_sv": 8.944870299315566e-09, "grad_condition": 46091432.107807726, "lr": 0.00029663167846209965, "time_sec": 66.69549345970154 }, { "epoch": 96, "train_loss": 3.0484196520233153, "train_acc": 0.243, "test_loss": 7.872291290283203, "test_acc": 0.0265, "lyapunov": null, "grad_norm": 0.49220383248292715, "grad_max_sv": 0.15892123989760876, "grad_min_sv": 9.01737370051503e-09, "grad_condition": 21302011.98175659, "lr": 0.00028711035421746345, "time_sec": 66.71452689170837 }, { "epoch": 97, "train_loss": 3.037676093826294, "train_acc": 0.246, "test_loss": 7.654231861877442, "test_acc": 0.0293, "lyapunov": null, "grad_norm": 0.49508860986225445, "grad_max_sv": 0.15910031460225582, "grad_min_sv": 9.107966224752503e-09, "grad_condition": 219510223.0929153, "lr": 0.00027768241040753615, "time_sec": 66.68213939666748 }, { "epoch": 98, "train_loss": 3.0303984658813476, "train_acc": 0.2483, "test_loss": 7.705853749084473, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.4955532184661232, "grad_max_sv": 0.1598552517592907, "grad_min_sv": 9.178445775637201e-09, "grad_condition": 19678066.130865358, "lr": 0.00026835198244006903, "time_sec": 66.72349858283997 }, { "epoch": 99, "train_loss": 3.0224529089355467, "train_acc": 0.24928, "test_loss": 8.284590560913086, "test_acc": 0.0288, "lyapunov": null, "grad_norm": 0.49667728346438245, "grad_max_sv": 0.16261373981833457, "grad_min_sv": 9.261911344468631e-09, "grad_condition": 43957646.17011832, "lr": 0.0002591231629491421, "time_sec": 66.71236634254456 }, { "epoch": 100, "train_loss": 3.026221090545654, "train_acc": 0.24816, "test_loss": 8.147641947174073, "test_acc": 0.0283, "lyapunov": null, "grad_norm": 0.4973181888980844, "grad_max_sv": 0.161344700306654, "grad_min_sv": 9.093790653835754e-09, "grad_condition": 22073209.92013366, "lr": 0.0002499999999999997, "time_sec": 66.67841935157776 }, { "epoch": 101, "train_loss": 3.024826983642578, "train_acc": 0.24746, "test_loss": 8.172234124755859, "test_acc": 0.0299, "lyapunov": null, "grad_norm": 0.4987508334210676, "grad_max_sv": 0.1609908178448677, "grad_min_sv": 9.188273343563313e-09, "grad_condition": 29575100.287913345, "lr": 0.00024098649531343477, "time_sec": 66.66067171096802 }, { "epoch": 102, "train_loss": 3.00824671585083, "train_acc": 0.25088, "test_loss": 8.115251203918458, "test_acc": 0.0287, "lyapunov": null, "grad_norm": 0.49705452560220326, "grad_max_sv": 0.16128522865474224, "grad_min_sv": 9.071875566209197e-09, "grad_condition": 183987800.30718166, "lr": 0.0002320866025105016, "time_sec": 66.69079804420471 }, { "epoch": 103, "train_loss": 3.012382175140381, "train_acc": 0.2474, "test_loss": 7.876342864227295, "test_acc": 0.0358, "lyapunov": null, "grad_norm": 0.49759795132738194, "grad_max_sv": 0.15578284673392773, "grad_min_sv": 9.15119064692771e-09, "grad_condition": 20274304.806162156, "lr": 0.0002233042253783278, "time_sec": 66.68386912345886 }, { "epoch": 104, "train_loss": 2.999149740066528, "train_acc": 0.25194, "test_loss": 8.156604473876953, "test_acc": 0.0334, "lyapunov": null, "grad_norm": 0.4993865662081535, "grad_max_sv": 0.16031337156891823, "grad_min_sv": 9.130539890822575e-09, "grad_condition": 20692502.69173783, "lr": 0.000214643216157784, "time_sec": 66.76614332199097 }, { "epoch": 105, "train_loss": 2.993046808395386, "train_acc": 0.25322, "test_loss": 8.206476106262206, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 0.49628166690763564, "grad_max_sv": 0.1620720062404871, "grad_min_sv": 9.0822705509086e-09, "grad_condition": 31802699.452992357, "lr": 0.00020610737385376332, "time_sec": 66.92790508270264 }, { "epoch": 106, "train_loss": 2.9957507374572754, "train_acc": 0.25204, "test_loss": 8.32369485168457, "test_acc": 0.0313, "lyapunov": null, "grad_norm": 0.499844986274271, "grad_max_sv": 0.15692994557321072, "grad_min_sv": 9.113036909119687e-09, "grad_condition": 37954326.83555563, "lr": 0.00019770044256881242, "time_sec": 66.69280505180359 }, { "epoch": 107, "train_loss": 2.986658691177368, "train_acc": 0.25358, "test_loss": 8.158060417938232, "test_acc": 0.0315, "lyapunov": null, "grad_norm": 0.5001001823423601, "grad_max_sv": 0.16076837331056595, "grad_min_sv": 9.191752022019718e-09, "grad_condition": 24107799.99388643, "lr": 0.0001894261098608447, "time_sec": 66.8065435886383 }, { "epoch": 108, "train_loss": 2.9821577393341063, "train_acc": 0.25654, "test_loss": 8.488254710388183, "test_acc": 0.0271, "lyapunov": null, "grad_norm": 0.502485476242763, "grad_max_sv": 0.1583723586052656, "grad_min_sv": 9.112645133618757e-09, "grad_condition": 75568130.83148949, "lr": 0.000181288005125655, "time_sec": 66.69794940948486 }, { "epoch": 109, "train_loss": 2.9782085455322265, "train_acc": 0.25542, "test_loss": 8.012923631286622, "test_acc": 0.0329, "lyapunov": null, "grad_norm": 0.4984903393296528, "grad_max_sv": 0.15951386988162994, "grad_min_sv": 9.13156463222542e-09, "grad_condition": 19541255.215787858, "lr": 0.0001732896980049473, "time_sec": 66.75459599494934 }, { "epoch": 110, "train_loss": 2.977617024688721, "train_acc": 0.25416, "test_loss": 7.927994426727295, "test_acc": 0.0312, "lyapunov": null, "grad_norm": 0.5009242415138291, "grad_max_sv": 0.15868730172514917, "grad_min_sv": 9.178975504675613e-09, "grad_condition": 20582427.94600161, "lr": 0.00016543469682057076, "time_sec": 66.69332385063171 }, { "epoch": 111, "train_loss": 2.9753467011260986, "train_acc": 0.25596, "test_loss": 8.319595712280274, "test_acc": 0.0307, "lyapunov": null, "grad_norm": 0.5005941372001506, "grad_max_sv": 0.16290293373167514, "grad_min_sv": 9.188780414337571e-09, "grad_condition": 58141904.50898675, "lr": 0.00015772644703565552, "time_sec": 66.67908811569214 }, { "epoch": 112, "train_loss": 2.964190831069946, "train_acc": 0.2586, "test_loss": 8.675558572387695, "test_acc": 0.0264, "lyapunov": null, "grad_norm": 0.49904161219237203, "grad_max_sv": 0.15657965913414956, "grad_min_sv": 9.138289626658274e-09, "grad_condition": 176788840.7312159, "lr": 0.00015016832974331713, "time_sec": 66.7088508605957 }, { "epoch": 113, "train_loss": 2.954090965118408, "train_acc": 0.26176, "test_loss": 8.300330653381348, "test_acc": 0.0295, "lyapunov": null, "grad_norm": 0.49993834308283913, "grad_max_sv": 0.16308558471500872, "grad_min_sv": 9.294466957188163e-09, "grad_condition": 21663432.51767642, "lr": 0.00014276366018359834, "time_sec": 66.69772529602051 }, { "epoch": 114, "train_loss": 2.963344728240967, "train_acc": 0.25764, "test_loss": 8.330418551635741, "test_acc": 0.0289, "lyapunov": null, "grad_norm": 0.5018230989792033, "grad_max_sv": 0.15932467840611936, "grad_min_sv": 9.236983548877032e-09, "grad_condition": 27736134.476570655, "lr": 0.00013551568628929425, "time_sec": 66.70325803756714 }, { "epoch": 115, "train_loss": 2.9565879733276366, "train_acc": 0.25964, "test_loss": 7.8575323272705075, "test_acc": 0.0326, "lyapunov": null, "grad_norm": 0.5008809900364136, "grad_max_sv": 0.1622266974300146, "grad_min_sv": 9.12305047895412e-09, "grad_condition": 30845128.19165374, "lr": 0.00012842758726130276, "time_sec": 66.68990015983582 }, { "epoch": 116, "train_loss": 2.9527316310119627, "train_acc": 0.25978, "test_loss": 8.399875411987304, "test_acc": 0.0331, "lyapunov": null, "grad_norm": 0.501442711033118, "grad_max_sv": 0.15974901132285596, "grad_min_sv": 9.164257287058719e-09, "grad_condition": 38992915.8072435, "lr": 0.0001215024721741218, "time_sec": 66.69366478919983 }, { "epoch": 117, "train_loss": 2.9503427956390382, "train_acc": 0.26032, "test_loss": 7.990305528259277, "test_acc": 0.0321, "lyapunov": null, "grad_norm": 0.503589536410986, "grad_max_sv": 0.16520196348428726, "grad_min_sv": 9.264067410072464e-09, "grad_condition": 83868622.08023986, "lr": 0.00011474337861210538, "time_sec": 66.72409868240356 }, { "epoch": 118, "train_loss": 2.9452951972961428, "train_acc": 0.26186, "test_loss": 8.147903689575195, "test_acc": 0.0314, "lyapunov": null, "grad_norm": 0.5033856715448645, "grad_max_sv": 0.16233305558562278, "grad_min_sv": 9.248901002012478e-09, "grad_condition": 25081711.234670334, "lr": 0.00010815327133708009, "time_sec": 66.7026617527008 }, { "epoch": 119, "train_loss": 2.941498958053589, "train_acc": 0.26368, "test_loss": 8.610751574707031, "test_acc": 0.029, "lyapunov": null, "grad_norm": 0.5024430434883491, "grad_max_sv": 0.1590784341096878, "grad_min_sv": 9.23304959987714e-09, "grad_condition": 20494387.45624064, "lr": 0.00010173504098790182, "time_sec": 66.76532936096191 }, { "epoch": 120, "train_loss": 2.935255004730225, "train_acc": 0.26242, "test_loss": 8.297263900756835, "test_acc": 0.0331, "lyapunov": null, "grad_norm": 0.5040302766957269, "grad_max_sv": 0.163528535887599, "grad_min_sv": 9.301190626032075e-09, "grad_condition": 28694382.488496322, "lr": 9.549150281252629e-05, "time_sec": 66.68135213851929 }, { "epoch": 121, "train_loss": 2.9364529040527345, "train_acc": 0.26432, "test_loss": 8.291862780761718, "test_acc": 0.032, "lyapunov": null, "grad_norm": 0.5046029560998396, "grad_max_sv": 0.15975070968270302, "grad_min_sv": 9.412849380496801e-09, "grad_condition": 19587449.45790067, "lr": 8.942539543314794e-05, "time_sec": 66.67216777801514 }, { "epoch": 122, "train_loss": 2.936676673126221, "train_acc": 0.26518, "test_loss": 8.499242510986328, "test_acc": 0.0304, "lyapunov": null, "grad_norm": 0.5047649009210087, "grad_max_sv": 0.16289451010525227, "grad_min_sv": 9.350050624370998e-09, "grad_condition": 55505776.29325993, "lr": 8.353937964495024e-05, "time_sec": 66.71731305122375 }, { "epoch": 123, "train_loss": 2.928475122909546, "train_acc": 0.26562, "test_loss": 8.177069671630859, "test_acc": 0.0342, "lyapunov": null, "grad_norm": 0.5048999761698001, "grad_max_sv": 0.15904909931123257, "grad_min_sv": 9.226389620364817e-09, "grad_condition": 25050377.05934065, "lr": 7.783603724899243e-05, "time_sec": 66.7349808216095 }, { "epoch": 124, "train_loss": 2.931030046463013, "train_acc": 0.2641, "test_loss": 8.353331985473632, "test_acc": 0.031, "lyapunov": null, "grad_norm": 0.5023168097041694, "grad_max_sv": 0.162389824539423, "grad_min_sv": 9.286878636938223e-09, "grad_condition": 23152814.43828611, "lr": 7.231786991974666e-05, "time_sec": 66.72571802139282 }, { "epoch": 125, "train_loss": 2.9270871754455565, "train_acc": 0.26426, "test_loss": 8.401993353271484, "test_acc": 0.0306, "lyapunov": null, "grad_norm": 0.5049758798636186, "grad_max_sv": 0.16142708584666252, "grad_min_sv": 9.297885433801056e-09, "grad_condition": 19875141.174937833, "lr": 6.698729810778072e-05, "time_sec": 66.69990706443787 }, { "epoch": 126, "train_loss": 2.930443018951416, "train_acc": 0.26334, "test_loss": 8.037101096343994, "test_acc": 0.0338, "lyapunov": null, "grad_norm": 0.5046016651861616, "grad_max_sv": 0.16035589538514614, "grad_min_sv": 9.240497411688865e-09, "grad_condition": 28125977.648946952, "lr": 6.184665997806817e-05, "time_sec": 67.14951395988464 }, { "epoch": 127, "train_loss": 2.920647982254028, "train_acc": 0.26692, "test_loss": 8.046730439758301, "test_acc": 0.0324, "lyapunov": null, "grad_norm": 0.5049604973588052, "grad_max_sv": 0.16098853275179864, "grad_min_sv": 9.3294794306642e-09, "grad_condition": 20407197.848863874, "lr": 5.6898210384392595e-05, "time_sec": 66.7223470211029 }, { "epoch": 128, "train_loss": 2.9174925131988525, "train_acc": 0.2684, "test_loss": 8.320220652770995, "test_acc": 0.0303, "lyapunov": null, "grad_norm": 0.5053571563299065, "grad_max_sv": 0.1587530255317688, "grad_min_sv": 9.217601072697424e-09, "grad_condition": 27425905.55975602, "lr": 5.214411988029363e-05, "time_sec": 66.72726678848267 }, { "epoch": 129, "train_loss": 2.912207716064453, "train_acc": 0.26822, "test_loss": 8.340176411437989, "test_acc": 0.0329, "lyapunov": null, "grad_norm": 0.5070723294876998, "grad_max_sv": 0.16541431248188018, "grad_min_sv": 9.451083940459348e-09, "grad_condition": 20567354.357769065, "lr": 4.7586473766990294e-05, "time_sec": 66.71740126609802 }, { "epoch": 130, "train_loss": 2.9202334938049317, "train_acc": 0.2674, "test_loss": 8.199926257324218, "test_acc": 0.0327, "lyapunov": null, "grad_norm": 0.5048916415346303, "grad_max_sv": 0.15801323913037776, "grad_min_sv": 9.219233110258073e-09, "grad_condition": 19376960.764617294, "lr": 4.32272711786996e-05, "time_sec": 66.70238876342773 }, { "epoch": 131, "train_loss": 2.9117065854644775, "train_acc": 0.27042, "test_loss": 8.4127576171875, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.5046808443683461, "grad_max_sv": 0.15953834764659405, "grad_min_sv": 9.310256252059723e-09, "grad_condition": 21439898.88764466, "lr": 3.906842420574966e-05, "time_sec": 66.70873999595642 }, { "epoch": 132, "train_loss": 2.910150853881836, "train_acc": 0.26928, "test_loss": 8.432557550048829, "test_acc": 0.029, "lyapunov": null, "grad_norm": 0.5068478509780873, "grad_max_sv": 0.1597142592072487, "grad_min_sv": 9.218466880817066e-09, "grad_condition": 51315275.56326776, "lr": 3.5111757055874305e-05, "time_sec": 66.67959189414978 }, { "epoch": 133, "train_loss": 2.913581671066284, "train_acc": 0.26686, "test_loss": 8.2192110748291, "test_acc": 0.0342, "lyapunov": null, "grad_norm": 0.5053193098572983, "grad_max_sv": 0.15978670455515384, "grad_min_sv": 9.38243127635019e-09, "grad_condition": 22892063.67804382, "lr": 3.1359005254054254e-05, "time_sec": 66.68708491325378 }, { "epoch": 134, "train_loss": 2.9081906867980956, "train_acc": 0.26852, "test_loss": 8.766140046691895, "test_acc": 0.0299, "lyapunov": null, "grad_norm": 0.5038449350705952, "grad_max_sv": 0.15981822535395623, "grad_min_sv": 9.258106009601974e-09, "grad_condition": 23090442.640830033, "lr": 2.7811814881259484e-05, "time_sec": 66.70866632461548 }, { "epoch": 135, "train_loss": 2.910741279144287, "train_acc": 0.26908, "test_loss": 8.568949060058594, "test_acc": 0.0305, "lyapunov": null, "grad_norm": 0.5060252593926529, "grad_max_sv": 0.16062484085559844, "grad_min_sv": 9.328420333409859e-09, "grad_condition": 20022211.16398121, "lr": 2.4471741852423218e-05, "time_sec": 66.7052571773529 }, { "epoch": 136, "train_loss": 2.904768952407837, "train_acc": 0.26876, "test_loss": 8.586251429748534, "test_acc": 0.0286, "lyapunov": null, "grad_norm": 0.5057054893343615, "grad_max_sv": 0.16051347628235818, "grad_min_sv": 9.250093449542085e-09, "grad_condition": 19758794.64532106, "lr": 2.1340251233966362e-05, "time_sec": 66.70623755455017 }, { "epoch": 137, "train_loss": 2.899753532714844, "train_acc": 0.2719, "test_loss": 8.500251341247559, "test_acc": 0.0306, "lyapunov": null, "grad_norm": 0.504993553912477, "grad_max_sv": 0.1628888875246048, "grad_min_sv": 9.47467431733351e-09, "grad_condition": 23562830.437205564, "lr": 1.8418716601170932e-05, "time_sec": 66.70105028152466 }, { "epoch": 138, "train_loss": 2.903391772613525, "train_acc": 0.26772, "test_loss": 8.47085325012207, "test_acc": 0.0328, "lyapunov": null, "grad_norm": 0.5045632679546488, "grad_max_sv": 0.158877120167017, "grad_min_sv": 9.315059612546861e-09, "grad_condition": 21175946.281570215, "lr": 1.570841943568445e-05, "time_sec": 66.6920268535614 }, { "epoch": 139, "train_loss": 2.902729499740601, "train_acc": 0.27098, "test_loss": 8.424858071136475, "test_acc": 0.0315, "lyapunov": null, "grad_norm": 0.5057203739338342, "grad_max_sv": 0.16270199753344058, "grad_min_sv": 9.42042569042467e-09, "grad_condition": 3524579699.0758705, "lr": 1.3210548563419845e-05, "time_sec": 66.71372246742249 }, { "epoch": 140, "train_loss": 2.906615010299683, "train_acc": 0.2691, "test_loss": 8.602820767211915, "test_acc": 0.03, "lyapunov": null, "grad_norm": 0.5062145592542612, "grad_max_sv": 0.16128202974796296, "grad_min_sv": 9.31656084814103e-09, "grad_condition": 91607684.02825375, "lr": 1.0926199633097203e-05, "time_sec": 66.70090675354004 }, { "epoch": 141, "train_loss": 2.9058460761260987, "train_acc": 0.26978, "test_loss": 8.383630235290527, "test_acc": 0.0304, "lyapunov": null, "grad_norm": 0.5058119945694454, "grad_max_sv": 0.1625796493142843, "grad_min_sv": 9.312921286919184e-09, "grad_condition": 20916832.67992229, "lr": 8.856374635655688e-06, "time_sec": 66.7032151222229 }, { "epoch": 142, "train_loss": 2.901709259185791, "train_acc": 0.27014, "test_loss": 8.529939315795898, "test_acc": 0.0279, "lyapunov": null, "grad_norm": 0.50529937487535, "grad_max_sv": 0.16269058287143706, "grad_min_sv": 9.338738224395903e-09, "grad_condition": 21214498.9394589, "lr": 7.001981464747503e-06, "time_sec": 66.72001433372498 }, { "epoch": 143, "train_loss": 2.9003410097503664, "train_acc": 0.26956, "test_loss": 8.474568194580078, "test_acc": 0.0308, "lyapunov": null, "grad_norm": 0.5059546395273652, "grad_max_sv": 0.16158490478992463, "grad_min_sv": 9.306980860990244e-09, "grad_condition": 26379170.2127072, "lr": 5.3638335185058295e-06, "time_sec": 66.71419501304626 }, { "epoch": 144, "train_loss": 2.900580298156738, "train_acc": 0.27204, "test_loss": 8.518251318359376, "test_acc": 0.0304, "lyapunov": null, "grad_norm": 0.5064412723494297, "grad_max_sv": 0.16376300603151323, "grad_min_sv": 9.383655452666063e-09, "grad_condition": 20476900.61761298, "lr": 3.942649342761114e-06, "time_sec": 66.69701147079468 }, { "epoch": 145, "train_loss": 2.9021220780181887, "train_acc": 0.27056, "test_loss": 8.362188708496094, "test_acc": 0.0328, "lyapunov": null, "grad_norm": 0.5070330634175128, "grad_max_sv": 0.1640974970534444, "grad_min_sv": 9.447458995670566e-09, "grad_condition": 19525333.626517944, "lr": 2.7390523158633524e-06, "time_sec": 67.06064939498901 }, { "epoch": 146, "train_loss": 2.9056922393035887, "train_acc": 0.26996, "test_loss": 8.198326219177247, "test_acc": 0.0315, "lyapunov": null, "grad_norm": 0.5052726916497198, "grad_max_sv": 0.1608945619314909, "grad_min_sv": 9.247097532832926e-09, "grad_condition": 30881517.504121702, "lr": 1.7535703752478133e-06, "time_sec": 66.83930277824402 }, { "epoch": 147, "train_loss": 2.9056436912536623, "train_acc": 0.27088, "test_loss": 8.528380426025391, "test_acc": 0.029, "lyapunov": null, "grad_norm": 0.506185959212811, "grad_max_sv": 0.1588722374290228, "grad_min_sv": 9.394264763318283e-09, "grad_condition": 20675797.94461853, "lr": 9.866357858642196e-07, "time_sec": 66.72091388702393 }, { "epoch": 148, "train_loss": 2.8992470669555663, "train_acc": 0.27248, "test_loss": 8.531358058166504, "test_acc": 0.0283, "lyapunov": null, "grad_norm": 0.5065504938383886, "grad_max_sv": 0.16413835100829602, "grad_min_sv": 9.337682073222442e-09, "grad_condition": 78330146.63114226, "lr": 4.38584950570808e-07, "time_sec": 66.73046231269836 }, { "epoch": 149, "train_loss": 2.9046918795013426, "train_acc": 0.26942, "test_loss": 8.69618356628418, "test_acc": 0.0302, "lyapunov": null, "grad_norm": 0.5057233580127345, "grad_max_sv": 0.16292193159461021, "grad_min_sv": 9.351353436048982e-09, "grad_condition": 19471249.74441474, "lr": 1.096582625772501e-07, "time_sec": 66.730135679245 }, { "epoch": 150, "train_loss": 2.904742412261963, "train_acc": 0.2691, "test_loss": 8.56440517730713, "test_acc": 0.0303, "lyapunov": null, "grad_norm": 0.506527150487024, "grad_max_sv": 0.16403611674904822, "grad_min_sv": 9.31519477109788e-09, "grad_condition": 20813101.77306552, "lr": 0.0, "time_sec": 66.77998113632202 } ] }, "lyapunov": { "4": [ { "epoch": 1, "train_loss": 4.385416869049072, "train_acc": 0.09238, "test_loss": 3.76526393661499, "test_acc": 0.1561, "lyapunov": 2.248025039882611, "grad_norm": 6.278186010639677, "grad_max_sv": 4.849219900369644, "grad_min_sv": 1.1319616959326595e-07, "grad_condition": 56141122.1011496, "lr": 0.0009998903417374227, "time_sec": 41.7864191532135 }, { "epoch": 2, "train_loss": 3.6485818179321288, "train_acc": 0.16322, "test_loss": 3.3687725090026857, "test_acc": 0.2122, "lyapunov": 2.118248250783252, "grad_norm": 4.443263102278264, "grad_max_sv": 3.2507266819477083, "grad_min_sv": 8.233919142064395e-08, "grad_condition": 322584578.8706892, "lr": 0.0009995614150494292, "time_sec": 41.66770076751709 }, { "epoch": 3, "train_loss": 3.328380308380127, "train_acc": 0.20764, "test_loss": 3.374305525970459, "test_acc": 0.2055, "lyapunov": 1.9997802164853382, "grad_norm": 3.3578148542704875, "grad_max_sv": 2.267174106836319, "grad_min_sv": 6.252581136179103e-08, "grad_condition": 45047259.18741469, "lr": 0.0009990133642141358, "time_sec": 41.67004632949829 }, { "epoch": 4, "train_loss": 3.2626986949920656, "train_acc": 0.2146, "test_loss": 4.6115389114379886, "test_acc": 0.0743, "lyapunov": 1.77669187945783, "grad_norm": 2.671171954416308, "grad_max_sv": 1.6475970447063446, "grad_min_sv": 4.904231385438607e-08, "grad_condition": 37237118.01849495, "lr": 0.0009982464296247522, "time_sec": 41.662524461746216 }, { "epoch": 5, "train_loss": 3.2418214219665527, "train_acc": 0.21486, "test_loss": 6.85950913848877, "test_acc": 0.0383, "lyapunov": 1.577696952063714, "grad_norm": 2.24297056171998, "grad_max_sv": 1.3573209017515182, "grad_min_sv": 4.2056884189123346e-08, "grad_condition": 57071857.62248597, "lr": 0.0009972609476841367, "time_sec": 41.65110445022583 }, { "epoch": 6, "train_loss": 3.1473428995513917, "train_acc": 0.2334, "test_loss": 8.817106538391114, "test_acc": 0.0334, "lyapunov": 1.522594060739288, "grad_norm": 2.0255024337601077, "grad_max_sv": 1.1387103602290154, "grad_min_sv": 3.8490053089201837e-08, "grad_condition": 35218561.7694581, "lr": 0.000996057350657239, "time_sec": 41.70460891723633 }, { "epoch": 7, "train_loss": 3.0554499784851075, "train_acc": 0.25108, "test_loss": 10.19464548034668, "test_acc": 0.0214, "lyapunov": 1.498324869538817, "grad_norm": 1.8452595544017367, "grad_max_sv": 0.9877568006515502, "grad_min_sv": 3.479785576354644e-08, "grad_condition": 35325972.864356965, "lr": 0.000994636166481494, "time_sec": 41.68277025222778 }, { "epoch": 8, "train_loss": 2.9779827911376953, "train_acc": 0.26282, "test_loss": 11.777064636230469, "test_acc": 0.0217, "lyapunov": 1.4917038487046577, "grad_norm": 1.7112589099882383, "grad_max_sv": 0.9115550458431244, "grad_min_sv": 3.2246774489541605e-08, "grad_condition": 35535466.61101306, "lr": 0.0009929980185352525, "time_sec": 41.73534274101257 }, { "epoch": 9, "train_loss": 2.9365650801086427, "train_acc": 0.27382, "test_loss": 11.0659416595459, "test_acc": 0.0285, "lyapunov": 1.4870752608379745, "grad_norm": 1.6385351402723778, "grad_max_sv": 0.8621709123253822, "grad_min_sv": 3.1201993953844376e-08, "grad_condition": 65261212.14923034, "lr": 0.0009911436253643444, "time_sec": 41.677772760391235 }, { "epoch": 10, "train_loss": 2.8763271882629393, "train_acc": 0.28468, "test_loss": 12.026495361328125, "test_acc": 0.0238, "lyapunov": 1.483278246486888, "grad_norm": 1.529513425384814, "grad_max_sv": 0.7616375535726547, "grad_min_sv": 2.9233747178558646e-08, "grad_condition": 32138717.187251367, "lr": 0.0009890738003669028, "time_sec": 41.68400001525879 }, { "epoch": 11, "train_loss": 2.8316531258392335, "train_acc": 0.29512, "test_loss": 13.11057151184082, "test_acc": 0.0192, "lyapunov": 1.490352714153202, "grad_norm": 1.4498581032880438, "grad_max_sv": 0.7242703467607499, "grad_min_sv": 2.7478494810107e-08, "grad_condition": 41454194.81325731, "lr": 0.00098678945143658, "time_sec": 41.70621085166931 }, { "epoch": 12, "train_loss": 2.799339100418091, "train_acc": 0.29892, "test_loss": 7.575371592712402, "test_acc": 0.0262, "lyapunov": 1.4981255997782168, "grad_norm": 1.363013693713406, "grad_max_sv": 0.6757008329033851, "grad_min_sv": 2.5993861326942257e-08, "grad_condition": 160871874.0058652, "lr": 0.0009842915805643154, "time_sec": 41.677626609802246 }, { "epoch": 13, "train_loss": 2.7616972874450685, "train_acc": 0.30544, "test_loss": 10.457825009155274, "test_acc": 0.0149, "lyapunov": 1.5049866004977994, "grad_norm": 1.3009395680954525, "grad_max_sv": 0.6281382858753204, "grad_min_sv": 2.4570545004154454e-08, "grad_condition": 36433287.73809738, "lr": 0.000981581283398829, "time_sec": 41.678059816360474 }, { "epoch": 14, "train_loss": 2.7419771829223634, "train_acc": 0.31176, "test_loss": 6.96602774734497, "test_acc": 0.0273, "lyapunov": 1.5126411487989109, "grad_norm": 1.2428065154077472, "grad_max_sv": 0.6042070008814335, "grad_min_sv": 2.367223045363076e-08, "grad_condition": 28155768.001448244, "lr": 0.0009786597487660333, "time_sec": 41.6808295249939 }, { "epoch": 15, "train_loss": 2.6940654248809817, "train_acc": 0.32072, "test_loss": 8.578126625061035, "test_acc": 0.0227, "lyapunov": 1.5099453883402794, "grad_norm": 1.2169506496641136, "grad_max_sv": 0.5779954038560391, "grad_min_sv": 2.2935282436783998e-08, "grad_condition": 268648302.11607826, "lr": 0.0009755282581475766, "time_sec": 41.68640756607056 }, { "epoch": 16, "train_loss": 2.6707639625549318, "train_acc": 0.32688, "test_loss": 8.14136336288452, "test_acc": 0.018, "lyapunov": 1.5205869574071196, "grad_norm": 1.180524231835774, "grad_max_sv": 0.5504504255950451, "grad_min_sv": 2.2226173457262632e-08, "grad_condition": 33744566.308580026, "lr": 0.0009721881851187403, "time_sec": 41.68173384666443 }, { "epoch": 17, "train_loss": 2.6515627406311033, "train_acc": 0.32992, "test_loss": 8.464934133911132, "test_acc": 0.017, "lyapunov": 1.5374923237144489, "grad_norm": 1.140051503610018, "grad_max_sv": 0.5274666294455528, "grad_min_sv": 2.1756941515072015e-08, "grad_condition": 34749184.683609106, "lr": 0.0009686409947459456, "time_sec": 41.707985401153564 }, { "epoch": 18, "train_loss": 2.6277094244384767, "train_acc": 0.33546, "test_loss": 8.285575199890136, "test_acc": 0.0127, "lyapunov": 1.5355821253393618, "grad_norm": 1.117208726103555, "grad_max_sv": 0.5191602148115635, "grad_min_sv": 2.1151740331459834e-08, "grad_condition": 39519340.90094157, "lr": 0.0009648882429441254, "time_sec": 41.662739515304565 }, { "epoch": 19, "train_loss": 2.607321646118164, "train_acc": 0.34158, "test_loss": 8.017330313110351, "test_acc": 0.0171, "lyapunov": 1.552301183076161, "grad_norm": 1.0897405882008309, "grad_max_sv": 0.5023482128977775, "grad_min_sv": 2.064225344128312e-08, "grad_condition": 48287017.10977797, "lr": 0.00096093157579425, "time_sec": 41.693289041519165 }, { "epoch": 20, "train_loss": 2.5911361766052248, "train_acc": 0.34448, "test_loss": 6.698405216979981, "test_acc": 0.0142, "lyapunov": 1.5602374622583999, "grad_norm": 1.065027082262344, "grad_max_sv": 0.4803482659161091, "grad_min_sv": 2.0105638209866328e-08, "grad_condition": 53496143.92804453, "lr": 0.0009567727288213001, "time_sec": 41.69337177276611 }, { "epoch": 21, "train_loss": 2.581589804840088, "train_acc": 0.34626, "test_loss": 6.832892972564697, "test_acc": 0.01, "lyapunov": 1.5771442057226626, "grad_norm": 1.0439470300070743, "grad_max_sv": 0.4716391734778881, "grad_min_sv": 1.994593953336121e-08, "grad_condition": 29150078.74753332, "lr": 0.0009524135262330095, "time_sec": 41.680705308914185 }, { "epoch": 22, "train_loss": 2.5651588928222657, "train_acc": 0.34914, "test_loss": 9.158645959472656, "test_acc": 0.01, "lyapunov": 1.58292500716646, "grad_norm": 1.02635920685996, "grad_max_sv": 0.45573277324438094, "grad_min_sv": 1.9168616865322673e-08, "grad_condition": 70923838.75523397, "lr": 0.0009478558801197061, "time_sec": 41.669551849365234 }, { "epoch": 23, "train_loss": 2.5523301736450197, "train_acc": 0.3523, "test_loss": 8.809644000244141, "test_acc": 0.01, "lyapunov": 1.5998260813295995, "grad_norm": 1.0017883748688885, "grad_max_sv": 0.44832063987851145, "grad_min_sv": 1.9039649867824692e-08, "grad_condition": 27413330.740021694, "lr": 0.000943101789615607, "time_sec": 41.67731857299805 }, { "epoch": 24, "train_loss": 2.540596002731323, "train_acc": 0.35496, "test_loss": 9.603093579101563, "test_acc": 0.01, "lyapunov": 1.608014219557233, "grad_norm": 0.9892621492137654, "grad_max_sv": 0.4301694191992283, "grad_min_sv": 1.8367088082393846e-08, "grad_condition": 81196052.16569169, "lr": 0.0009381533400219313, "time_sec": 41.676315784454346 }, { "epoch": 25, "train_loss": 2.5427046757507323, "train_acc": 0.35626, "test_loss": 6.377327036285401, "test_acc": 0.0121, "lyapunov": 1.617281358870094, "grad_norm": 0.9690834006908926, "grad_max_sv": 0.4215060040354729, "grad_min_sv": 1.847692875367457e-08, "grad_condition": 26969157.744863987, "lr": 0.0009330127018922189, "time_sec": 41.6710147857666 }, { "epoch": 26, "train_loss": 2.5659257014465333, "train_acc": 0.35094, "test_loss": 7.642009206390381, "test_acc": 0.01, "lyapunov": 1.6466610379841016, "grad_norm": 0.9589858174241993, "grad_max_sv": 0.4141293965280056, "grad_min_sv": 1.7795701028403e-08, "grad_condition": 100155427.75409335, "lr": 0.000927682130080253, "time_sec": 41.67351698875427 }, { "epoch": 27, "train_loss": 2.5872419680023193, "train_acc": 0.3491, "test_loss": 6.126792880249023, "test_acc": 0.01, "lyapunov": 1.655874063596701, "grad_norm": 0.9488520314828451, "grad_max_sv": 0.4167667210102081, "grad_min_sv": 1.7755209749670265e-08, "grad_condition": 36482939.06456544, "lr": 0.0009221639627510072, "time_sec": 41.6674382686615 }, { "epoch": 28, "train_loss": 2.6444351440429688, "train_acc": 0.33624, "test_loss": 6.9149939208984375, "test_acc": 0.0101, "lyapunov": 1.642535175203972, "grad_norm": 0.9303399228093118, "grad_max_sv": 0.39700465872883794, "grad_min_sv": 1.7362861481906577e-08, "grad_condition": 35927282.240080185, "lr": 0.0009164606203550494, "time_sec": 41.694759130477905 }, { "epoch": 29, "train_loss": 2.5599649453735354, "train_acc": 0.35268, "test_loss": 7.456900106048584, "test_acc": 0.0106, "lyapunov": 1.640105134690814, "grad_norm": 0.9138541555575717, "grad_max_sv": 0.40499070957303046, "grad_min_sv": 1.741128121124369e-08, "grad_condition": 28008235.387952596, "lr": 0.0009105746045668516, "time_sec": 41.669721841812134 }, { "epoch": 30, "train_loss": 2.587169426727295, "train_acc": 0.34752, "test_loss": 7.112287390899658, "test_acc": 0.0119, "lyapunov": 1.679136826254218, "grad_norm": 0.9055855274318034, "grad_max_sv": 0.38519148603081704, "grad_min_sv": 1.6915865576859478e-08, "grad_condition": 154040606.17291743, "lr": 0.0009045084971874733, "time_sec": 41.68705892562866 }, { "epoch": 31, "train_loss": 2.5624461259460447, "train_acc": 0.35596, "test_loss": 7.3813514785766605, "test_acc": 0.0124, "lyapunov": 1.6608827205570154, "grad_norm": 0.887369695582494, "grad_max_sv": 0.37692187577486036, "grad_min_sv": 1.6459350740682942e-08, "grad_condition": 31475690.866420962, "lr": 0.0008982649590120977, "time_sec": 41.673012495040894 }, { "epoch": 32, "train_loss": 2.551432417373657, "train_acc": 0.35684, "test_loss": 6.42604938659668, "test_acc": 0.0121, "lyapunov": 1.6469347565375325, "grad_norm": 0.8746022274317357, "grad_max_sv": 0.3701463647186756, "grad_min_sv": 1.6476226111922233e-08, "grad_condition": 52317458.10447326, "lr": 0.0008918467286629196, "time_sec": 41.66220784187317 }, { "epoch": 33, "train_loss": 2.5348674264526365, "train_acc": 0.35962, "test_loss": 5.573617294311523, "test_acc": 0.0241, "lyapunov": 1.6317134284607284, "grad_norm": 0.8557656352746138, "grad_max_sv": 0.3519837222993374, "grad_min_sv": 1.6144081904645446e-08, "grad_condition": 26756099.798511714, "lr": 0.0008852566213878943, "time_sec": 41.66625261306763 }, { "epoch": 34, "train_loss": 2.5518150065612795, "train_acc": 0.3554, "test_loss": 7.073295845794678, "test_acc": 0.0148, "lyapunov": 1.649389718804518, "grad_norm": 0.8523798964772112, "grad_max_sv": 0.35057583153247834, "grad_min_sv": 1.5881563142361442e-08, "grad_condition": 28695640.9756914, "lr": 0.000878497527825878, "time_sec": 41.682754039764404 }, { "epoch": 35, "train_loss": 2.4595030923461914, "train_acc": 0.37624, "test_loss": 6.594732564544678, "test_acc": 0.0135, "lyapunov": 1.6497014946949757, "grad_norm": 0.8413194934076474, "grad_max_sv": 0.3433509707450867, "grad_min_sv": 1.5582725373941564e-08, "grad_condition": 32812761.595985997, "lr": 0.000871572412738697, "time_sec": 41.66791009902954 }, { "epoch": 36, "train_loss": 2.4551396466827393, "train_acc": 0.37628, "test_loss": 8.253561260986329, "test_acc": 0.0118, "lyapunov": 1.641755030892999, "grad_norm": 0.843485970719339, "grad_max_sv": 0.35417381674051285, "grad_min_sv": 1.5807648856558387e-08, "grad_condition": 26531326.086508345, "lr": 0.0008644843137107055, "time_sec": 41.667187213897705 }, { "epoch": 37, "train_loss": 2.4310810439300536, "train_acc": 0.37952, "test_loss": 6.83057543182373, "test_acc": 0.0102, "lyapunov": 1.6440746006758318, "grad_norm": 0.835329787885881, "grad_max_sv": 0.34257676601409914, "grad_min_sv": 1.570942509132589e-08, "grad_condition": 39002769.53085541, "lr": 0.0008572363398164014, "time_sec": 41.83383345603943 }, { "epoch": 38, "train_loss": 2.3961087857055663, "train_acc": 0.38468, "test_loss": 8.535474667358399, "test_acc": 0.0125, "lyapunov": 1.6436351958443136, "grad_norm": 0.8290693986791846, "grad_max_sv": 0.3357673093676567, "grad_min_sv": 1.5592837618316757e-08, "grad_condition": 29777273.236415513, "lr": 0.0008498316702566826, "time_sec": 41.67509579658508 }, { "epoch": 39, "train_loss": 2.418079302215576, "train_acc": 0.38104, "test_loss": 8.728886996459961, "test_acc": 0.0138, "lyapunov": 1.6392356294500248, "grad_norm": 0.8215527161857048, "grad_max_sv": 0.33165409713983535, "grad_min_sv": 1.5307788804423682e-08, "grad_condition": 151642365.19854102, "lr": 0.0008422735529643442, "time_sec": 41.690041065216064 }, { "epoch": 40, "train_loss": 2.385871609649658, "train_acc": 0.38864, "test_loss": 7.529428874206543, "test_acc": 0.0132, "lyapunov": 1.6354777038554706, "grad_norm": 0.8200733881789374, "grad_max_sv": 0.3330301932990551, "grad_min_sv": 1.5384999157985745e-08, "grad_condition": 37189354.004172444, "lr": 0.0008345653031794289, "time_sec": 41.66628098487854 }, { "epoch": 41, "train_loss": 2.3330577777862547, "train_acc": 0.40102, "test_loss": 7.123234498596191, "test_acc": 0.0249, "lyapunov": 1.6323570756961012, "grad_norm": 0.8204860309316497, "grad_max_sv": 0.3341449283063412, "grad_min_sv": 1.5524073795208925e-08, "grad_condition": 51332515.62539954, "lr": 0.0008267103019950526, "time_sec": 41.658520460128784 }, { "epoch": 42, "train_loss": 2.3339556999969484, "train_acc": 0.39776, "test_loss": 7.333181537628174, "test_acc": 0.0185, "lyapunov": 1.6354230733783655, "grad_norm": 0.8120092023544444, "grad_max_sv": 0.32391806691884995, "grad_min_sv": 1.5330058230483833e-08, "grad_condition": 63172058.450652756, "lr": 0.0008187119948743447, "time_sec": 41.67036032676697 }, { "epoch": 43, "train_loss": 2.3197922330474854, "train_acc": 0.40358, "test_loss": 6.427054233551026, "test_acc": 0.0136, "lyapunov": 1.6421251245166943, "grad_norm": 0.8092554387074351, "grad_max_sv": 0.330906642973423, "grad_min_sv": 1.526612713464992e-08, "grad_condition": 26225823.13057729, "lr": 0.000810573890139155, "time_sec": 41.665225982666016 }, { "epoch": 44, "train_loss": 2.3195025100708007, "train_acc": 0.4033, "test_loss": 7.0808923698425295, "test_acc": 0.0118, "lyapunov": 1.656124430239353, "grad_norm": 0.8044803007377996, "grad_max_sv": 0.31877501383423806, "grad_min_sv": 1.485775653065069e-08, "grad_condition": 62435666.9732676, "lr": 0.0008022995574311873, "time_sec": 41.6713650226593 }, { "epoch": 45, "train_loss": 2.2802742100524904, "train_acc": 0.41386, "test_loss": 6.140260126495361, "test_acc": 0.0112, "lyapunov": 1.640040697649007, "grad_norm": 0.8004818224905164, "grad_max_sv": 0.31864383071660995, "grad_min_sv": 1.4937468863218672e-08, "grad_condition": 92954234.04941478, "lr": 0.0007938926261462363, "time_sec": 41.66809844970703 }, { "epoch": 46, "train_loss": 2.262954523010254, "train_acc": 0.414, "test_loss": 7.2938560546875, "test_acc": 0.0101, "lyapunov": 1.637706352316815, "grad_norm": 0.793081854121529, "grad_max_sv": 0.31840832754969595, "grad_min_sv": 1.496939308343048e-08, "grad_condition": 25865099.124858934, "lr": 0.0007853567838422158, "time_sec": 41.66623878479004 }, { "epoch": 47, "train_loss": 2.267263908538818, "train_acc": 0.41344, "test_loss": 6.906099589538575, "test_acc": 0.012, "lyapunov": 1.6311360786637992, "grad_norm": 0.797780329526112, "grad_max_sv": 0.31469214931130407, "grad_min_sv": 1.4971078365899616e-08, "grad_condition": 25611249.79088702, "lr": 0.0007766957746216719, "time_sec": 41.708776235580444 }, { "epoch": 48, "train_loss": 2.2475574452209472, "train_acc": 0.41852, "test_loss": 8.073319694519043, "test_acc": 0.0096, "lyapunov": 1.6334223103950092, "grad_norm": 0.7869763323374519, "grad_max_sv": 0.31651476472616197, "grad_min_sv": 1.4959556110527573e-08, "grad_condition": 24572781.086960234, "lr": 0.0007679133974894982, "time_sec": 41.682409048080444 }, { "epoch": 49, "train_loss": 2.2258160152435305, "train_acc": 0.42326, "test_loss": 7.22346753692627, "test_acc": 0.01, "lyapunov": 1.6582896377119567, "grad_norm": 0.7915396840627938, "grad_max_sv": 0.31868951208889484, "grad_min_sv": 1.4694817633553736e-08, "grad_condition": 37064015.276476786, "lr": 0.000759013504686565, "time_sec": 41.66550970077515 }, { "epoch": 50, "train_loss": 2.191147954711914, "train_acc": 0.43136, "test_loss": 7.067440712738037, "test_acc": 0.0113, "lyapunov": 1.6353955543254648, "grad_norm": 0.7852910579053439, "grad_max_sv": 0.3114649154245853, "grad_min_sv": 1.4506057238912461e-08, "grad_condition": 117782435.52166636, "lr": 0.0007499999999999998, "time_sec": 41.676011085510254 }, { "epoch": 51, "train_loss": 2.1769231742095947, "train_acc": 0.43202, "test_loss": 8.091367781066895, "test_acc": 0.0106, "lyapunov": 1.6262942616591978, "grad_norm": 0.7849301566787954, "grad_max_sv": 0.31383112370967864, "grad_min_sv": 1.482414189180048e-08, "grad_condition": 24814087.204268403, "lr": 0.0007408768370508575, "time_sec": 41.71332907676697 }, { "epoch": 52, "train_loss": 2.1791525329589843, "train_acc": 0.43434, "test_loss": 6.640031047058105, "test_acc": 0.0101, "lyapunov": 1.6475636553581414, "grad_norm": 0.7748205713957207, "grad_max_sv": 0.3011137217283249, "grad_min_sv": 1.4537112300733179e-08, "grad_condition": 122190974.86962557, "lr": 0.0007316480175599307, "time_sec": 41.6874144077301 }, { "epoch": 53, "train_loss": 2.177708456039429, "train_acc": 0.43164, "test_loss": 6.330417361450196, "test_acc": 0.0124, "lyapunov": 1.6483547099106146, "grad_norm": 0.7832189933674929, "grad_max_sv": 0.3086284928023815, "grad_min_sv": 1.4681565554952592e-08, "grad_condition": 39128451.13660244, "lr": 0.0007223175895924635, "time_sec": 41.67819046974182 }, { "epoch": 54, "train_loss": 2.155647780075073, "train_acc": 0.43836, "test_loss": 6.180060083007812, "test_acc": 0.0168, "lyapunov": 1.6432840284484123, "grad_norm": 0.7691412493425369, "grad_max_sv": 0.29928392022848127, "grad_min_sv": 1.4252177091278462e-08, "grad_condition": 33900536.02069519, "lr": 0.0007128896457825361, "time_sec": 41.750109910964966 }, { "epoch": 55, "train_loss": 2.1353805670928954, "train_acc": 0.44186, "test_loss": 7.257317136383056, "test_acc": 0.0132, "lyapunov": 1.6428052202210097, "grad_norm": 0.7679438794422704, "grad_max_sv": 0.30230089724063874, "grad_min_sv": 1.4329349766473153e-08, "grad_condition": 34802929.64081846, "lr": 0.0007033683215378998, "time_sec": 41.669835805892944 }, { "epoch": 56, "train_loss": 2.128101917114258, "train_acc": 0.44428, "test_loss": 7.373139286804199, "test_acc": 0.0137, "lyapunov": 1.6414129276714666, "grad_norm": 0.7718923152736775, "grad_max_sv": 0.2989685770124197, "grad_min_sv": 1.451244842631816e-08, "grad_condition": 26370279.022705477, "lr": 0.0006937577932260512, "time_sec": 41.67406344413757 }, { "epoch": 57, "train_loss": 2.137920976486206, "train_acc": 0.44384, "test_loss": 5.424753893280029, "test_acc": 0.0111, "lyapunov": 1.6554484230173214, "grad_norm": 0.773511600768633, "grad_max_sv": 0.294682040810585, "grad_min_sv": 1.4318467259077927e-08, "grad_condition": 26244116.009311978, "lr": 0.0006840622763423388, "time_sec": 41.68566060066223 }, { "epoch": 58, "train_loss": 2.1886442722320556, "train_acc": 0.43186, "test_loss": 6.545238864135742, "test_acc": 0.0159, "lyapunov": 1.6389995575560938, "grad_norm": 0.770667566152431, "grad_max_sv": 0.2981013923883438, "grad_min_sv": 1.4503179252695065e-08, "grad_condition": 46106578.838229105, "lr": 0.0006742860236609073, "time_sec": 41.69116020202637 }, { "epoch": 59, "train_loss": 2.1066105070495604, "train_acc": 0.44986, "test_loss": 7.391026984405517, "test_acc": 0.0181, "lyapunov": 1.6416400030750753, "grad_norm": 0.7602483384951753, "grad_max_sv": 0.2911146242171526, "grad_min_sv": 1.4345006460816933e-08, "grad_condition": 63690343.21158177, "lr": 0.0006644333233692913, "time_sec": 41.654924392700195 }, { "epoch": 60, "train_loss": 2.0506089850234988, "train_acc": 0.46106, "test_loss": 8.025833796691895, "test_acc": 0.0159, "lyapunov": 1.621927274157629, "grad_norm": 0.7629731967669975, "grad_max_sv": 0.2949394479393959, "grad_min_sv": 1.4372729567613262e-08, "grad_condition": 30309204.558091305, "lr": 0.0006545084971874734, "time_sec": 41.66482877731323 }, { "epoch": 61, "train_loss": 2.038806278114319, "train_acc": 0.46484, "test_loss": 9.74862598876953, "test_acc": 0.01, "lyapunov": 1.6300551010214763, "grad_norm": 0.7587096227595913, "grad_max_sv": 0.29696495905518533, "grad_min_sv": 1.4256705770446243e-08, "grad_condition": 99834698.98389995, "lr": 0.0006445158984722354, "time_sec": 41.67584776878357 }, { "epoch": 62, "train_loss": 2.065830835571289, "train_acc": 0.45776, "test_loss": 8.374367053222656, "test_acc": 0.0106, "lyapunov": 1.6421477361713224, "grad_norm": 0.7635630118818492, "grad_max_sv": 0.29152632839977743, "grad_min_sv": 1.4168918681389808e-08, "grad_condition": 49794193.0235935, "lr": 0.0006344599103076324, "time_sec": 41.70599865913391 }, { "epoch": 63, "train_loss": 2.06199690322876, "train_acc": 0.45774, "test_loss": 9.43989691772461, "test_acc": 0.0143, "lyapunov": 1.6391434187779341, "grad_norm": 0.7626912434978755, "grad_max_sv": 0.3007299728691578, "grad_min_sv": 1.421240057031259e-08, "grad_condition": 29364542.182565797, "lr": 0.0006243449435824269, "time_sec": 41.69278836250305 }, { "epoch": 64, "train_loss": 2.0462368117523195, "train_acc": 0.46278, "test_loss": 7.563213960266113, "test_acc": 0.01, "lyapunov": 1.6542154858484293, "grad_norm": 0.7636972310186092, "grad_max_sv": 0.2974775414913893, "grad_min_sv": 1.4351465202344648e-08, "grad_condition": 27137193.96425879, "lr": 0.0006141754350553275, "time_sec": 41.68390464782715 }, { "epoch": 65, "train_loss": 2.0235327534866334, "train_acc": 0.46756, "test_loss": 6.978350220489502, "test_acc": 0.0098, "lyapunov": 1.6490768569204814, "grad_norm": 0.7584239144021073, "grad_max_sv": 0.29015346951782706, "grad_min_sv": 1.4414379233967933e-08, "grad_condition": 56409329.68513076, "lr": 0.0006039558454088793, "time_sec": 41.70132231712341 }, { "epoch": 66, "train_loss": 2.0327218698120118, "train_acc": 0.46344, "test_loss": 6.808298188781738, "test_acc": 0.016, "lyapunov": 1.6421981882256316, "grad_norm": 0.7632841139098454, "grad_max_sv": 0.2945323955267668, "grad_min_sv": 1.4372620408403813e-08, "grad_condition": 79999394.91706361, "lr": 0.000593690657292862, "time_sec": 41.77633190155029 }, { "epoch": 67, "train_loss": 1.9898056484222413, "train_acc": 0.47598, "test_loss": 7.061488777160645, "test_acc": 0.0109, "lyapunov": 1.647677140467612, "grad_norm": 0.7591590906188236, "grad_max_sv": 0.296347975358367, "grad_min_sv": 1.415571162510787e-08, "grad_condition": 25155146.125877418, "lr": 0.0005833843733580507, "time_sec": 41.705756425857544 }, { "epoch": 68, "train_loss": 2.0102797174835203, "train_acc": 0.47046, "test_loss": 7.231464897918701, "test_acc": 0.01, "lyapunov": 1.6583749330257211, "grad_norm": 0.754101966257317, "grad_max_sv": 0.28500255234539507, "grad_min_sv": 1.3903248727298312e-08, "grad_condition": 29630876.42759655, "lr": 0.0005730415142812054, "time_sec": 41.72124171257019 }, { "epoch": 69, "train_loss": 2.04611669380188, "train_acc": 0.46162, "test_loss": 5.946302236938476, "test_acc": 0.0107, "lyapunov": 1.6569105533077895, "grad_norm": 0.7572448125574305, "grad_max_sv": 0.2827830083668232, "grad_min_sv": 1.4111277255729471e-08, "grad_condition": 53632120.18934096, "lr": 0.0005626666167821517, "time_sec": 41.66360831260681 }, { "epoch": 70, "train_loss": 1.9799313236999512, "train_acc": 0.47786, "test_loss": 5.791928797912598, "test_acc": 0.0139, "lyapunov": 1.659774536976729, "grad_norm": 0.743881925858891, "grad_max_sv": 0.2895107101649046, "grad_min_sv": 1.3961023534458939e-08, "grad_condition": 29278721.035794042, "lr": 0.0005522642316338265, "time_sec": 41.70555853843689 }, { "epoch": 71, "train_loss": 1.9502769188308715, "train_acc": 0.48312, "test_loss": 5.28058690032959, "test_acc": 0.0122, "lyapunov": 1.6549167751961047, "grad_norm": 0.7494747344108936, "grad_max_sv": 0.2851333416998386, "grad_min_sv": 1.4076917760575888e-08, "grad_condition": 331119741.39895195, "lr": 0.0005418389216661573, "time_sec": 41.68225932121277 }, { "epoch": 72, "train_loss": 1.9479334468841554, "train_acc": 0.48628, "test_loss": 7.984691355895996, "test_acc": 0.0103, "lyapunov": 1.653415890300975, "grad_norm": 0.7477937354985393, "grad_max_sv": 0.28984881937503815, "grad_min_sv": 1.4043280075794196e-08, "grad_condition": 119153928.06545302, "lr": 0.0005313952597646563, "time_sec": 41.65925407409668 }, { "epoch": 73, "train_loss": 1.967646238708496, "train_acc": 0.47644, "test_loss": 6.1665235633850095, "test_acc": 0.0142, "lyapunov": 1.65852049915382, "grad_norm": 0.7579543653963434, "grad_max_sv": 0.2979495331645012, "grad_min_sv": 1.4386894665874283e-08, "grad_condition": 39194921.11896709, "lr": 0.0005209378268645994, "time_sec": 41.68930411338806 }, { "epoch": 74, "train_loss": 1.9287460524368285, "train_acc": 0.49016, "test_loss": 6.917835614776611, "test_acc": 0.011, "lyapunov": 1.6452750241969858, "grad_norm": 0.7457505107152974, "grad_max_sv": 0.2847950000315905, "grad_min_sv": 1.4118661037509916e-08, "grad_condition": 24938980.26155622, "lr": 0.0005104712099416781, "time_sec": 41.67027688026428 }, { "epoch": 75, "train_loss": 1.9238459339141847, "train_acc": 0.48922, "test_loss": 7.703335245513916, "test_acc": 0.0102, "lyapunov": 1.636191079683621, "grad_norm": 0.7456866026716246, "grad_max_sv": 0.28741468451917174, "grad_min_sv": 1.3977797050368501e-08, "grad_condition": 33299832.87362317, "lr": 0.0004999999999999996, "time_sec": 41.668753147125244 }, { "epoch": 76, "train_loss": 1.9011995269012452, "train_acc": 0.49452, "test_loss": 6.336113402557373, "test_acc": 0.0109, "lyapunov": 1.6527920217465257, "grad_norm": 0.7472940737131395, "grad_max_sv": 0.28794192261993884, "grad_min_sv": 1.3842809193365114e-08, "grad_condition": 26648537.366496623, "lr": 0.0004895287900583212, "time_sec": 41.664530515670776 }, { "epoch": 77, "train_loss": 1.9055398291778565, "train_acc": 0.49198, "test_loss": 5.844799766540527, "test_acc": 0.011, "lyapunov": 1.652166176025215, "grad_norm": 0.7477207101099883, "grad_max_sv": 0.29006113260984423, "grad_min_sv": 1.4085541283348491e-08, "grad_condition": 24059920.597129285, "lr": 0.0004790621731353997, "time_sec": 41.67645764350891 }, { "epoch": 78, "train_loss": 1.8853045474624635, "train_acc": 0.49528, "test_loss": 5.736059879302979, "test_acc": 0.0109, "lyapunov": 1.6538786385065454, "grad_norm": 0.7430364105793885, "grad_max_sv": 0.2820361901074648, "grad_min_sv": 1.3740982796224544e-08, "grad_condition": 1051094146.3111416, "lr": 0.000468604740235343, "time_sec": 41.67271661758423 }, { "epoch": 79, "train_loss": 1.8873431278610229, "train_acc": 0.49708, "test_loss": 7.06695590133667, "test_acc": 0.0098, "lyapunov": 1.6691140817559285, "grad_norm": 0.7474584387052425, "grad_max_sv": 0.2899070601910353, "grad_min_sv": 1.3942933266980483e-08, "grad_condition": 53163427.383831725, "lr": 0.00045816107833384175, "time_sec": 41.661076068878174 }, { "epoch": 80, "train_loss": 1.8736388172149658, "train_acc": 0.49874, "test_loss": 5.781377349853516, "test_acc": 0.0131, "lyapunov": 1.657112023104792, "grad_norm": 0.7444710747937686, "grad_max_sv": 0.28176243752241137, "grad_min_sv": 1.3972709403224648e-08, "grad_condition": 135132346.79221177, "lr": 0.0004477357683661729, "time_sec": 41.64565968513489 }, { "epoch": 81, "train_loss": 1.8635578856658936, "train_acc": 0.50138, "test_loss": 5.580086952209473, "test_acc": 0.0135, "lyapunov": 1.653865757195846, "grad_norm": 0.7426015737094843, "grad_max_sv": 0.2836704090237617, "grad_min_sv": 1.4010618162646134e-08, "grad_condition": 417585965.539017, "lr": 0.00043733338321784746, "time_sec": 41.66704249382019 }, { "epoch": 82, "train_loss": 1.9041340649414062, "train_acc": 0.49242, "test_loss": 6.370015201568603, "test_acc": 0.0105, "lyapunov": 1.695511110908235, "grad_norm": 0.7494004766823937, "grad_max_sv": 0.2831845413893461, "grad_min_sv": 1.4006210818928722e-08, "grad_condition": 24462326.60074065, "lr": 0.0004269584857187939, "time_sec": 41.662867307662964 }, { "epoch": 83, "train_loss": 1.854377107772827, "train_acc": 0.5052, "test_loss": 5.641559513854981, "test_acc": 0.0107, "lyapunov": 1.6620670087502132, "grad_norm": 0.7432254276366087, "grad_max_sv": 0.2882852029055357, "grad_min_sv": 1.3851731775482712e-08, "grad_condition": 26065103.969512142, "lr": 0.0004166156266419484, "time_sec": 41.68649983406067 }, { "epoch": 84, "train_loss": 1.8346456706237793, "train_acc": 0.50848, "test_loss": 6.769210389709473, "test_acc": 0.0098, "lyapunov": 1.668327778806467, "grad_norm": 0.7445172315386438, "grad_max_sv": 0.2814629077911377, "grad_min_sv": 1.3836396603461587e-08, "grad_condition": 24738537.843654584, "lr": 0.0004063093427071373, "time_sec": 41.7318229675293 }, { "epoch": 85, "train_loss": 1.8456001781845093, "train_acc": 0.50552, "test_loss": 5.615997741699219, "test_acc": 0.0104, "lyapunov": 1.6713733606021424, "grad_norm": 0.745556048003164, "grad_max_sv": 0.2879165679216385, "grad_min_sv": 1.3856432721365275e-08, "grad_condition": 45763261.566603445, "lr": 0.0003960441545911199, "time_sec": 41.671313762664795 }, { "epoch": 86, "train_loss": 1.8304506510925294, "train_acc": 0.5126, "test_loss": 7.119636929321289, "test_acc": 0.0095, "lyapunov": 1.6572847131573025, "grad_norm": 0.742253787791735, "grad_max_sv": 0.2842376373708248, "grad_min_sv": 1.3829741059290246e-08, "grad_condition": 32092921.731909145, "lr": 0.0003858245649446718, "time_sec": 41.68160605430603 }, { "epoch": 87, "train_loss": 1.8023982585525513, "train_acc": 0.51886, "test_loss": 5.729539224243164, "test_acc": 0.0113, "lyapunov": 1.6674704252911345, "grad_norm": 0.7383133748182458, "grad_max_sv": 0.2829333432018757, "grad_min_sv": 1.3776665358511409e-08, "grad_condition": 29369631.195804454, "lr": 0.00037565505641757235, "time_sec": 41.688772439956665 }, { "epoch": 88, "train_loss": 1.7957932733535766, "train_acc": 0.51898, "test_loss": 6.201405425262451, "test_acc": 0.0112, "lyapunov": 1.655544286188872, "grad_norm": 0.7434211551258653, "grad_max_sv": 0.2823782742023468, "grad_min_sv": 1.3752334167282942e-08, "grad_condition": 31024474.496423542, "lr": 0.00036554008969236695, "time_sec": 41.69476914405823 }, { "epoch": 89, "train_loss": 1.8189633627319335, "train_acc": 0.51594, "test_loss": 5.3315957733154296, "test_acc": 0.0128, "lyapunov": 1.6864432809907761, "grad_norm": 0.7442939461149828, "grad_max_sv": 0.2862010933458805, "grad_min_sv": 1.3637743116745593e-08, "grad_condition": 59934587.44977188, "lr": 0.0003554841015277638, "time_sec": 41.66425442695618 }, { "epoch": 90, "train_loss": 1.7849925768280028, "train_acc": 0.52188, "test_loss": 5.472545378112793, "test_acc": 0.0127, "lyapunov": 1.6630497878164892, "grad_norm": 0.7379404154374459, "grad_max_sv": 0.27791005559265614, "grad_min_sv": 1.3561169532293193e-08, "grad_condition": 146436762.42535684, "lr": 0.000345491502812526, "time_sec": 41.68130135536194 }, { "epoch": 91, "train_loss": 1.7678911954879761, "train_acc": 0.52792, "test_loss": 5.433208572387695, "test_acc": 0.0111, "lyapunov": 1.6612660357409426, "grad_norm": 0.7436136899756786, "grad_max_sv": 0.28643885627388954, "grad_min_sv": 1.4077170534636252e-08, "grad_condition": 141313299.4033515, "lr": 0.0003355666766307081, "time_sec": 41.69838857650757 }, { "epoch": 92, "train_loss": 1.7893417644119263, "train_acc": 0.52188, "test_loss": 5.732446333312988, "test_acc": 0.0132, "lyapunov": 1.6719880662001003, "grad_norm": 0.7430166658849362, "grad_max_sv": 0.2796207364648581, "grad_min_sv": 1.370609366835307e-08, "grad_condition": 61381680.96914546, "lr": 0.00032571397633909225, "time_sec": 41.662304639816284 }, { "epoch": 93, "train_loss": 1.793455412979126, "train_acc": 0.51948, "test_loss": 7.157857987976074, "test_acc": 0.0156, "lyapunov": 1.7097750539365022, "grad_norm": 0.7503715678180837, "grad_max_sv": 0.2879045564681292, "grad_min_sv": 1.3920300624692405e-08, "grad_condition": 46032234.96350131, "lr": 0.00031593772365766094, "time_sec": 41.68742322921753 }, { "epoch": 94, "train_loss": 1.790754737892151, "train_acc": 0.51794, "test_loss": 5.853521730041504, "test_acc": 0.0183, "lyapunov": 1.7012710964588253, "grad_norm": 0.7508761734251582, "grad_max_sv": 0.2927242830395699, "grad_min_sv": 1.3959867344037757e-08, "grad_condition": 30783098.824512742, "lr": 0.0003062422067739483, "time_sec": 41.696484327316284 }, { "epoch": 95, "train_loss": 1.7357876617050172, "train_acc": 0.53082, "test_loss": 5.843491268157959, "test_acc": 0.0169, "lyapunov": 1.6724172071422763, "grad_norm": 0.7362974967473044, "grad_max_sv": 0.28096207305788995, "grad_min_sv": 1.3731502089206483e-08, "grad_condition": 72155189.25605753, "lr": 0.00029663167846209965, "time_sec": 41.801615715026855 }, { "epoch": 96, "train_loss": 1.7516635646438599, "train_acc": 0.529, "test_loss": 5.930022283935547, "test_acc": 0.0166, "lyapunov": 1.6662769326773446, "grad_norm": 0.7418130914367154, "grad_max_sv": 0.27851024977862837, "grad_min_sv": 1.3786014568806238e-08, "grad_condition": 27146249.501743816, "lr": 0.00028711035421746345, "time_sec": 41.690131187438965 }, { "epoch": 97, "train_loss": 1.725118031539917, "train_acc": 0.53522, "test_loss": 7.037702999877929, "test_acc": 0.0131, "lyapunov": 1.6579057100178944, "grad_norm": 0.7402503506761774, "grad_max_sv": 0.2801696177572012, "grad_min_sv": 1.3907192450424154e-08, "grad_condition": 27217829.233857714, "lr": 0.00027768241040753615, "time_sec": 41.68803310394287 }, { "epoch": 98, "train_loss": 1.7803752786254883, "train_acc": 0.52198, "test_loss": 5.421708882141114, "test_acc": 0.0156, "lyapunov": 1.718612858706423, "grad_norm": 0.7413849451100987, "grad_max_sv": 0.2769254602491856, "grad_min_sv": 1.3933566225636517e-08, "grad_condition": 207039935.91921127, "lr": 0.00026835198244006903, "time_sec": 41.684860706329346 }, { "epoch": 99, "train_loss": 1.7348972189331056, "train_acc": 0.53522, "test_loss": 5.996163872528077, "test_acc": 0.0138, "lyapunov": 1.7001579844433328, "grad_norm": 0.7422689999529027, "grad_max_sv": 0.284788579121232, "grad_min_sv": 1.3718373463589284e-08, "grad_condition": 32133144.908362694, "lr": 0.0002591231629491421, "time_sec": 41.687785148620605 }, { "epoch": 100, "train_loss": 1.715971527557373, "train_acc": 0.53706, "test_loss": 5.193750161743164, "test_acc": 0.0145, "lyapunov": 1.678100373738867, "grad_norm": 0.7359745614466124, "grad_max_sv": 0.2779096748679876, "grad_min_sv": 1.3629619793897874e-08, "grad_condition": 45906662.87529864, "lr": 0.0002499999999999997, "time_sec": 41.68041801452637 }, { "epoch": 101, "train_loss": 1.7047844717025757, "train_acc": 0.54014, "test_loss": 5.4800733383178715, "test_acc": 0.0147, "lyapunov": 1.6837563725078808, "grad_norm": 0.9365648414768546, "grad_max_sv": 0.27644540667533873, "grad_min_sv": 1.338469317047064e-08, "grad_condition": 58253933.98672454, "lr": 0.00024098649531343477, "time_sec": 41.69390559196472 }, { "epoch": 102, "train_loss": 1.7108585023498535, "train_acc": 0.53936, "test_loss": 5.4571699615478515, "test_acc": 0.0158, "lyapunov": 1.6604459846720976, "grad_norm": 0.7870713313934493, "grad_max_sv": 0.2845739547163248, "grad_min_sv": 1.3875931419160548e-08, "grad_condition": 29653372.68228669, "lr": 0.0002320866025105016, "time_sec": 41.69141387939453 }, { "epoch": 103, "train_loss": 1.7227560781860352, "train_acc": 0.53538, "test_loss": 6.349255479431152, "test_acc": 0.0136, "lyapunov": 1.6870903968811035, "grad_norm": 0.7434197839636765, "grad_max_sv": 0.2914551913738251, "grad_min_sv": 1.3957845548806525e-08, "grad_condition": 32995362.81324634, "lr": 0.0002233042253783278, "time_sec": 41.680914640426636 }, { "epoch": 104, "train_loss": 1.702695262298584, "train_acc": 0.53836, "test_loss": 5.656436128234863, "test_acc": 0.015, "lyapunov": 1.6825833451717407, "grad_norm": 0.7549456718817885, "grad_max_sv": 0.2799145434051752, "grad_min_sv": 1.3645678115237203e-08, "grad_condition": 28379554.63119031, "lr": 0.000214643216157784, "time_sec": 41.65440130233765 }, { "epoch": 105, "train_loss": 1.6862115913772584, "train_acc": 0.54564, "test_loss": 5.472533478546143, "test_acc": 0.0126, "lyapunov": 1.7024933560120175, "grad_norm": 1.26630705617649, "grad_max_sv": 0.279131243750453, "grad_min_sv": 1.38689274988002e-08, "grad_condition": 38224107.421842635, "lr": 0.00020610737385376332, "time_sec": 41.66117596626282 }, { "epoch": 106, "train_loss": 1.6867632722473145, "train_acc": 0.54602, "test_loss": 5.890195466613769, "test_acc": 0.0123, "lyapunov": 1.6856458394423774, "grad_norm": 0.8947104093954833, "grad_max_sv": 0.28173881731927397, "grad_min_sv": 1.3741654582635766e-08, "grad_condition": 79792220.50526081, "lr": 0.00019770044256881242, "time_sec": 41.68054246902466 }, { "epoch": 107, "train_loss": 1.6547852846908568, "train_acc": 0.55128, "test_loss": 5.426952139282227, "test_acc": 0.0138, "lyapunov": 1.6635038605736345, "grad_norm": 0.9461038074599576, "grad_max_sv": 0.28091032803058624, "grad_min_sv": 1.3631295835148105e-08, "grad_condition": 121284689.6114355, "lr": 0.0001894261098608447, "time_sec": 41.6701295375824 }, { "epoch": 108, "train_loss": 1.6798790365219116, "train_acc": 0.54798, "test_loss": 6.159035799407959, "test_acc": 0.0164, "lyapunov": 1.6929522896056894, "grad_norm": 0.743883475009877, "grad_max_sv": 0.28309045545756817, "grad_min_sv": 1.3724124101055502e-08, "grad_condition": 39239015.729782544, "lr": 0.000181288005125655, "time_sec": 41.696985960006714 }, { "epoch": 109, "train_loss": 1.696175348777771, "train_acc": 0.54438, "test_loss": 5.6951647491455075, "test_acc": 0.016, "lyapunov": 1.7148385203402976, "grad_norm": 0.8437266984263797, "grad_max_sv": 0.27865533195436, "grad_min_sv": 1.3687295685738121e-08, "grad_condition": 84166239.98915759, "lr": 0.0001732896980049473, "time_sec": 41.71509552001953 }, { "epoch": 110, "train_loss": 1.6658023331832885, "train_acc": 0.55012, "test_loss": 5.7984600807189945, "test_acc": 0.0143, "lyapunov": 1.6841092344440158, "grad_norm": 0.9121109366716545, "grad_max_sv": 0.29167514853179455, "grad_min_sv": 1.3800432944674478e-08, "grad_condition": 144511278.99640113, "lr": 0.00016543469682057076, "time_sec": 41.66339421272278 }, { "epoch": 111, "train_loss": 1.6395328227615356, "train_acc": 0.554, "test_loss": 5.86650054473877, "test_acc": 0.0152, "lyapunov": 1.6673833018983417, "grad_norm": 0.7699631101372096, "grad_max_sv": 0.28348692767322065, "grad_min_sv": 1.3636408227601927e-08, "grad_condition": 55378180.92666749, "lr": 0.00015772644703565552, "time_sec": 41.665539026260376 }, { "epoch": 112, "train_loss": 1.6477852906799317, "train_acc": 0.55158, "test_loss": 5.940995491790772, "test_acc": 0.0112, "lyapunov": 1.6873568881808034, "grad_norm": 0.7479570199711284, "grad_max_sv": 0.28565193973481656, "grad_min_sv": 1.3545885212663486e-08, "grad_condition": 4195243968.2445326, "lr": 0.00015016832974331713, "time_sec": 41.66239333152771 }, { "epoch": 113, "train_loss": 1.6797285276412963, "train_acc": 0.54658, "test_loss": 5.699360008239746, "test_acc": 0.0169, "lyapunov": 1.7014049044655413, "grad_norm": 0.870968251009497, "grad_max_sv": 0.29082027412950995, "grad_min_sv": 1.3837160986462926e-08, "grad_condition": 38795421.79244965, "lr": 0.00014276366018359834, "time_sec": 41.68905782699585 }, { "epoch": 114, "train_loss": 1.6465518449401855, "train_acc": 0.55668, "test_loss": 6.088453164672852, "test_acc": 0.0164, "lyapunov": 1.7043657921769124, "grad_norm": 0.8946839109968647, "grad_max_sv": 0.2849067386239767, "grad_min_sv": 1.3802866963286143e-08, "grad_condition": 25630247.743903965, "lr": 0.00013551568628929425, "time_sec": 41.66656756401062 }, { "epoch": 115, "train_loss": 1.6319327460479736, "train_acc": 0.55656, "test_loss": 6.832156317138672, "test_acc": 0.0153, "lyapunov": 1.7021731708360754, "grad_norm": 0.7410352883319467, "grad_max_sv": 0.28490288034081457, "grad_min_sv": 1.3852848871828693e-08, "grad_condition": 105769705.67995845, "lr": 0.00012842758726130276, "time_sec": 41.65516543388367 }, { "epoch": 116, "train_loss": 1.6370894707107544, "train_acc": 0.55944, "test_loss": 6.086082221984864, "test_acc": 0.0152, "lyapunov": 1.704162275089937, "grad_norm": 0.7404525214110508, "grad_max_sv": 0.2851620279252529, "grad_min_sv": 1.3774486038592437e-08, "grad_condition": 64341791.17616973, "lr": 0.0001215024721741218, "time_sec": 41.70033001899719 }, { "epoch": 117, "train_loss": 1.6296995531082152, "train_acc": 0.5565, "test_loss": 5.999611178588867, "test_acc": 0.0158, "lyapunov": 1.6899978895016643, "grad_norm": 0.7413749466972203, "grad_max_sv": 0.28470359593629835, "grad_min_sv": 1.3795419027962108e-08, "grad_condition": 46293176.84023976, "lr": 0.00011474337861210538, "time_sec": 41.66957759857178 }, { "epoch": 118, "train_loss": 1.6183696263122558, "train_acc": 0.56042, "test_loss": 5.902465699768066, "test_acc": 0.0155, "lyapunov": 1.6653556753607357, "grad_norm": 0.752028873574231, "grad_max_sv": 0.2849472999572754, "grad_min_sv": 1.3723038618310146e-08, "grad_condition": 108717082.80762736, "lr": 0.00010815327133708009, "time_sec": 41.65808391571045 }, { "epoch": 119, "train_loss": 1.6181411283111573, "train_acc": 0.56246, "test_loss": 5.821061138153076, "test_acc": 0.0127, "lyapunov": 1.6990043498061198, "grad_norm": 0.9212306864426181, "grad_max_sv": 0.2813797727227211, "grad_min_sv": 1.3685392258322438e-08, "grad_condition": 36721469.46741449, "lr": 0.00010173504098790182, "time_sec": 41.65668511390686 }, { "epoch": 120, "train_loss": 1.6332576264572143, "train_acc": 0.55946, "test_loss": 5.637864579772949, "test_acc": 0.0158, "lyapunov": 1.7040051304165968, "grad_norm": 0.8758295019344725, "grad_max_sv": 0.2898151889443398, "grad_min_sv": 1.4175130585991625e-08, "grad_condition": 40539456.12140705, "lr": 9.549150281252629e-05, "time_sec": 41.7333300113678 }, { "epoch": 121, "train_loss": 1.6032706314468383, "train_acc": 0.56424, "test_loss": 6.044293823242188, "test_acc": 0.0161, "lyapunov": 1.687883598420321, "grad_norm": 0.8855358425086, "grad_max_sv": 0.28492439053952695, "grad_min_sv": 1.3791471256685561e-08, "grad_condition": 26792072.142948806, "lr": 8.942539543314794e-05, "time_sec": 41.69478678703308 }, { "epoch": 122, "train_loss": 1.6067510599517822, "train_acc": 0.56546, "test_loss": 6.217616750335694, "test_acc": 0.0169, "lyapunov": 1.6955407583500113, "grad_norm": 1.007631118576203, "grad_max_sv": 0.2878258924931288, "grad_min_sv": 1.3879796437188396e-08, "grad_condition": 33084555.795453023, "lr": 8.353937964495024e-05, "time_sec": 41.67023324966431 }, { "epoch": 123, "train_loss": 1.6053743167114258, "train_acc": 0.56268, "test_loss": 6.328966861724854, "test_acc": 0.0153, "lyapunov": 1.6795075369612944, "grad_norm": 0.8699000468731735, "grad_max_sv": 0.2898880571126938, "grad_min_sv": 1.3709727229513358e-08, "grad_condition": 124246234.40071194, "lr": 7.783603724899243e-05, "time_sec": 41.660712242126465 }, { "epoch": 124, "train_loss": 1.6071837269973754, "train_acc": 0.56286, "test_loss": 6.1388191246032715, "test_acc": 0.0167, "lyapunov": 1.7264370232286965, "grad_norm": 0.8940529497792777, "grad_max_sv": 0.28389453068375586, "grad_min_sv": 1.3959469480351316e-08, "grad_condition": 24432394.03377783, "lr": 7.231786991974666e-05, "time_sec": 41.68312621116638 }, { "epoch": 125, "train_loss": 1.6100223978042603, "train_acc": 0.56692, "test_loss": 5.9885783233642575, "test_acc": 0.0166, "lyapunov": 1.7270872559388886, "grad_norm": 1.0226142905420907, "grad_max_sv": 0.28528097458183765, "grad_min_sv": 1.3753909883229553e-08, "grad_condition": 59401243.51928474, "lr": 6.698729810778072e-05, "time_sec": 41.70276618003845 }, { "epoch": 126, "train_loss": 1.6035814072036743, "train_acc": 0.56344, "test_loss": 6.076493969726562, "test_acc": 0.011, "lyapunov": 1.6876506253581522, "grad_norm": 0.9642119889310449, "grad_max_sv": 0.2870322696864605, "grad_min_sv": 1.3708104407150756e-08, "grad_condition": 28048573.443991415, "lr": 6.184665997806817e-05, "time_sec": 41.8551926612854 }, { "epoch": 127, "train_loss": 1.6120177191162108, "train_acc": 0.56444, "test_loss": 6.843795123291016, "test_acc": 0.0159, "lyapunov": 1.7337111725526697, "grad_norm": 0.8368578920332793, "grad_max_sv": 0.28001562878489494, "grad_min_sv": 1.3889535929734187e-08, "grad_condition": 62985977.61673013, "lr": 5.6898210384392595e-05, "time_sec": 41.68673539161682 }, { "epoch": 128, "train_loss": 1.6090134407424928, "train_acc": 0.56466, "test_loss": 6.320640184783936, "test_acc": 0.0146, "lyapunov": 1.7266684904732668, "grad_norm": 0.7858511448483877, "grad_max_sv": 0.2850359447300434, "grad_min_sv": 1.3702059388498444e-08, "grad_condition": 42801480.40100025, "lr": 5.214411988029363e-05, "time_sec": 41.68818187713623 }, { "epoch": 129, "train_loss": 1.6249183625030517, "train_acc": 0.56476, "test_loss": 6.549667198181153, "test_acc": 0.0162, "lyapunov": 1.8164921944098704, "grad_norm": 1.5114520241024798, "grad_max_sv": 0.2812469657510519, "grad_min_sv": 1.3925696595862291e-08, "grad_condition": 57029114.93811275, "lr": 4.7586473766990294e-05, "time_sec": 41.79629635810852 }, { "epoch": 130, "train_loss": 1.5824087297058105, "train_acc": 0.57044, "test_loss": 6.021063035583496, "test_acc": 0.0176, "lyapunov": 1.70903730880269, "grad_norm": 0.7379608621319285, "grad_max_sv": 0.279190668836236, "grad_min_sv": 1.3621928689200313e-08, "grad_condition": 32815172.113138717, "lr": 4.32272711786996e-05, "time_sec": 41.70122241973877 }, { "epoch": 131, "train_loss": 1.595119048576355, "train_acc": 0.56984, "test_loss": 6.4952160888671875, "test_acc": 0.0155, "lyapunov": 1.754641688083444, "grad_norm": 1.0023213514600722, "grad_max_sv": 0.2834797468036413, "grad_min_sv": 1.3511996389131698e-08, "grad_condition": 68519633.56325917, "lr": 3.906842420574966e-05, "time_sec": 41.72273635864258 }, { "epoch": 132, "train_loss": 1.5923931760787964, "train_acc": 0.57014, "test_loss": 6.346144076538086, "test_acc": 0.0148, "lyapunov": 1.73292323177123, "grad_norm": 0.7501780068501551, "grad_max_sv": 0.28294241838157175, "grad_min_sv": 1.389686744160748e-08, "grad_condition": 365347440.4407994, "lr": 3.5111757055874305e-05, "time_sec": 41.898685693740845 }, { "epoch": 133, "train_loss": 1.6026707472991943, "train_acc": 0.57266, "test_loss": 6.185466950988769, "test_acc": 0.0179, "lyapunov": 1.8438011843834996, "grad_norm": 0.9394783942730687, "grad_max_sv": 0.2847215086221695, "grad_min_sv": 1.390161358527653e-08, "grad_condition": 34103085.04162355, "lr": 3.1359005254054254e-05, "time_sec": 41.84562015533447 }, { "epoch": 134, "train_loss": 1.6043600881576539, "train_acc": 0.56972, "test_loss": 6.54779362411499, "test_acc": 0.0168, "lyapunov": 1.8157421551701967, "grad_norm": 0.9578717543319566, "grad_max_sv": 0.2788985829800367, "grad_min_sv": 1.373801071791192e-08, "grad_condition": 33295442.566805385, "lr": 2.7811814881259484e-05, "time_sec": 41.748968839645386 }, { "epoch": 135, "train_loss": 1.6008320109558105, "train_acc": 0.56734, "test_loss": 6.480984884643554, "test_acc": 0.0164, "lyapunov": 1.824832089111933, "grad_norm": 0.7833960844227048, "grad_max_sv": 0.2834679901599884, "grad_min_sv": 1.3707274611196584e-08, "grad_condition": 34742063.3411188, "lr": 2.4471741852423218e-05, "time_sec": 41.679542541503906 }, { "epoch": 136, "train_loss": 1.6033842488479615, "train_acc": 0.57426, "test_loss": 6.3071887496948245, "test_acc": 0.0161, "lyapunov": 1.8717652309276258, "grad_norm": 1.1623205937404684, "grad_max_sv": 0.28173171132802965, "grad_min_sv": 1.3602863799255793e-08, "grad_condition": 47504661.60977468, "lr": 2.1340251233966362e-05, "time_sec": 41.70148062705994 }, { "epoch": 137, "train_loss": 1.585039638633728, "train_acc": 0.57336, "test_loss": 6.212019223022461, "test_acc": 0.0167, "lyapunov": 1.8105511723272025, "grad_norm": 0.76774524189785, "grad_max_sv": 0.2841952469199896, "grad_min_sv": 1.3692064346898514e-08, "grad_condition": 45911317.56625296, "lr": 1.8418716601170932e-05, "time_sec": 41.718605279922485 }, { "epoch": 138, "train_loss": 1.584446519355774, "train_acc": 0.57526, "test_loss": 6.243849922943115, "test_acc": 0.0165, "lyapunov": 1.828900443928321, "grad_norm": 0.7339440588405652, "grad_max_sv": 0.2821473300457001, "grad_min_sv": 1.3492376377960413e-08, "grad_condition": 46486868.242411375, "lr": 1.570841943568445e-05, "time_sec": 41.803757667541504 }, { "epoch": 139, "train_loss": 1.591472290611267, "train_acc": 0.57168, "test_loss": 6.332618227386474, "test_acc": 0.0164, "lyapunov": 1.8522861116682476, "grad_norm": 0.7344821119501195, "grad_max_sv": 0.2718358475714922, "grad_min_sv": 1.3269187557063412e-08, "grad_condition": 28030061.559468903, "lr": 1.3210548563419845e-05, "time_sec": 41.6920862197876 }, { "epoch": 140, "train_loss": 1.614663985748291, "train_acc": 0.57106, "test_loss": 6.035421504974365, "test_acc": 0.0166, "lyapunov": 1.865170035825666, "grad_norm": 0.7488812688556887, "grad_max_sv": 0.28298918418586255, "grad_min_sv": 1.3682502991718692e-08, "grad_condition": 24201290.710221395, "lr": 1.0926199633097203e-05, "time_sec": 41.67938685417175 }, { "epoch": 141, "train_loss": 1.602144892578125, "train_acc": 0.57176, "test_loss": 6.090472431182861, "test_acc": 0.0168, "lyapunov": 1.8573481064013508, "grad_norm": 0.9964350746023342, "grad_max_sv": 0.28083013482391833, "grad_min_sv": 1.342545436419651e-08, "grad_condition": 71076432.31589943, "lr": 8.856374635655688e-06, "time_sec": 41.67989158630371 }, { "epoch": 142, "train_loss": 1.5910524003982545, "train_acc": 0.574, "test_loss": 6.0493482467651365, "test_acc": 0.0167, "lyapunov": 1.8519471301447095, "grad_norm": 0.7327372969700953, "grad_max_sv": 0.28154470436275003, "grad_min_sv": 1.3814112725940574e-08, "grad_condition": 40685021.10874365, "lr": 7.001981464747503e-06, "time_sec": 41.87545084953308 }, { "epoch": 143, "train_loss": 1.5878816836166383, "train_acc": 0.5754, "test_loss": 6.0228049758911135, "test_acc": 0.0173, "lyapunov": 1.835201174096988, "grad_norm": 0.7329380251080414, "grad_max_sv": 0.2804208301007748, "grad_min_sv": 1.3855345770696913e-08, "grad_condition": 24866442.419618618, "lr": 5.3638335185058295e-06, "time_sec": 41.670424938201904 }, { "epoch": 144, "train_loss": 1.5844879238891603, "train_acc": 0.57532, "test_loss": 6.013319036102295, "test_acc": 0.0167, "lyapunov": 1.797589682557089, "grad_norm": 0.7332915407418003, "grad_max_sv": 0.2873740203678608, "grad_min_sv": 1.3867528024166797e-08, "grad_condition": 66782743.82880296, "lr": 3.942649342761114e-06, "time_sec": 41.666340827941895 }, { "epoch": 145, "train_loss": 1.5729130697250366, "train_acc": 0.57884, "test_loss": 5.962558745574952, "test_acc": 0.0174, "lyapunov": 1.8133810779932515, "grad_norm": 0.7304773544167381, "grad_max_sv": 0.2831062778830528, "grad_min_sv": 1.3597974729551154e-08, "grad_condition": 27885577.58840422, "lr": 2.7390523158633524e-06, "time_sec": 41.66122889518738 }, { "epoch": 146, "train_loss": 1.5774464596939086, "train_acc": 0.57336, "test_loss": 6.056200170898437, "test_acc": 0.0176, "lyapunov": 1.8052761911431237, "grad_norm": 0.7323581109158898, "grad_max_sv": 0.27999263890087606, "grad_min_sv": 1.3672255842755998e-08, "grad_condition": 30955091.121420026, "lr": 1.7535703752478133e-06, "time_sec": 41.6817889213562 }, { "epoch": 147, "train_loss": 1.5797025276184082, "train_acc": 0.57294, "test_loss": 6.142494761657715, "test_acc": 0.0163, "lyapunov": 1.8119597739880653, "grad_norm": 0.7326729565983514, "grad_max_sv": 0.2801577255129814, "grad_min_sv": 1.3520314751103158e-08, "grad_condition": 24177790.25879824, "lr": 9.866357858642196e-07, "time_sec": 41.667490005493164 }, { "epoch": 148, "train_loss": 1.5737435025787354, "train_acc": 0.57896, "test_loss": 6.0964897369384765, "test_acc": 0.016, "lyapunov": 1.8165211808651, "grad_norm": 0.7295448230456424, "grad_max_sv": 0.2751427095383406, "grad_min_sv": 1.348928903022184e-08, "grad_condition": 24265473.368122566, "lr": 4.38584950570808e-07, "time_sec": 41.68909525871277 }, { "epoch": 149, "train_loss": 1.5774297478485106, "train_acc": 0.5743, "test_loss": 6.148982523345947, "test_acc": 0.0159, "lyapunov": 1.8202249927593923, "grad_norm": 0.7313561355684882, "grad_max_sv": 0.2817809645086527, "grad_min_sv": 1.3657219487261951e-08, "grad_condition": 38822037.86584419, "lr": 1.096582625772501e-07, "time_sec": 41.70693755149841 }, { "epoch": 150, "train_loss": 1.5808244900512696, "train_acc": 0.57584, "test_loss": 5.973857634735108, "test_acc": 0.0172, "lyapunov": 1.8156279499268593, "grad_norm": 0.7308465286184226, "grad_max_sv": 0.28174142725765705, "grad_min_sv": 1.372764353510525e-08, "grad_condition": 43888249.75048177, "lr": 0.0, "time_sec": 41.68298602104187 } ], "8": [ { "epoch": 1, "train_loss": 5.021671794891358, "train_acc": 0.02426, "test_loss": 4.758953214263916, "test_acc": 0.0194, "lyapunov": 2.365524544740272, "grad_norm": 5.666214881321602, "grad_max_sv": 4.635834372043609, "grad_min_sv": 9.740842493444202e-08, "grad_condition": 345906665.41414034, "lr": 0.0009998903417374227, "time_sec": 86.94375228881836 }, { "epoch": 2, "train_loss": 4.6419046446228025, "train_acc": 0.03036, "test_loss": 4.812141468811035, "test_acc": 0.0141, "lyapunov": 1.8034114608984164, "grad_norm": 3.7942354948877397, "grad_max_sv": 2.932516324520111, "grad_min_sv": 6.569729187888563e-08, "grad_condition": 162956558.25651228, "lr": 0.0009995614150494292, "time_sec": 86.91073846817017 }, { "epoch": 3, "train_loss": 4.522548667297364, "train_acc": 0.03148, "test_loss": 4.54623723449707, "test_acc": 0.0238, "lyapunov": 1.6952560444926972, "grad_norm": 2.3455501053352146, "grad_max_sv": 1.7244864150881767, "grad_min_sv": 4.1950142698997384e-08, "grad_condition": 6680092616.82326, "lr": 0.0009990133642141358, "time_sec": 86.88951110839844 }, { "epoch": 4, "train_loss": 4.4614645977783205, "train_acc": 0.0325, "test_loss": 5.176557122039795, "test_acc": 0.0101, "lyapunov": 1.6139005059781282, "grad_norm": 1.5168077426412896, "grad_max_sv": 0.9842755444347858, "grad_min_sv": 2.4031745480719025e-08, "grad_condition": 11261049173.025684, "lr": 0.0009982464296247522, "time_sec": 86.94786024093628 }, { "epoch": 5, "train_loss": 4.4149443920898435, "train_acc": 0.03626, "test_loss": 5.137158406066894, "test_acc": 0.01, "lyapunov": 1.6045118917894485, "grad_norm": 1.2582953215287522, "grad_max_sv": 0.7553236961364747, "grad_min_sv": 2.073135719031505e-08, "grad_condition": 222472203.43764964, "lr": 0.0009972609476841367, "time_sec": 86.93599653244019 }, { "epoch": 6, "train_loss": 4.404399389801025, "train_acc": 0.03718, "test_loss": 5.152426997375488, "test_acc": 0.0145, "lyapunov": 1.5948826068502557, "grad_norm": 1.0525562897343101, "grad_max_sv": 0.5827781304717063, "grad_min_sv": 1.6368500771208466e-08, "grad_condition": 975204505.0574242, "lr": 0.000996057350657239, "time_sec": 86.89734673500061 }, { "epoch": 7, "train_loss": 4.373200228271484, "train_acc": 0.0427, "test_loss": 5.138384069824219, "test_acc": 0.01, "lyapunov": 1.5917642296427656, "grad_norm": 0.979719698336329, "grad_max_sv": 0.5500100567936897, "grad_min_sv": 1.578485221420678e-08, "grad_condition": 40146995.15588243, "lr": 0.000994636166481494, "time_sec": 86.9030191898346 }, { "epoch": 8, "train_loss": 4.3614981033325195, "train_acc": 0.04452, "test_loss": 5.208292040252686, "test_acc": 0.0158, "lyapunov": 1.5925918241291095, "grad_norm": 0.8254065825253598, "grad_max_sv": 0.43389859050512314, "grad_min_sv": 1.2995100632032242e-08, "grad_condition": 93911652.28137563, "lr": 0.0009929980185352525, "time_sec": 86.902259349823 }, { "epoch": 9, "train_loss": 4.359973902893066, "train_acc": 0.04506, "test_loss": 4.722157088470459, "test_acc": 0.018, "lyapunov": 1.5934884682335817, "grad_norm": 0.7465758222368373, "grad_max_sv": 0.3876167729496956, "grad_min_sv": 1.1805707171921865e-08, "grad_condition": 96983113.34478703, "lr": 0.0009911436253643444, "time_sec": 86.9238531589508 }, { "epoch": 10, "train_loss": 4.4141249188232425, "train_acc": 0.03536, "test_loss": 5.436407916259766, "test_acc": 0.01, "lyapunov": 1.5828703861407307, "grad_norm": 0.6206738544013151, "grad_max_sv": 0.3251112919300795, "grad_min_sv": 9.17487998804145e-09, "grad_condition": 105514243.19237423, "lr": 0.0009890738003669028, "time_sec": 86.9449622631073 }, { "epoch": 11, "train_loss": 4.426171367950439, "train_acc": 0.0344, "test_loss": 4.693856712341309, "test_acc": 0.0236, "lyapunov": 1.5946678465894422, "grad_norm": 0.5860438322533541, "grad_max_sv": 0.2918587654829025, "grad_min_sv": 6.5412758706696685e-09, "grad_condition": 5280467761.157875, "lr": 0.00098678945143658, "time_sec": 86.91325283050537 }, { "epoch": 12, "train_loss": 4.3411827925109865, "train_acc": 0.04538, "test_loss": 5.247728338623046, "test_acc": 0.0136, "lyapunov": 1.5863848153282614, "grad_norm": 0.5956948826941676, "grad_max_sv": 0.2928905326873064, "grad_min_sv": 8.411352403828177e-09, "grad_condition": 128968920.19480267, "lr": 0.0009842915805643154, "time_sec": 86.90281319618225 }, { "epoch": 13, "train_loss": 4.339786265563965, "train_acc": 0.04572, "test_loss": 5.686103868103027, "test_acc": 0.0125, "lyapunov": 1.5810096681575336, "grad_norm": 0.5604669884006932, "grad_max_sv": 0.2611371923238039, "grad_min_sv": 8.195694697898936e-09, "grad_condition": 39688248.11524393, "lr": 0.000981581283398829, "time_sec": 86.90422630310059 }, { "epoch": 14, "train_loss": 4.35356285232544, "train_acc": 0.04532, "test_loss": 4.883278243255615, "test_acc": 0.015, "lyapunov": 1.579099393866556, "grad_norm": 0.528427576292652, "grad_max_sv": 0.2469606887549162, "grad_min_sv": 7.61194059832604e-09, "grad_condition": 168282434.76948723, "lr": 0.0009786597487660333, "time_sec": 86.88846230506897 }, { "epoch": 15, "train_loss": 4.3755184262084965, "train_acc": 0.04264, "test_loss": 6.138819856262207, "test_acc": 0.0126, "lyapunov": 1.6284648536721154, "grad_norm": 0.5259167846709967, "grad_max_sv": 0.25808656550943854, "grad_min_sv": 7.094433302975989e-09, "grad_condition": 78394577.54559764, "lr": 0.0009755282581475766, "time_sec": 86.88808155059814 }, { "epoch": 16, "train_loss": 4.3449753375244144, "train_acc": 0.04422, "test_loss": 4.874321587371826, "test_acc": 0.0139, "lyapunov": 1.592136370861317, "grad_norm": 0.5849477114279426, "grad_max_sv": 0.2871789067983627, "grad_min_sv": 7.143974147904957e-09, "grad_condition": 825777754.2283806, "lr": 0.0009721881851187403, "time_sec": 86.88666772842407 }, { "epoch": 17, "train_loss": 4.326568845520019, "train_acc": 0.04702, "test_loss": 4.870712732696533, "test_acc": 0.0106, "lyapunov": 1.579986076830598, "grad_norm": 0.587479722542324, "grad_max_sv": 0.2732066046446562, "grad_min_sv": 6.707479306713086e-09, "grad_condition": 933588154.4592457, "lr": 0.0009686409947459456, "time_sec": 86.94699215888977 }, { "epoch": 18, "train_loss": 4.290269263916016, "train_acc": 0.04908, "test_loss": 4.543920527648925, "test_acc": 0.0184, "lyapunov": 1.5655539648612138, "grad_norm": 0.5190972278925252, "grad_max_sv": 0.27400444857776163, "grad_min_sv": 7.268163138354766e-09, "grad_condition": 103768651.90634331, "lr": 0.0009648882429441254, "time_sec": 86.91610383987427 }, { "epoch": 19, "train_loss": 4.277731272888183, "train_acc": 0.0529, "test_loss": 4.523501123046875, "test_acc": 0.0234, "lyapunov": 1.5601860742129938, "grad_norm": 0.5064673349074232, "grad_max_sv": 0.26197145469486716, "grad_min_sv": 7.129040378514584e-09, "grad_condition": 89369620.75339693, "lr": 0.00096093157579425, "time_sec": 86.9239010810852 }, { "epoch": 20, "train_loss": 4.283599534912109, "train_acc": 0.04918, "test_loss": 4.699870119476318, "test_acc": 0.01, "lyapunov": 1.573568820343603, "grad_norm": 0.4940062913988571, "grad_max_sv": 0.24619702994823456, "grad_min_sv": 6.7696058640709375e-09, "grad_condition": 72620577.46255757, "lr": 0.0009567727288213001, "time_sec": 86.96331477165222 }, { "epoch": 21, "train_loss": 4.293489807434082, "train_acc": 0.05038, "test_loss": 4.714311406707764, "test_acc": 0.0108, "lyapunov": 1.5708344915638799, "grad_norm": 0.545017777953754, "grad_max_sv": 0.2541573029011488, "grad_min_sv": 6.718018621953981e-09, "grad_condition": 42979908.88210177, "lr": 0.0009524135262330095, "time_sec": 86.91739249229431 }, { "epoch": 22, "train_loss": 4.2768078778076175, "train_acc": 0.0541, "test_loss": 4.779728842163086, "test_acc": 0.01, "lyapunov": 1.5667131340412228, "grad_norm": 0.5092105231068674, "grad_max_sv": 0.27126444056630133, "grad_min_sv": 7.1301694416769925e-09, "grad_condition": 57355277.993238926, "lr": 0.0009478558801197061, "time_sec": 86.9019386768341 }, { "epoch": 23, "train_loss": 4.27697469543457, "train_acc": 0.05122, "test_loss": 4.672700902557373, "test_acc": 0.01, "lyapunov": 1.5615102702089587, "grad_norm": 0.4784115114004879, "grad_max_sv": 0.24027332551777364, "grad_min_sv": 6.443715307516418e-09, "grad_condition": 95371819.86060278, "lr": 0.000943101789615607, "time_sec": 86.91923117637634 }, { "epoch": 24, "train_loss": 4.278717909088135, "train_acc": 0.05186, "test_loss": 4.900936952209473, "test_acc": 0.01, "lyapunov": 1.5694453353467195, "grad_norm": 0.4949771017584012, "grad_max_sv": 0.24392427019774915, "grad_min_sv": 6.253112343201916e-09, "grad_condition": 49683498.32382451, "lr": 0.0009381533400219313, "time_sec": 86.95798850059509 }, { "epoch": 25, "train_loss": 4.284033089141846, "train_acc": 0.0516, "test_loss": 4.647933837890625, "test_acc": 0.01, "lyapunov": 1.610082578781011, "grad_norm": 0.4618580067316832, "grad_max_sv": 0.21940371356904506, "grad_min_sv": 5.9646471067820174e-09, "grad_condition": 44077507.34171269, "lr": 0.0009330127018922189, "time_sec": 86.92604160308838 }, { "epoch": 26, "train_loss": 4.27171460357666, "train_acc": 0.0513, "test_loss": 4.689661137390137, "test_acc": 0.01, "lyapunov": 1.5887331782704424, "grad_norm": 0.45567402361835824, "grad_max_sv": 0.20672011002898216, "grad_min_sv": 5.767535921075151e-09, "grad_condition": 44437336.12601619, "lr": 0.000927682130080253, "time_sec": 86.91289949417114 }, { "epoch": 27, "train_loss": 4.287545222320556, "train_acc": 0.0503, "test_loss": 4.6759644165039065, "test_acc": 0.0105, "lyapunov": 1.6080376479936682, "grad_norm": 0.4608750254003879, "grad_max_sv": 0.21028368686675095, "grad_min_sv": 5.734315782138567e-09, "grad_condition": 303277586.5403552, "lr": 0.0009221639627510072, "time_sec": 86.92653059959412 }, { "epoch": 28, "train_loss": 4.26929240020752, "train_acc": 0.05308, "test_loss": 4.89806633605957, "test_acc": 0.011, "lyapunov": 1.6118984780348171, "grad_norm": 0.43418302492765676, "grad_max_sv": 0.20326684638857842, "grad_min_sv": 5.713833948692293e-09, "grad_condition": 85779552.11325228, "lr": 0.0009164606203550494, "time_sec": 86.91330051422119 }, { "epoch": 29, "train_loss": 4.253239243469238, "train_acc": 0.05616, "test_loss": 4.924478411865234, "test_acc": 0.01, "lyapunov": 1.6098854767392055, "grad_norm": 0.4850634248026458, "grad_max_sv": 0.20474721789360045, "grad_min_sv": 5.8581581326979866e-09, "grad_condition": 912075238.28812, "lr": 0.0009105746045668516, "time_sec": 86.93636131286621 }, { "epoch": 30, "train_loss": 4.235443085327148, "train_acc": 0.0606, "test_loss": 5.510071346282959, "test_acc": 0.01, "lyapunov": 1.571061046532048, "grad_norm": 0.45361919630223685, "grad_max_sv": 0.2025857836008072, "grad_min_sv": 5.868267084763179e-09, "grad_condition": 42096450.95484826, "lr": 0.0009045084971874733, "time_sec": 86.9319851398468 }, { "epoch": 31, "train_loss": 4.231041951293945, "train_acc": 0.05988, "test_loss": 5.147942330932617, "test_acc": 0.01, "lyapunov": 1.5691828867968391, "grad_norm": 0.432720376091447, "grad_max_sv": 0.19395264871418477, "grad_min_sv": 6.259870760638719e-09, "grad_condition": 34343773.40740795, "lr": 0.0008982649590120977, "time_sec": 86.94789290428162 }, { "epoch": 32, "train_loss": 4.2413297773742675, "train_acc": 0.0587, "test_loss": 5.009992076873779, "test_acc": 0.01, "lyapunov": 1.5915203551807062, "grad_norm": 0.4122171639918169, "grad_max_sv": 0.182863287627697, "grad_min_sv": 5.790357663650308e-09, "grad_condition": 714325029.1851714, "lr": 0.0008918467286629196, "time_sec": 86.911212682724 }, { "epoch": 33, "train_loss": 4.2658996716308595, "train_acc": 0.0542, "test_loss": 5.127438952636719, "test_acc": 0.0101, "lyapunov": 1.579336861210406, "grad_norm": 0.44521811591156923, "grad_max_sv": 0.19066935162991286, "grad_min_sv": 5.523765223003352e-09, "grad_condition": 53898858.78718817, "lr": 0.0008852566213878943, "time_sec": 86.91553449630737 }, { "epoch": 34, "train_loss": 4.242719013824463, "train_acc": 0.05736, "test_loss": 5.307705741882324, "test_acc": 0.01, "lyapunov": 1.554588299273225, "grad_norm": 0.40056388572882007, "grad_max_sv": 0.19328901916742325, "grad_min_sv": 5.563922629570062e-09, "grad_condition": 45803958.546867594, "lr": 0.000878497527825878, "time_sec": 86.91433024406433 }, { "epoch": 35, "train_loss": 4.213116936340332, "train_acc": 0.06228, "test_loss": 5.048512329101563, "test_acc": 0.01, "lyapunov": 1.548424531126876, "grad_norm": 0.40286521350806986, "grad_max_sv": 0.18639697767794133, "grad_min_sv": 5.634928314929288e-09, "grad_condition": 47861656.46465705, "lr": 0.000871572412738697, "time_sec": 86.94499635696411 }, { "epoch": 36, "train_loss": 4.46321242477417, "train_acc": 0.02644, "test_loss": 7.976507986450195, "test_acc": 0.01, "lyapunov": 1.5736174876122828, "grad_norm": 0.3688662413553731, "grad_max_sv": 0.1843747731298208, "grad_min_sv": 1.027042620136494e-09, "grad_condition": 23392046595.39054, "lr": 0.0008644843137107055, "time_sec": 86.94508624076843 }, { "epoch": 37, "train_loss": 4.448079302368164, "train_acc": 0.02678, "test_loss": 5.779720497131348, "test_acc": 0.01, "lyapunov": 1.5641913728031052, "grad_norm": 0.3319698693631811, "grad_max_sv": 0.17876109518110753, "grad_min_sv": 2.4601973283386735e-10, "grad_condition": 23401419871.768867, "lr": 0.0008572363398164014, "time_sec": 86.95254611968994 }, { "epoch": 38, "train_loss": 4.4511954998779295, "train_acc": 0.02752, "test_loss": 9.1264736038208, "test_acc": 0.01, "lyapunov": 1.5642469356127102, "grad_norm": 0.2986469281617768, "grad_max_sv": 0.1681674152612686, "grad_min_sv": 2.3341577206836764e-10, "grad_condition": 26143404878.86806, "lr": 0.0008498316702566826, "time_sec": 87.00612330436707 }, { "epoch": 39, "train_loss": 4.4328032247924805, "train_acc": 0.03036, "test_loss": 10.002013760375977, "test_acc": 0.01, "lyapunov": 1.545380079532828, "grad_norm": 0.31612252817270037, "grad_max_sv": 0.17967074736952782, "grad_min_sv": 1.3078811700331324e-09, "grad_condition": 7630262604.515658, "lr": 0.0008422735529643442, "time_sec": 86.96651196479797 }, { "epoch": 40, "train_loss": 4.410691116485595, "train_acc": 0.03262, "test_loss": 10.329160571289062, "test_acc": 0.01, "lyapunov": 1.544363977963967, "grad_norm": 0.3305250196532406, "grad_max_sv": 0.18044610992074012, "grad_min_sv": 2.8862289467267156e-09, "grad_condition": 208503955.3202583, "lr": 0.0008345653031794289, "time_sec": 86.93889307975769 }, { "epoch": 41, "train_loss": 4.40241349319458, "train_acc": 0.03342, "test_loss": 7.508806234741211, "test_acc": 0.01, "lyapunov": 1.5479626981803523, "grad_norm": 0.37593581599125797, "grad_max_sv": 0.17868120335042476, "grad_min_sv": 2.733827051543125e-09, "grad_condition": 137280184.1727237, "lr": 0.0008267103019950526, "time_sec": 86.95495200157166 }, { "epoch": 42, "train_loss": 4.370949498138428, "train_acc": 0.03828, "test_loss": 6.459606773376465, "test_acc": 0.01, "lyapunov": 1.5444700297187357, "grad_norm": 0.3619230318860018, "grad_max_sv": 0.16240518875420093, "grad_min_sv": 3.560387096604445e-09, "grad_condition": 86248484.21915439, "lr": 0.0008187119948743447, "time_sec": 86.94808578491211 }, { "epoch": 43, "train_loss": 4.395889522705078, "train_acc": 0.03416, "test_loss": 7.4897293304443355, "test_acc": 0.01, "lyapunov": 1.5568798454216375, "grad_norm": 0.3066578397068162, "grad_max_sv": 0.15977313853800296, "grad_min_sv": 2.1426118134706616e-09, "grad_condition": 694043179.0150942, "lr": 0.000810573890139155, "time_sec": 86.97652959823608 }, { "epoch": 44, "train_loss": 4.395970639190674, "train_acc": 0.0331, "test_loss": 6.251794491577148, "test_acc": 0.01, "lyapunov": 1.5505369288842086, "grad_norm": 0.3558862909608559, "grad_max_sv": 0.15992271900177002, "grad_min_sv": 2.2060850382588092e-09, "grad_condition": 314610426.30490005, "lr": 0.0008022995574311873, "time_sec": 86.97155785560608 }, { "epoch": 45, "train_loss": 4.3631904621887205, "train_acc": 0.03756, "test_loss": 5.525508670043945, "test_acc": 0.01, "lyapunov": 1.5545306144772892, "grad_norm": 0.3150905966342124, "grad_max_sv": 0.15917456932365895, "grad_min_sv": 2.917880549419688e-09, "grad_condition": 172334946.43984643, "lr": 0.0007938926261462363, "time_sec": 86.95413851737976 }, { "epoch": 46, "train_loss": 4.385730860290527, "train_acc": 0.03456, "test_loss": 5.2734522521972655, "test_acc": 0.01, "lyapunov": 1.5768346917598755, "grad_norm": 0.30280594802628175, "grad_max_sv": 0.15774821415543555, "grad_min_sv": 3.0362800302642657e-09, "grad_condition": 276419213.49352396, "lr": 0.0007853567838422158, "time_sec": 86.9428277015686 }, { "epoch": 47, "train_loss": 4.421937339019776, "train_acc": 0.03154, "test_loss": 5.600688215637207, "test_acc": 0.01, "lyapunov": 1.5790051977957607, "grad_norm": 0.33072277785528675, "grad_max_sv": 0.16996506713330745, "grad_min_sv": 2.771691926927583e-09, "grad_condition": 320580453.11077607, "lr": 0.0007766957746216719, "time_sec": 86.92568945884705 }, { "epoch": 48, "train_loss": 4.417486723175049, "train_acc": 0.0318, "test_loss": 5.850329084014892, "test_acc": 0.01, "lyapunov": 1.5709409283859956, "grad_norm": 0.3015658481608736, "grad_max_sv": 0.16958414614200593, "grad_min_sv": 2.117095306404743e-09, "grad_condition": 1465805966.8142715, "lr": 0.0007679133974894982, "time_sec": 86.98221182823181 }, { "epoch": 49, "train_loss": 4.413777235107422, "train_acc": 0.03204, "test_loss": 5.770690809631348, "test_acc": 0.01, "lyapunov": 1.5579876326539022, "grad_norm": 0.3480252425503119, "grad_max_sv": 0.16178445334080607, "grad_min_sv": 2.0201714462289255e-09, "grad_condition": 2834174702.248597, "lr": 0.000759013504686565, "time_sec": 87.00604128837585 }, { "epoch": 50, "train_loss": 4.4205519735717775, "train_acc": 0.0298, "test_loss": 5.984611973571777, "test_acc": 0.01, "lyapunov": 1.5497863826239506, "grad_norm": 0.2905045703519568, "grad_max_sv": 0.15919520035386087, "grad_min_sv": 9.888408669417747e-10, "grad_condition": 5631365913.291557, "lr": 0.0007499999999999998, "time_sec": 86.96013498306274 }, { "epoch": 51, "train_loss": 4.41098743927002, "train_acc": 0.0325, "test_loss": 6.533537203979492, "test_acc": 0.01, "lyapunov": 1.555987215407974, "grad_norm": 0.30379457449464103, "grad_max_sv": 0.16679704934358597, "grad_min_sv": 2.413719297654146e-09, "grad_condition": 341047841.4947473, "lr": 0.0007408768370508575, "time_sec": 86.97173476219177 }, { "epoch": 52, "train_loss": 4.390000881347656, "train_acc": 0.03462, "test_loss": 5.217885815429687, "test_acc": 0.01, "lyapunov": 1.5600232867633594, "grad_norm": 0.32784156163445544, "grad_max_sv": 0.15694030448794366, "grad_min_sv": 2.8198880390462035e-09, "grad_condition": 111339990.40279654, "lr": 0.0007316480175599307, "time_sec": 86.9988853931427 }, { "epoch": 53, "train_loss": 4.288632299194336, "train_acc": 0.04882, "test_loss": 8.274944879150391, "test_acc": 0.01, "lyapunov": 1.565576893899142, "grad_norm": 0.3486314610649234, "grad_max_sv": 0.1506714668124914, "grad_min_sv": 3.930395829632172e-09, "grad_condition": 78544413.37347092, "lr": 0.0007223175895924635, "time_sec": 86.96367621421814 }, { "epoch": 54, "train_loss": 4.362063083496094, "train_acc": 0.03894, "test_loss": 5.243001276397705, "test_acc": 0.01, "lyapunov": 1.5714266458740624, "grad_norm": 0.33670855500975183, "grad_max_sv": 0.1638818845152855, "grad_min_sv": 3.341216674862535e-09, "grad_condition": 143330583.52604035, "lr": 0.0007128896457825361, "time_sec": 86.96970129013062 }, { "epoch": 55, "train_loss": 4.3985242970275875, "train_acc": 0.0349, "test_loss": 5.079080085754395, "test_acc": 0.01, "lyapunov": 1.557041028881317, "grad_norm": 0.3110407590384958, "grad_max_sv": 0.13654662668704987, "grad_min_sv": 3.0798576551929748e-09, "grad_condition": 90826613.18081078, "lr": 0.0007033683215378998, "time_sec": 86.96664762496948 }, { "epoch": 56, "train_loss": 4.3555380534362795, "train_acc": 0.03972, "test_loss": 5.452935369873047, "test_acc": 0.01, "lyapunov": 1.560518858987657, "grad_norm": 0.31258330150396313, "grad_max_sv": 0.15348581783473492, "grad_min_sv": 3.6443401876112836e-09, "grad_condition": 63305882.37131055, "lr": 0.0006937577932260512, "time_sec": 87.06724190711975 }, { "epoch": 57, "train_loss": 4.381474671783447, "train_acc": 0.03686, "test_loss": 7.36265283203125, "test_acc": 0.01, "lyapunov": 1.5697053960522118, "grad_norm": 0.3865664941898656, "grad_max_sv": 0.15512134719174356, "grad_min_sv": 3.3817354081872146e-09, "grad_condition": 457011679.7340926, "lr": 0.0006840622763423388, "time_sec": 87.06652784347534 }, { "epoch": 58, "train_loss": 4.403821620025635, "train_acc": 0.03228, "test_loss": 8.040378480529785, "test_acc": 0.01, "lyapunov": 1.5559333075038002, "grad_norm": 0.29135723667857816, "grad_max_sv": 0.16249749660491944, "grad_min_sv": 2.647806284818144e-09, "grad_condition": 607788328.9678621, "lr": 0.0006742860236609073, "time_sec": 87.00199866294861 }, { "epoch": 59, "train_loss": 4.402755667114258, "train_acc": 0.0333, "test_loss": 8.325734463500977, "test_acc": 0.01, "lyapunov": 1.5946810336978845, "grad_norm": 0.31029489050735465, "grad_max_sv": 0.15088103022426366, "grad_min_sv": 2.4962215631335606e-09, "grad_condition": 846951781.3818216, "lr": 0.0006644333233692913, "time_sec": 86.94004797935486 }, { "epoch": 60, "train_loss": 4.4194785871887206, "train_acc": 0.02986, "test_loss": 9.861287240600586, "test_acc": 0.01, "lyapunov": 1.5665948046442797, "grad_norm": 0.2681308492085899, "grad_max_sv": 0.13850090205669402, "grad_min_sv": 5.255404293767318e-10, "grad_condition": 4977286898.088277, "lr": 0.0006545084971874734, "time_sec": 86.9956967830658 }, { "epoch": 61, "train_loss": 4.416754204711914, "train_acc": 0.03102, "test_loss": 6.132235699462891, "test_acc": 0.01, "lyapunov": 1.5757032172454288, "grad_norm": 0.30003715480279103, "grad_max_sv": 0.13602122720330953, "grad_min_sv": 8.228586455857377e-10, "grad_condition": 13175326162.721104, "lr": 0.0006445158984722354, "time_sec": 86.99738907814026 }, { "epoch": 62, "train_loss": 4.400070931243897, "train_acc": 0.03248, "test_loss": 6.946181610870362, "test_acc": 0.01, "lyapunov": 1.5760818457664432, "grad_norm": 0.2705000538096509, "grad_max_sv": 0.1345938090234995, "grad_min_sv": 6.920980580521832e-10, "grad_condition": 1943244549.4253707, "lr": 0.0006344599103076324, "time_sec": 87.10566878318787 }, { "epoch": 63, "train_loss": 4.397411993865966, "train_acc": 0.03356, "test_loss": 6.4025613311767575, "test_acc": 0.01, "lyapunov": 1.5691703021373895, "grad_norm": 0.295770706108135, "grad_max_sv": 0.13735821805894374, "grad_min_sv": 6.700764958362821e-10, "grad_condition": 4282192212.8114214, "lr": 0.0006243449435824269, "time_sec": 87.11572027206421 }, { "epoch": 64, "train_loss": 4.411172714538575, "train_acc": 0.03268, "test_loss": 6.260893269348145, "test_acc": 0.01, "lyapunov": 1.5818147948940697, "grad_norm": 0.3079314625857066, "grad_max_sv": 0.12949498016387223, "grad_min_sv": 1.4190367893734219e-10, "grad_condition": 12329273937.565323, "lr": 0.0006141754350553275, "time_sec": 86.98852014541626 }, { "epoch": 65, "train_loss": 4.395129007568359, "train_acc": 0.03392, "test_loss": 6.5868188064575195, "test_acc": 0.01, "lyapunov": 1.5632798476597232, "grad_norm": 0.25782867400033804, "grad_max_sv": 0.12777244430035353, "grad_min_sv": 2.976579219378644e-10, "grad_condition": 5942895423.124485, "lr": 0.0006039558454088793, "time_sec": 87.11568331718445 }, { "epoch": 66, "train_loss": 4.406106295013427, "train_acc": 0.0315, "test_loss": 6.073413898468018, "test_acc": 0.01, "lyapunov": 1.576541522884613, "grad_norm": 0.30947554951534784, "grad_max_sv": 0.1285885890945792, "grad_min_sv": 5.432121253815892e-10, "grad_condition": 6217167701.43366, "lr": 0.000593690657292862, "time_sec": 87.17264008522034 }, { "epoch": 67, "train_loss": 4.393605449829102, "train_acc": 0.03414, "test_loss": 6.305842741394043, "test_acc": 0.01, "lyapunov": 1.5533494059082187, "grad_norm": 0.25961319227506663, "grad_max_sv": 0.12907455265522003, "grad_min_sv": 1.6513973369542203e-09, "grad_condition": 1871563855.9625301, "lr": 0.0005833843733580507, "time_sec": 87.04546856880188 }, { "epoch": 68, "train_loss": 4.397481441650391, "train_acc": 0.03526, "test_loss": 9.038330000305177, "test_acc": 0.01, "lyapunov": 1.5915909249459386, "grad_norm": 0.3105737189018771, "grad_max_sv": 0.1272705690935254, "grad_min_sv": 1.1124955923331755e-09, "grad_condition": 6291710890.600344, "lr": 0.0005730415142812054, "time_sec": 87.03171014785767 }, { "epoch": 69, "train_loss": 4.432055924072266, "train_acc": 0.02954, "test_loss": 6.220795520019531, "test_acc": 0.01, "lyapunov": 1.606788797756595, "grad_norm": 0.2965672457851634, "grad_max_sv": 0.11880129799246789, "grad_min_sv": 5.90287951778381e-11, "grad_condition": 15582797170.964344, "lr": 0.0005626666167821517, "time_sec": 87.01269674301147 }, { "epoch": 70, "train_loss": 4.433936797943115, "train_acc": 0.02888, "test_loss": 6.659252740478515, "test_acc": 0.01, "lyapunov": 1.5713767874271363, "grad_norm": 0.23364690554453782, "grad_max_sv": 0.11591648273169994, "grad_min_sv": 1.5320265177461676e-10, "grad_condition": 17166771390.34465, "lr": 0.0005522642316338265, "time_sec": 87.01791882514954 }, { "epoch": 71, "train_loss": 4.438748676300049, "train_acc": 0.02874, "test_loss": 6.609808558654785, "test_acc": 0.01, "lyapunov": 1.584676984021121, "grad_norm": 0.2633441624923964, "grad_max_sv": 0.11810853406786918, "grad_min_sv": 1.1007920121830777e-10, "grad_condition": 12701526680.721195, "lr": 0.0005418389216661573, "time_sec": 86.99067282676697 }, { "epoch": 72, "train_loss": 4.428876764984131, "train_acc": 0.029, "test_loss": 7.024348274230957, "test_acc": 0.01, "lyapunov": 1.5694371559430875, "grad_norm": 0.2586705276163511, "grad_max_sv": 0.11742300663609058, "grad_min_sv": 4.3393096759821404e-11, "grad_condition": 17654480120.057854, "lr": 0.0005313952597646563, "time_sec": 86.99662733078003 }, { "epoch": 73, "train_loss": 4.406545689849853, "train_acc": 0.033, "test_loss": 5.295959346008301, "test_acc": 0.01, "lyapunov": 1.598822437283938, "grad_norm": 0.48160257702896175, "grad_max_sv": 0.12682502008974553, "grad_min_sv": 1.6137241577078923e-09, "grad_condition": 1098514733.1527858, "lr": 0.0005209378268645994, "time_sec": 86.98713731765747 }, { "epoch": 74, "train_loss": 4.371206529998779, "train_acc": 0.03752, "test_loss": 6.3423968727111815, "test_acc": 0.01, "lyapunov": 1.5900212995841374, "grad_norm": 0.2599656462367281, "grad_max_sv": 0.11894330121576786, "grad_min_sv": 2.0068056321743966e-09, "grad_condition": 322985873.66543674, "lr": 0.0005104712099416781, "time_sec": 87.01381850242615 }, { "epoch": 75, "train_loss": 4.4355110260009765, "train_acc": 0.03008, "test_loss": 6.5740388412475586, "test_acc": 0.01, "lyapunov": 1.5995566000414017, "grad_norm": 0.46971014639594094, "grad_max_sv": 0.11837511248886586, "grad_min_sv": 9.224606550920768e-10, "grad_condition": 5756377475.535638, "lr": 0.0004999999999999996, "time_sec": 86.98455214500427 }, { "epoch": 76, "train_loss": 4.386026970672607, "train_acc": 0.03692, "test_loss": 7.027304895019531, "test_acc": 0.01, "lyapunov": 1.5754540259271022, "grad_norm": 0.26903612071874217, "grad_max_sv": 0.11812076661735774, "grad_min_sv": 2.299920467269123e-09, "grad_condition": 91850509.00722608, "lr": 0.0004895287900583212, "time_sec": 86.98026323318481 }, { "epoch": 77, "train_loss": 4.393477527923584, "train_acc": 0.03412, "test_loss": 6.660316326904297, "test_acc": 0.01, "lyapunov": 1.5862211976819636, "grad_norm": 0.3013890397473114, "grad_max_sv": 0.1351075556129217, "grad_min_sv": 2.3924681109713588e-09, "grad_condition": 445706368.4192219, "lr": 0.0004790621731353997, "time_sec": 86.97005081176758 }, { "epoch": 78, "train_loss": 4.546225792083741, "train_acc": 0.0251, "test_loss": 5.343878612518311, "test_acc": 0.01, "lyapunov": 1.5964782609963966, "grad_norm": 0.90282337732271, "grad_max_sv": 0.20608680080622435, "grad_min_sv": 2.659187132906355e-09, "grad_condition": 7860910669.836441, "lr": 0.000468604740235343, "time_sec": 86.96122479438782 }, { "epoch": 79, "train_loss": 4.357597355346679, "train_acc": 0.04282, "test_loss": 8.47580428466797, "test_acc": 0.01, "lyapunov": 1.6247231682853016, "grad_norm": 0.3014093640980023, "grad_max_sv": 0.13778700064867735, "grad_min_sv": 3.3349062959070475e-09, "grad_condition": 113414547.08337688, "lr": 0.00045816107833384175, "time_sec": 86.99122476577759 }, { "epoch": 80, "train_loss": 4.353704885253906, "train_acc": 0.04112, "test_loss": 7.1475914855957035, "test_acc": 0.01, "lyapunov": 1.646431783581024, "grad_norm": 0.2930066807721922, "grad_max_sv": 0.14062532242387532, "grad_min_sv": 3.158852413670532e-09, "grad_condition": 56459529.26701255, "lr": 0.0004477357683661729, "time_sec": 86.95756244659424 }, { "epoch": 81, "train_loss": 4.300996598510742, "train_acc": 0.0489, "test_loss": 5.905246903991699, "test_acc": 0.01, "lyapunov": 1.5976380972606141, "grad_norm": 0.3041834155807877, "grad_max_sv": 0.14135726243257524, "grad_min_sv": 3.5767058866736924e-09, "grad_condition": 57327864.423104, "lr": 0.00043733338321784746, "time_sec": 86.97077941894531 }, { "epoch": 82, "train_loss": 4.3091406649780275, "train_acc": 0.04946, "test_loss": 7.282952543640136, "test_acc": 0.01, "lyapunov": 1.6646705594514033, "grad_norm": 0.32878525949020004, "grad_max_sv": 0.1341265318915248, "grad_min_sv": 3.612622626048001e-09, "grad_condition": 55658705.11435084, "lr": 0.0004269584857187939, "time_sec": 86.95407176017761 }, { "epoch": 83, "train_loss": 4.3103489337158205, "train_acc": 0.0477, "test_loss": 6.477012939453125, "test_acc": 0.01, "lyapunov": 1.6391792172361213, "grad_norm": 0.2962764376330481, "grad_max_sv": 0.13159138858318328, "grad_min_sv": 3.4047045499975907e-09, "grad_condition": 518340281.28618824, "lr": 0.0004166156266419484, "time_sec": 86.94712162017822 }, { "epoch": 84, "train_loss": 4.36897839553833, "train_acc": 0.03928, "test_loss": 7.850455484008789, "test_acc": 0.01, "lyapunov": 1.6661204986864953, "grad_norm": 0.28424512363766397, "grad_max_sv": 0.13404478561133146, "grad_min_sv": 3.010059496851036e-09, "grad_condition": 3110503073.168424, "lr": 0.0004063093427071373, "time_sec": 86.97210931777954 }, { "epoch": 85, "train_loss": 4.437010177459717, "train_acc": 0.03262, "test_loss": 9.851054901123048, "test_acc": 0.01, "lyapunov": 1.8142987602507061, "grad_norm": 0.2956023765215779, "grad_max_sv": 0.1340159485116601, "grad_min_sv": 1.7363556922736066e-09, "grad_condition": 1531015855.923596, "lr": 0.0003960441545911199, "time_sec": 86.96314144134521 }, { "epoch": 86, "train_loss": 4.416305867919922, "train_acc": 0.03328, "test_loss": 8.345118670654298, "test_acc": 0.01, "lyapunov": 1.6857655969117304, "grad_norm": 0.36818360732987215, "grad_max_sv": 0.1309028506744653, "grad_min_sv": 1.6532958094842372e-09, "grad_condition": 3316626722.3164024, "lr": 0.0003858245649446718, "time_sec": 86.98166847229004 }, { "epoch": 87, "train_loss": 4.4015829487609865, "train_acc": 0.03524, "test_loss": 12.013820776367188, "test_acc": 0.01, "lyapunov": 1.7373071418089026, "grad_norm": 0.2760253519467448, "grad_max_sv": 0.1359336195513606, "grad_min_sv": 2.3007044532528943e-09, "grad_condition": 346456514.74827063, "lr": 0.00037565505641757235, "time_sec": 86.93886590003967 }, { "epoch": 88, "train_loss": 4.4740436238098145, "train_acc": 0.0295, "test_loss": 6.990837461853027, "test_acc": 0.01, "lyapunov": 1.6694230228433828, "grad_norm": 0.43177687387451896, "grad_max_sv": 0.18005888294428588, "grad_min_sv": 2.4754363480046505e-09, "grad_condition": 195635928.7701267, "lr": 0.00036554008969236695, "time_sec": 86.95178961753845 }, { "epoch": 89, "train_loss": 4.411496069488526, "train_acc": 0.03514, "test_loss": 11.70218861694336, "test_acc": 0.01, "lyapunov": 1.7507646498472795, "grad_norm": 0.31033816746007103, "grad_max_sv": 0.14542356096208095, "grad_min_sv": 2.638068418488876e-09, "grad_condition": 139957124.11622453, "lr": 0.0003554841015277638, "time_sec": 86.93717288970947 }, { "epoch": 90, "train_loss": 4.404713847961426, "train_acc": 0.03648, "test_loss": 9.9756316696167, "test_acc": 0.01, "lyapunov": 1.807755483995618, "grad_norm": 0.35906280668802704, "grad_max_sv": 0.1372342212125659, "grad_min_sv": 2.7565777874737076e-09, "grad_condition": 675780697.8457712, "lr": 0.000345491502812526, "time_sec": 86.93306636810303 }, { "epoch": 91, "train_loss": 4.408483022918701, "train_acc": 0.0368, "test_loss": 7.146534729003906, "test_acc": 0.01, "lyapunov": 1.801394305570656, "grad_norm": 0.3109524713855987, "grad_max_sv": 0.13791952189058065, "grad_min_sv": 2.771594766713681e-09, "grad_condition": 92088285.24973363, "lr": 0.0003355666766307081, "time_sec": 87.15299654006958 }, { "epoch": 92, "train_loss": 4.409290451202392, "train_acc": 0.03586, "test_loss": 14.403669937133788, "test_acc": 0.01, "lyapunov": 1.7155236371642792, "grad_norm": 0.4463202756830642, "grad_max_sv": 0.1406608471646905, "grad_min_sv": 2.481988065313384e-09, "grad_condition": 2274242135.598548, "lr": 0.00032571397633909225, "time_sec": 86.9645299911499 }, { "epoch": 93, "train_loss": 4.38183258102417, "train_acc": 0.03594, "test_loss": 14.732258331298828, "test_acc": 0.01, "lyapunov": 1.642303287525616, "grad_norm": 0.28509807189744846, "grad_max_sv": 0.14340070001780986, "grad_min_sv": 2.788214630510509e-09, "grad_condition": 661394156.996754, "lr": 0.00031593772365766094, "time_sec": 86.95910167694092 }, { "epoch": 94, "train_loss": 4.385672190704346, "train_acc": 0.03708, "test_loss": 14.926625048828125, "test_acc": 0.01, "lyapunov": 1.6731561519910612, "grad_norm": 0.3134461909653867, "grad_max_sv": 0.13709199130535127, "grad_min_sv": 2.8174823593109245e-09, "grad_condition": 118734750.50598077, "lr": 0.0003062422067739483, "time_sec": 86.92044115066528 }, { "epoch": 95, "train_loss": 4.3819806816101075, "train_acc": 0.03738, "test_loss": 11.074764614868164, "test_acc": 0.01, "lyapunov": 1.7133415379487644, "grad_norm": 0.33153421078042083, "grad_max_sv": 0.1331325426697731, "grad_min_sv": 2.8642708720452715e-09, "grad_condition": 165102808.59407786, "lr": 0.00029663167846209965, "time_sec": 86.93906211853027 }, { "epoch": 96, "train_loss": 4.404074432220459, "train_acc": 0.03724, "test_loss": 10.12900542602539, "test_acc": 0.01, "lyapunov": 1.7632283039410095, "grad_norm": 0.3911637522793098, "grad_max_sv": 0.12627853509038686, "grad_min_sv": 2.4115265688864905e-09, "grad_condition": 541677422.6672779, "lr": 0.00028711035421746345, "time_sec": 86.93936419487 }, { "epoch": 97, "train_loss": 4.451261331481934, "train_acc": 0.0326, "test_loss": 5.3055485847473145, "test_acc": 0.01, "lyapunov": 1.8559754114321736, "grad_norm": 0.5079628716235006, "grad_max_sv": 0.12650683380197733, "grad_min_sv": 1.8654332285903626e-09, "grad_condition": 10465021306.197956, "lr": 0.00027768241040753615, "time_sec": 86.9362096786499 }, { "epoch": 98, "train_loss": 4.457196118621826, "train_acc": 0.03388, "test_loss": 5.874557138061523, "test_acc": 0.01, "lyapunov": 1.8899869574305346, "grad_norm": 0.40869012587460146, "grad_max_sv": 0.136830860003829, "grad_min_sv": 2.1947758774298626e-09, "grad_condition": 2135302003.3466086, "lr": 0.00026835198244006903, "time_sec": 86.93851733207703 }, { "epoch": 99, "train_loss": 4.461137276153565, "train_acc": 0.03376, "test_loss": 7.712980445861817, "test_acc": 0.01, "lyapunov": 1.9207234422264197, "grad_norm": 0.44593651641010523, "grad_max_sv": 0.154570347443223, "grad_min_sv": 2.743885928125303e-09, "grad_condition": 11426608589.300367, "lr": 0.0002591231629491421, "time_sec": 86.93646287918091 }, { "epoch": 100, "train_loss": 4.4880205709838865, "train_acc": 0.0309, "test_loss": 4.7405736495971675, "test_acc": 0.01, "lyapunov": 1.9402269292670442, "grad_norm": 0.5314169008984867, "grad_max_sv": 0.17140868678689003, "grad_min_sv": 2.9702306628132115e-09, "grad_condition": 68768483.18390863, "lr": 0.0002499999999999997, "time_sec": 86.96372699737549 }, { "epoch": 101, "train_loss": 4.516919324493408, "train_acc": 0.02856, "test_loss": 4.631107287597656, "test_acc": 0.01, "lyapunov": 1.8684387063736196, "grad_norm": 0.40457693704891007, "grad_max_sv": 0.17230616863816978, "grad_min_sv": 3.0731200580808025e-09, "grad_condition": 123538009.91902074, "lr": 0.00024098649531343477, "time_sec": 86.94155859947205 }, { "epoch": 102, "train_loss": 4.4609598399353025, "train_acc": 0.03628, "test_loss": 4.7487232215881345, "test_acc": 0.01, "lyapunov": 1.9666810218635422, "grad_norm": 1.4354338025926532, "grad_max_sv": 0.1278171473182738, "grad_min_sv": 2.1240830764037368e-09, "grad_condition": 9763663835.33721, "lr": 0.0002320866025105016, "time_sec": 86.95742726325989 }, { "epoch": 103, "train_loss": 4.386784707641602, "train_acc": 0.04782, "test_loss": 4.745209142303467, "test_acc": 0.01, "lyapunov": 2.016990929918216, "grad_norm": 0.7337516988127725, "grad_max_sv": 0.13401773255318403, "grad_min_sv": 3.1091931931848117e-09, "grad_condition": 60104344.68401686, "lr": 0.0002233042253783278, "time_sec": 86.95129346847534 }, { "epoch": 104, "train_loss": 4.375011655273438, "train_acc": 0.04672, "test_loss": 4.693084164428711, "test_acc": 0.01, "lyapunov": 1.9775711432137453, "grad_norm": 1.0479430580386422, "grad_max_sv": 0.12959324829280378, "grad_min_sv": 3.1502246932574305e-09, "grad_condition": 77237986.61774956, "lr": 0.000214643216157784, "time_sec": 86.95826411247253 }, { "epoch": 105, "train_loss": 4.405172659912109, "train_acc": 0.04668, "test_loss": 4.741758982849121, "test_acc": 0.01, "lyapunov": 2.0328768131982944, "grad_norm": 0.4687797625820131, "grad_max_sv": 0.12328344490379095, "grad_min_sv": 3.1737769629405777e-09, "grad_condition": 85772134.99380484, "lr": 0.00020610737385376332, "time_sec": 86.93880844116211 }, { "epoch": 106, "train_loss": 4.356244638671875, "train_acc": 0.04978, "test_loss": 4.669058666992187, "test_acc": 0.01, "lyapunov": 1.8990197315850221, "grad_norm": 0.4676609605386515, "grad_max_sv": 0.13252175226807594, "grad_min_sv": 3.525467490855805e-09, "grad_condition": 52596210.13089059, "lr": 0.00019770044256881242, "time_sec": 86.96025395393372 }, { "epoch": 107, "train_loss": 4.388246943969727, "train_acc": 0.04924, "test_loss": 4.68506374206543, "test_acc": 0.01, "lyapunov": 1.9624325927261197, "grad_norm": 0.4545225835797128, "grad_max_sv": 0.13236304577440022, "grad_min_sv": 3.35203632160358e-09, "grad_condition": 105742345.63281551, "lr": 0.0001894261098608447, "time_sec": 86.91460108757019 }, { "epoch": 108, "train_loss": 4.3695238963317875, "train_acc": 0.0483, "test_loss": 4.651059510803223, "test_acc": 0.01, "lyapunov": 1.9490872517876003, "grad_norm": 0.3584506383494584, "grad_max_sv": 0.13239602297544478, "grad_min_sv": 3.544706423871946e-09, "grad_condition": 66536799.35327874, "lr": 0.000181288005125655, "time_sec": 86.93394088745117 }, { "epoch": 109, "train_loss": 4.394715529022217, "train_acc": 0.04782, "test_loss": 4.621646475219727, "test_acc": 0.01, "lyapunov": 2.0419393695528854, "grad_norm": 0.4760680798020925, "grad_max_sv": 0.12705831751227378, "grad_min_sv": 3.4668329873532855e-09, "grad_condition": 42335589.552427046, "lr": 0.0001732896980049473, "time_sec": 86.94732666015625 }, { "epoch": 110, "train_loss": 4.396159273681641, "train_acc": 0.04692, "test_loss": 4.635798811340332, "test_acc": 0.01, "lyapunov": 1.9756651958236304, "grad_norm": 0.5216765889891325, "grad_max_sv": 0.1416484847664833, "grad_min_sv": 3.2233721108509276e-09, "grad_condition": 671403726.1537082, "lr": 0.00016543469682057076, "time_sec": 86.9427604675293 }, { "epoch": 111, "train_loss": 4.381094040985108, "train_acc": 0.04852, "test_loss": 4.627859112548828, "test_acc": 0.01, "lyapunov": 1.9908651262902848, "grad_norm": 0.45725032205485455, "grad_max_sv": 0.1261982116382569, "grad_min_sv": 3.3899231258877062e-09, "grad_condition": 95101801.02691573, "lr": 0.00015772644703565552, "time_sec": 86.96308636665344 }, { "epoch": 112, "train_loss": 4.365775197753906, "train_acc": 0.04556, "test_loss": 4.630611195373535, "test_acc": 0.01, "lyapunov": 1.7899589819066666, "grad_norm": 0.327253288333232, "grad_max_sv": 0.12595976889133453, "grad_min_sv": 3.5455886261692714e-09, "grad_condition": 83078444.71479167, "lr": 0.00015016832974331713, "time_sec": 86.92891812324524 }, { "epoch": 113, "train_loss": 4.326185424499512, "train_acc": 0.04906, "test_loss": 4.624507279968261, "test_acc": 0.01, "lyapunov": 1.743294736308515, "grad_norm": 0.30709867178590255, "grad_max_sv": 0.12423296440392732, "grad_min_sv": 3.5773004710814434e-09, "grad_condition": 294726116.3341021, "lr": 0.00014276366018359834, "time_sec": 86.93962240219116 }, { "epoch": 114, "train_loss": 4.36080623336792, "train_acc": 0.04476, "test_loss": 4.638040520477295, "test_acc": 0.01, "lyapunov": 1.7487388175466787, "grad_norm": 0.2896504251843997, "grad_max_sv": 0.12205407582223415, "grad_min_sv": 3.2766004282210047e-09, "grad_condition": 256392136.90108904, "lr": 0.00013551568628929425, "time_sec": 86.93535208702087 }, { "epoch": 115, "train_loss": 4.368169149475098, "train_acc": 0.0457, "test_loss": 4.695854078674317, "test_acc": 0.01, "lyapunov": 1.7834696016653115, "grad_norm": 0.292592900967331, "grad_max_sv": 0.11619443818926811, "grad_min_sv": 3.1756336950887087e-09, "grad_condition": 1621784198.0725887, "lr": 0.00012842758726130276, "time_sec": 86.98673295974731 }, { "epoch": 116, "train_loss": 4.387150159606934, "train_acc": 0.04296, "test_loss": 4.669398309326172, "test_acc": 0.01, "lyapunov": 1.90544245035752, "grad_norm": 0.3736850472793119, "grad_max_sv": 0.11484571509063243, "grad_min_sv": 3.1586906028280294e-09, "grad_condition": 96176772.93288267, "lr": 0.0001215024721741218, "time_sec": 86.95901346206665 }, { "epoch": 117, "train_loss": 4.474187949371338, "train_acc": 0.04052, "test_loss": 4.7027623680114745, "test_acc": 0.01, "lyapunov": 2.13019656860615, "grad_norm": 0.4706454049323369, "grad_max_sv": 0.15399074126034976, "grad_min_sv": 3.3639367810409104e-09, "grad_condition": 148375942.6842225, "lr": 0.00011474337861210538, "time_sec": 86.95926237106323 }, { "epoch": 118, "train_loss": 4.414019877319336, "train_acc": 0.04538, "test_loss": 4.650316640472412, "test_acc": 0.01, "lyapunov": 2.0560264450204953, "grad_norm": 0.42333097819604315, "grad_max_sv": 0.11436628978699445, "grad_min_sv": 3.070071629500382e-09, "grad_condition": 1871812696.3982494, "lr": 0.00010815327133708009, "time_sec": 86.95543646812439 }, { "epoch": 119, "train_loss": 4.386474652862549, "train_acc": 0.04654, "test_loss": 4.6715775375366215, "test_acc": 0.01, "lyapunov": 1.969224628889957, "grad_norm": 0.47947570620147545, "grad_max_sv": 0.1272017750889063, "grad_min_sv": 3.3292521794958674e-09, "grad_condition": 61497599.9453614, "lr": 0.00010173504098790182, "time_sec": 86.94949531555176 }, { "epoch": 120, "train_loss": 4.384591791992188, "train_acc": 0.04658, "test_loss": 4.632473320007324, "test_acc": 0.0077, "lyapunov": 1.9927328724385527, "grad_norm": 0.5289661566724388, "grad_max_sv": 0.1261268701404333, "grad_min_sv": 3.4284845490395456e-09, "grad_condition": 48538207.83291945, "lr": 9.549150281252629e-05, "time_sec": 86.94581913948059 }, { "epoch": 121, "train_loss": 4.385587129669189, "train_acc": 0.04774, "test_loss": 4.632090152740479, "test_acc": 0.01, "lyapunov": 2.0432661521770155, "grad_norm": 0.4859111606482192, "grad_max_sv": 0.11864052936434746, "grad_min_sv": 3.4766741936753665e-09, "grad_condition": 60808462.870111085, "lr": 8.942539543314794e-05, "time_sec": 86.94836401939392 }, { "epoch": 122, "train_loss": 4.37459453338623, "train_acc": 0.05042, "test_loss": 4.624907290649414, "test_acc": 0.01, "lyapunov": 2.0131407037110587, "grad_norm": 0.4855933253122246, "grad_max_sv": 0.11917878109961748, "grad_min_sv": 3.5260590100505416e-09, "grad_condition": 40236226.2868594, "lr": 8.353937964495024e-05, "time_sec": 86.96557188034058 }, { "epoch": 123, "train_loss": 4.384435540771484, "train_acc": 0.04966, "test_loss": 4.6222803535461425, "test_acc": 0.01, "lyapunov": 2.056239744891291, "grad_norm": 0.4869249888343625, "grad_max_sv": 0.13170703500509262, "grad_min_sv": 3.4749707009465447e-09, "grad_condition": 81569926.69224386, "lr": 7.783603724899243e-05, "time_sec": 86.94557666778564 }, { "epoch": 124, "train_loss": 4.411828415222168, "train_acc": 0.04734, "test_loss": 4.617088554382324, "test_acc": 0.01, "lyapunov": 2.088481501850021, "grad_norm": 0.6074321406428054, "grad_max_sv": 0.13408620320260525, "grad_min_sv": 3.669820186798234e-09, "grad_condition": 89563715.17480934, "lr": 7.231786991974666e-05, "time_sec": 86.94801068305969 }, { "epoch": 125, "train_loss": 4.379881989440918, "train_acc": 0.04928, "test_loss": 4.626477690124512, "test_acc": 0.01, "lyapunov": 2.0224476098404516, "grad_norm": 0.5566340932563276, "grad_max_sv": 0.11598262693732977, "grad_min_sv": 3.3913336450717977e-09, "grad_condition": 154440174.8024956, "lr": 6.698729810778072e-05, "time_sec": 86.95501017570496 }, { "epoch": 126, "train_loss": 4.406389302368164, "train_acc": 0.04668, "test_loss": 4.62824654006958, "test_acc": 0.01, "lyapunov": 2.0166642894525357, "grad_norm": 0.5564968205221957, "grad_max_sv": 0.12961208932101725, "grad_min_sv": 3.404863768707855e-09, "grad_condition": 46850126.917104796, "lr": 6.184665997806817e-05, "time_sec": 86.89860510826111 }, { "epoch": 127, "train_loss": 4.421845231018066, "train_acc": 0.04476, "test_loss": 4.664912997436524, "test_acc": 0.01, "lyapunov": 2.0588970028835796, "grad_norm": 0.54518049391847, "grad_max_sv": 0.13061115611344576, "grad_min_sv": 3.511758283128441e-09, "grad_condition": 220500422.1836423, "lr": 5.6898210384392595e-05, "time_sec": 86.902822971344 }, { "epoch": 128, "train_loss": 4.466351209259034, "train_acc": 0.04156, "test_loss": 4.625092854309082, "test_acc": 0.01, "lyapunov": 2.054337273168442, "grad_norm": 0.8009056003184672, "grad_max_sv": 0.15183761473745108, "grad_min_sv": 3.3345070037309657e-09, "grad_condition": 1708739228.5454607, "lr": 5.214411988029363e-05, "time_sec": 86.9044144153595 }, { "epoch": 129, "train_loss": 4.410576982879639, "train_acc": 0.0476, "test_loss": 4.881959016418457, "test_acc": 0.01, "lyapunov": 2.066727384277012, "grad_norm": 0.5318034857860106, "grad_max_sv": 0.13615109845995904, "grad_min_sv": 3.475596455342761e-09, "grad_condition": 319815003.9823411, "lr": 4.7586473766990294e-05, "time_sec": 86.9201877117157 }, { "epoch": 130, "train_loss": 4.433161810302734, "train_acc": 0.04566, "test_loss": 4.664642805480957, "test_acc": 0.01, "lyapunov": 2.0571704889502365, "grad_norm": 0.6233163181376318, "grad_max_sv": 0.1495013041421771, "grad_min_sv": 3.495363523273176e-09, "grad_condition": 164232362.84179428, "lr": 4.32272711786996e-05, "time_sec": 86.9145233631134 }, { "epoch": 131, "train_loss": 4.559218102874756, "train_acc": 0.03048, "test_loss": 6.326250002288818, "test_acc": 0.01, "lyapunov": 1.9217658497183525, "grad_norm": 0.7564931295651885, "grad_max_sv": 0.2271105471998453, "grad_min_sv": 3.6081980313296123e-09, "grad_condition": 117749026.05203581, "lr": 3.906842420574966e-05, "time_sec": 86.89276170730591 }, { "epoch": 132, "train_loss": 4.559870092773438, "train_acc": 0.03412, "test_loss": 5.827829841613769, "test_acc": 0.01, "lyapunov": 2.123707967950865, "grad_norm": 0.6846614047113081, "grad_max_sv": 0.20084010064601898, "grad_min_sv": 3.3751881069101626e-09, "grad_condition": 872873152.1371578, "lr": 3.5111757055874305e-05, "time_sec": 86.91409301757812 }, { "epoch": 133, "train_loss": 4.433041811676025, "train_acc": 0.04474, "test_loss": 5.367306958007813, "test_acc": 0.01, "lyapunov": 2.0676878599254676, "grad_norm": 0.5862986449277, "grad_max_sv": 0.14338587652891874, "grad_min_sv": 3.311574372187598e-09, "grad_condition": 132479663.36386319, "lr": 3.1359005254054254e-05, "time_sec": 86.91529488563538 }, { "epoch": 134, "train_loss": 4.398417986602783, "train_acc": 0.04772, "test_loss": 4.720828105163574, "test_acc": 0.01, "lyapunov": 2.0894959808310585, "grad_norm": 0.5265195386524826, "grad_max_sv": 0.12358421217650176, "grad_min_sv": 3.3169084333317666e-09, "grad_condition": 75397884.58751842, "lr": 2.7811814881259484e-05, "time_sec": 86.98745679855347 }, { "epoch": 135, "train_loss": 4.413595640716553, "train_acc": 0.04784, "test_loss": 4.712530905151367, "test_acc": 0.01, "lyapunov": 2.1319035063009433, "grad_norm": 0.5366514710399874, "grad_max_sv": 0.12893760427832604, "grad_min_sv": 3.733237558065788e-09, "grad_condition": 129039558.48728514, "lr": 2.4471741852423218e-05, "time_sec": 86.93967342376709 }, { "epoch": 136, "train_loss": 4.405735962677002, "train_acc": 0.04902, "test_loss": 4.652213160705567, "test_acc": 0.01, "lyapunov": 2.1043942465501675, "grad_norm": 0.5842194415437647, "grad_max_sv": 0.13640696089714766, "grad_min_sv": 3.6649167473382093e-09, "grad_condition": 67841494.7867911, "lr": 2.1340251233966362e-05, "time_sec": 86.92829084396362 }, { "epoch": 137, "train_loss": 4.409075500030518, "train_acc": 0.04824, "test_loss": 4.6458401512146, "test_acc": 0.01, "lyapunov": 2.1048210426364715, "grad_norm": 0.6189485837537402, "grad_max_sv": 0.12394427489489317, "grad_min_sv": 3.56216997565717e-09, "grad_condition": 43191541.57949173, "lr": 1.8418716601170932e-05, "time_sec": 86.98851037025452 }, { "epoch": 138, "train_loss": 4.394878734741211, "train_acc": 0.05004, "test_loss": 4.742844686889648, "test_acc": 0.01, "lyapunov": 2.098401205009207, "grad_norm": 0.5053435905574138, "grad_max_sv": 0.11973771546036005, "grad_min_sv": 3.5540812636652985e-09, "grad_condition": 48597244.2583981, "lr": 1.570841943568445e-05, "time_sec": 86.94594693183899 }, { "epoch": 139, "train_loss": 4.454589398956299, "train_acc": 0.04486, "test_loss": 10.641064196777343, "test_acc": 0.01, "lyapunov": 2.0825157180771496, "grad_norm": 0.7130369910143651, "grad_max_sv": 0.14804725386202336, "grad_min_sv": 3.4161704021151706e-09, "grad_condition": 236395663.3257776, "lr": 1.3210548563419845e-05, "time_sec": 87.00129246711731 }, { "epoch": 140, "train_loss": 4.612700431671143, "train_acc": 0.02562, "test_loss": 5.085433462524414, "test_acc": 0.01, "lyapunov": 2.0142276125490817, "grad_norm": 0.8209647733278711, "grad_max_sv": 0.24317651763558387, "grad_min_sv": 3.4037354469662608e-09, "grad_condition": 190430418.85185307, "lr": 1.0926199633097203e-05, "time_sec": 86.9971239566803 }, { "epoch": 141, "train_loss": 4.487321048126221, "train_acc": 0.0448, "test_loss": 4.666201837921142, "test_acc": 0.01, "lyapunov": 2.2915835459823803, "grad_norm": 0.6559251797263009, "grad_max_sv": 0.13485133294016122, "grad_min_sv": 3.4415409784147033e-09, "grad_condition": 93528260.3989991, "lr": 8.856374635655688e-06, "time_sec": 87.03978943824768 }, { "epoch": 142, "train_loss": 4.471693329467773, "train_acc": 0.04518, "test_loss": 10.255754643249512, "test_acc": 0.01, "lyapunov": 2.178483701118118, "grad_norm": 0.8381236929202858, "grad_max_sv": 0.14980254359543324, "grad_min_sv": 3.358237557309074e-09, "grad_condition": 83488767.17166467, "lr": 7.001981464747503e-06, "time_sec": 87.01720571517944 }, { "epoch": 143, "train_loss": 4.446647290802002, "train_acc": 0.04566, "test_loss": 4.652296996307373, "test_acc": 0.01, "lyapunov": 2.1722125500974143, "grad_norm": 0.5045885772353321, "grad_max_sv": 0.11461257673799992, "grad_min_sv": 3.376102331031916e-09, "grad_condition": 69534096.19918647, "lr": 5.3638335185058295e-06, "time_sec": 86.93180632591248 }, { "epoch": 144, "train_loss": 4.493613358459473, "train_acc": 0.04666, "test_loss": 4.656233798217773, "test_acc": 0.01, "lyapunov": 2.1921363026284806, "grad_norm": 0.5273945169505434, "grad_max_sv": 0.11423748508095741, "grad_min_sv": 3.4756384994128094e-09, "grad_condition": 646405488.9879736, "lr": 3.942649342761114e-06, "time_sec": 86.91520476341248 }, { "epoch": 145, "train_loss": 4.597374949035644, "train_acc": 0.0423, "test_loss": 4.678201083374024, "test_acc": 0.01, "lyapunov": 2.2713517182318452, "grad_norm": 0.47075033695967056, "grad_max_sv": 0.12002073060721159, "grad_min_sv": 3.703222454382038e-09, "grad_condition": 39345602.26548739, "lr": 2.7390523158633524e-06, "time_sec": 86.92837643623352 }, { "epoch": 146, "train_loss": 4.794219552612304, "train_acc": 0.02986, "test_loss": 4.920618478393554, "test_acc": 0.01, "lyapunov": 2.394326541429895, "grad_norm": 0.5246817663077135, "grad_max_sv": 0.1241353990510106, "grad_min_sv": 3.777793512477895e-09, "grad_condition": 151497093.53789455, "lr": 1.7535703752478133e-06, "time_sec": 86.90443754196167 }, { "epoch": 147, "train_loss": 4.823008825378418, "train_acc": 0.02802, "test_loss": 4.705312028503418, "test_acc": 0.01, "lyapunov": 2.351406611749888, "grad_norm": 0.5821396042735293, "grad_max_sv": 0.13014851678162814, "grad_min_sv": 4.0446829205776495e-09, "grad_condition": 251708764.25831342, "lr": 9.866357858642196e-07, "time_sec": 86.91423988342285 }, { "epoch": 148, "train_loss": 4.7621851733398435, "train_acc": 0.03064, "test_loss": 4.91432806854248, "test_acc": 0.01, "lyapunov": 2.320931021209873, "grad_norm": 0.3655369703619559, "grad_max_sv": 0.13613226637244225, "grad_min_sv": 4.233843499401591e-09, "grad_condition": 37577954.13970064, "lr": 4.38584950570808e-07, "time_sec": 86.91514897346497 }, { "epoch": 149, "train_loss": 4.751388474884033, "train_acc": 0.0314, "test_loss": 4.928393530273437, "test_acc": 0.01, "lyapunov": 2.314872954507618, "grad_norm": 0.34582385046790637, "grad_max_sv": 0.13010288886725901, "grad_min_sv": 4.070593409566392e-09, "grad_condition": 116727132.6636453, "lr": 1.096582625772501e-07, "time_sec": 86.9192042350769 }, { "epoch": 150, "train_loss": 4.749187584838867, "train_acc": 0.03084, "test_loss": 4.9377007514953615, "test_acc": 0.01, "lyapunov": 2.3339363833522553, "grad_norm": 0.3438957720875417, "grad_max_sv": 0.13015102557837963, "grad_min_sv": 4.109157251269702e-09, "grad_condition": 44500021.17512281, "lr": 0.0, "time_sec": 86.93520998954773 } ], "12": [ { "epoch": 1, "train_loss": 5.079536279754639, "train_acc": 0.01882, "test_loss": 4.8872514236450195, "test_acc": 0.01, "lyapunov": 2.433271625157817, "grad_norm": 5.340808628002946, "grad_max_sv": 4.541763198375702, "grad_min_sv": 9.132611378248612e-08, "grad_condition": 60829743.69210352, "lr": 0.0009998903417374227, "time_sec": 132.14811611175537 }, { "epoch": 2, "train_loss": 4.774603317108154, "train_acc": 0.01862, "test_loss": 4.825307096862793, "test_acc": 0.0099, "lyapunov": 1.98436847062367, "grad_norm": 3.9424334574306945, "grad_max_sv": 2.8938568502198905, "grad_min_sv": 5.677021384237202e-08, "grad_condition": 58708438.134107456, "lr": 0.0009995614150494292, "time_sec": 132.15339040756226 }, { "epoch": 3, "train_loss": 4.663901504821777, "train_acc": 0.0181, "test_loss": 4.741232266235351, "test_acc": 0.0145, "lyapunov": 1.810482630949191, "grad_norm": 2.7675521449461615, "grad_max_sv": 1.8919199114665388, "grad_min_sv": 3.818708835257034e-08, "grad_condition": 54723570.14412842, "lr": 0.0009990133642141358, "time_sec": 132.11823868751526 }, { "epoch": 4, "train_loss": 4.583503988037109, "train_acc": 0.0196, "test_loss": 4.733808113098145, "test_acc": 0.0127, "lyapunov": 1.7725569412226567, "grad_norm": 1.5853399774616823, "grad_max_sv": 1.1614753112196923, "grad_min_sv": 2.5252084090432447e-08, "grad_condition": 49535418.60263091, "lr": 0.0009982464296247522, "time_sec": 132.14728569984436 }, { "epoch": 5, "train_loss": 4.5524190596008305, "train_acc": 0.0185, "test_loss": 4.749317463684082, "test_acc": 0.0192, "lyapunov": 1.7379879927086404, "grad_norm": 0.9357664119583106, "grad_max_sv": 0.623048696666956, "grad_min_sv": 9.444938395329703e-09, "grad_condition": 17454448603.577705, "lr": 0.0009972609476841367, "time_sec": 132.12196040153503 }, { "epoch": 6, "train_loss": 4.5547177754211425, "train_acc": 0.0182, "test_loss": 4.739207301330566, "test_acc": 0.01, "lyapunov": 1.7158090205448668, "grad_norm": 0.6464921766494518, "grad_max_sv": 0.4727002829313278, "grad_min_sv": 1.4752434742032504e-09, "grad_condition": 79239316890.38657, "lr": 0.000996057350657239, "time_sec": 132.20789337158203 }, { "epoch": 7, "train_loss": 4.567618137207031, "train_acc": 0.01618, "test_loss": 4.935951011657715, "test_acc": 0.01, "lyapunov": 1.6808951733362338, "grad_norm": 0.708796945528179, "grad_max_sv": 0.49447881430387497, "grad_min_sv": 6.565144610538648e-12, "grad_condition": 125853841385.85806, "lr": 0.000994636166481494, "time_sec": 132.16308617591858 }, { "epoch": 8, "train_loss": 4.5752451333618165, "train_acc": 0.01508, "test_loss": 4.654486715698242, "test_acc": 0.01, "lyapunov": 1.6649316146855464, "grad_norm": 0.516840314330209, "grad_max_sv": 0.3999390289187431, "grad_min_sv": 3.239160638355361e-12, "grad_condition": 132523175102.69946, "lr": 0.0009929980185352525, "time_sec": 132.1433699131012 }, { "epoch": 9, "train_loss": 4.584617326049805, "train_acc": 0.01304, "test_loss": 5.1370941864013675, "test_acc": 0.01, "lyapunov": 1.6745121082686403, "grad_norm": 0.4662376866434158, "grad_max_sv": 0.40068961679935455, "grad_min_sv": 1.600815539628815e-12, "grad_condition": 195211792607.34824, "lr": 0.0009911436253643444, "time_sec": 132.11373782157898 }, { "epoch": 10, "train_loss": 4.584750150451661, "train_acc": 0.01344, "test_loss": 5.014252323913574, "test_acc": 0.01, "lyapunov": 1.6392524599114342, "grad_norm": 0.44066573339421267, "grad_max_sv": 0.36354004368186, "grad_min_sv": 1.0598376590459934e-12, "grad_condition": 227681718826.60748, "lr": 0.0009890738003669028, "time_sec": 132.10810494422913 }, { "epoch": 11, "train_loss": 4.5782438153076175, "train_acc": 0.01444, "test_loss": 5.320826235198974, "test_acc": 0.01, "lyapunov": 1.6105381171111866, "grad_norm": 0.46476522396770953, "grad_max_sv": 0.384793009608984, "grad_min_sv": 2.2384307405079876e-12, "grad_condition": 181440627603.39355, "lr": 0.00098678945143658, "time_sec": 132.21521854400635 }, { "epoch": 12, "train_loss": 4.58615560546875, "train_acc": 0.0146, "test_loss": 6.162300729370117, "test_acc": 0.01, "lyapunov": 1.6162703143971047, "grad_norm": 0.4583379516120641, "grad_max_sv": 0.35209991298615934, "grad_min_sv": 2.3950308634256474e-10, "grad_condition": 199277790232.2622, "lr": 0.0009842915805643154, "time_sec": 132.06736636161804 }, { "epoch": 13, "train_loss": 4.58813276260376, "train_acc": 0.01408, "test_loss": 5.858095126342773, "test_acc": 0.01, "lyapunov": 1.6260488749769948, "grad_norm": 0.39204254749475886, "grad_max_sv": 0.3283296298235655, "grad_min_sv": 5.234225415161807e-13, "grad_condition": 249094970429.50763, "lr": 0.000981581283398829, "time_sec": 132.05243945121765 }, { "epoch": 14, "train_loss": 4.583052165374756, "train_acc": 0.01376, "test_loss": 5.763050801086425, "test_acc": 0.0129, "lyapunov": 1.6144071317389799, "grad_norm": 0.5077264967403567, "grad_max_sv": 0.4109547406435013, "grad_min_sv": 1.3599295635453275e-12, "grad_condition": 228187641587.3903, "lr": 0.0009786597487660333, "time_sec": 132.10575103759766 }, { "epoch": 15, "train_loss": 4.5714335003662105, "train_acc": 0.0158, "test_loss": 5.952970848083496, "test_acc": 0.0108, "lyapunov": 1.6084746881519132, "grad_norm": 0.4822199745251536, "grad_max_sv": 0.4148616835474968, "grad_min_sv": 1.325723769366507e-12, "grad_condition": 228332485622.18976, "lr": 0.0009755282581475766, "time_sec": 132.07877397537231 }, { "epoch": 16, "train_loss": 4.565800028839111, "train_acc": 0.0173, "test_loss": 6.017549203491211, "test_acc": 0.0137, "lyapunov": 1.6085086640189676, "grad_norm": 0.47773503355798047, "grad_max_sv": 0.37624144479632377, "grad_min_sv": 1.8790570016513782e-12, "grad_condition": 187345627300.82098, "lr": 0.0009721881851187403, "time_sec": 132.12643265724182 }, { "epoch": 17, "train_loss": 4.561137200317383, "train_acc": 0.01712, "test_loss": 5.580053092956543, "test_acc": 0.0107, "lyapunov": 1.6103480209779861, "grad_norm": 0.42330979896069637, "grad_max_sv": 0.3250656593590975, "grad_min_sv": 2.3677161192719408e-12, "grad_condition": 147724357967.11288, "lr": 0.0009686409947459456, "time_sec": 132.14898109436035 }, { "epoch": 18, "train_loss": 4.563034916381836, "train_acc": 0.0177, "test_loss": 6.472257780456543, "test_acc": 0.012, "lyapunov": 1.60859798714328, "grad_norm": 0.39753763021030414, "grad_max_sv": 0.3068309862166643, "grad_min_sv": 1.984737901050091e-12, "grad_condition": 141601417281.96045, "lr": 0.0009648882429441254, "time_sec": 132.13856673240662 }, { "epoch": 19, "train_loss": 4.573127483978271, "train_acc": 0.01616, "test_loss": 6.564729704284668, "test_acc": 0.01, "lyapunov": 1.6016948787147736, "grad_norm": 0.37413654436559074, "grad_max_sv": 0.25983951464295385, "grad_min_sv": 8.805135414126768e-13, "grad_condition": 167002019939.4643, "lr": 0.00096093157579425, "time_sec": 132.11500477790833 }, { "epoch": 20, "train_loss": 4.56939130859375, "train_acc": 0.01528, "test_loss": 5.16709538116455, "test_acc": 0.01, "lyapunov": 1.597558982841804, "grad_norm": 0.39362856256863293, "grad_max_sv": 0.2981186196208, "grad_min_sv": 1.14360007788262e-12, "grad_condition": 172580154761.56354, "lr": 0.0009567727288213001, "time_sec": 132.1002917289734 }, { "epoch": 21, "train_loss": 4.562076300048828, "train_acc": 0.01692, "test_loss": 7.266219122314453, "test_acc": 0.01, "lyapunov": 1.583339158531345, "grad_norm": 0.3838804885339558, "grad_max_sv": 0.2798105400055647, "grad_min_sv": 7.450625884139858e-13, "grad_condition": 177009367673.91373, "lr": 0.0009524135262330095, "time_sec": 132.13163590431213 }, { "epoch": 22, "train_loss": 4.559008093414307, "train_acc": 0.01742, "test_loss": 8.447665538024902, "test_acc": 0.01, "lyapunov": 1.603207119285603, "grad_norm": 0.34832863438111206, "grad_max_sv": 0.26395418867468834, "grad_min_sv": 1.4773422168547318e-12, "grad_condition": 143366348092.1024, "lr": 0.0009478558801197061, "time_sec": 132.09874486923218 }, { "epoch": 23, "train_loss": 4.567956644134521, "train_acc": 0.01592, "test_loss": 6.940740246582031, "test_acc": 0.01, "lyapunov": 1.585778128460545, "grad_norm": 0.3751847661218295, "grad_max_sv": 0.2457405323628336, "grad_min_sv": 6.231746074838346e-13, "grad_condition": 170137728056.1702, "lr": 0.000943101789615607, "time_sec": 132.0928874015808 }, { "epoch": 24, "train_loss": 4.56678815246582, "train_acc": 0.01628, "test_loss": 7.364704632568359, "test_acc": 0.01, "lyapunov": 1.5802125275287482, "grad_norm": 0.3399018458628351, "grad_max_sv": 0.2711117286235094, "grad_min_sv": 9.27439371401471e-13, "grad_condition": 170001968568.01523, "lr": 0.0009381533400219313, "time_sec": 132.12326908111572 }, { "epoch": 25, "train_loss": 4.551226531219482, "train_acc": 0.01722, "test_loss": 7.127618463134765, "test_acc": 0.01, "lyapunov": 1.5777013463437404, "grad_norm": 0.3789618085380604, "grad_max_sv": 0.2764745395630598, "grad_min_sv": 1.510240189536528e-12, "grad_condition": 150249480387.73657, "lr": 0.0009330127018922189, "time_sec": 132.14744663238525 }, { "epoch": 26, "train_loss": 4.533589083099365, "train_acc": 0.01782, "test_loss": 7.280224295043945, "test_acc": 0.01, "lyapunov": 1.5766756863850158, "grad_norm": 0.4098165679041348, "grad_max_sv": 0.32836851589381694, "grad_min_sv": 1.6846995700798532e-12, "grad_condition": 162596172663.19934, "lr": 0.000927682130080253, "time_sec": 132.10132360458374 }, { "epoch": 27, "train_loss": 4.5178348692321775, "train_acc": 0.01944, "test_loss": 4.609143519592285, "test_acc": 0.01, "lyapunov": 1.5718533059825068, "grad_norm": 0.4317006812537803, "grad_max_sv": 0.299236249551177, "grad_min_sv": 2.0935759289783253e-12, "grad_condition": 152648919866.78998, "lr": 0.0009221639627510072, "time_sec": 132.11033844947815 }, { "epoch": 28, "train_loss": 4.538441289978027, "train_acc": 0.01874, "test_loss": 5.727067053222656, "test_acc": 0.01, "lyapunov": 1.5787607407021096, "grad_norm": 0.4781702015089973, "grad_max_sv": 0.31850807219743726, "grad_min_sv": 3.363601657944103e-12, "grad_condition": 113571776097.28023, "lr": 0.0009164606203550494, "time_sec": 132.13339686393738 }, { "epoch": 29, "train_loss": 4.55489263671875, "train_acc": 0.01978, "test_loss": 6.314897917175293, "test_acc": 0.01, "lyapunov": 1.6226641564722866, "grad_norm": 0.39702511856584055, "grad_max_sv": 0.3101757925003767, "grad_min_sv": 1.643950862890769e-12, "grad_condition": 162529843580.92197, "lr": 0.0009105746045668516, "time_sec": 132.10528302192688 }, { "epoch": 30, "train_loss": 4.5577034072875975, "train_acc": 0.01934, "test_loss": 5.7611766616821285, "test_acc": 0.01, "lyapunov": 1.629781426371211, "grad_norm": 0.4775298671802556, "grad_max_sv": 0.3297189258038998, "grad_min_sv": 3.2226531698260168e-12, "grad_condition": 123880857814.76614, "lr": 0.0009045084971874733, "time_sec": 132.16758227348328 }, { "epoch": 31, "train_loss": 4.549954524230957, "train_acc": 0.01922, "test_loss": 6.9685128242492675, "test_acc": 0.01, "lyapunov": 1.6153524620148836, "grad_norm": 0.39506087923244415, "grad_max_sv": 0.305246427282691, "grad_min_sv": 2.963371775308759e-12, "grad_condition": 116809738976.30655, "lr": 0.0008982649590120977, "time_sec": 132.1613085269928 }, { "epoch": 32, "train_loss": 4.541183842926025, "train_acc": 0.02124, "test_loss": 6.829874574279785, "test_acc": 0.01, "lyapunov": 1.6133781327006151, "grad_norm": 0.38947657187455065, "grad_max_sv": 0.2715518455952406, "grad_min_sv": 2.244930278252747e-12, "grad_condition": 123331380509.9804, "lr": 0.0008918467286629196, "time_sec": 132.16536712646484 }, { "epoch": 33, "train_loss": 4.53525604888916, "train_acc": 0.02098, "test_loss": 6.518293627166748, "test_acc": 0.01, "lyapunov": 1.6150689750071376, "grad_norm": 0.42014951113026694, "grad_max_sv": 0.2435957606881857, "grad_min_sv": 2.048687606811065e-12, "grad_condition": 116665598250.77344, "lr": 0.0008852566213878943, "time_sec": 132.09782457351685 }, { "epoch": 34, "train_loss": 4.5325355252075195, "train_acc": 0.01958, "test_loss": 6.317331722259522, "test_acc": 0.01, "lyapunov": 1.5877615957308913, "grad_norm": 0.3361598121090629, "grad_max_sv": 0.2522958844900131, "grad_min_sv": 3.651040784603148e-12, "grad_condition": 86623505850.41478, "lr": 0.000878497527825878, "time_sec": 132.10610961914062 }, { "epoch": 35, "train_loss": 4.536015074005127, "train_acc": 0.01868, "test_loss": 6.3701594413757325, "test_acc": 0.01, "lyapunov": 1.5917383560439204, "grad_norm": 0.34920551391182975, "grad_max_sv": 0.23412882573902608, "grad_min_sv": 2.182336791137283e-12, "grad_condition": 102971407638.13591, "lr": 0.000871572412738697, "time_sec": 132.09818148612976 }, { "epoch": 36, "train_loss": 4.530319141998291, "train_acc": 0.0189, "test_loss": 6.076102793121338, "test_acc": 0.01, "lyapunov": 1.6073461313686712, "grad_norm": 0.3121785959415577, "grad_max_sv": 0.2200178649276495, "grad_min_sv": 3.2766681152194533e-12, "grad_condition": 85204262775.15216, "lr": 0.0008644843137107055, "time_sec": 132.1121485233307 }, { "epoch": 37, "train_loss": 4.530366974945069, "train_acc": 0.02034, "test_loss": 5.606327301025391, "test_acc": 0.01, "lyapunov": 1.6122757229963531, "grad_norm": 0.3191242103818429, "grad_max_sv": 0.20528502985835076, "grad_min_sv": 1.8868968590479396e-12, "grad_condition": 90563087741.60693, "lr": 0.0008572363398164014, "time_sec": 132.1431803703308 }, { "epoch": 38, "train_loss": 4.531652006530762, "train_acc": 0.0181, "test_loss": 6.281176449584961, "test_acc": 0.01, "lyapunov": 1.5978836668726732, "grad_norm": 0.3226311590239451, "grad_max_sv": 0.18021098636090754, "grad_min_sv": 1.3471604261713563e-12, "grad_condition": 97967821962.4504, "lr": 0.0008498316702566826, "time_sec": 132.1808111667633 }, { "epoch": 39, "train_loss": 4.515576623077393, "train_acc": 0.02002, "test_loss": 7.3591477447509765, "test_acc": 0.01, "lyapunov": 1.595075506688384, "grad_norm": 0.29392491905513246, "grad_max_sv": 0.175280692987144, "grad_min_sv": 1.3060439555812542e-12, "grad_condition": 99096247746.24886, "lr": 0.0008422735529643442, "time_sec": 132.13058257102966 }, { "epoch": 40, "train_loss": 4.508498954620362, "train_acc": 0.02058, "test_loss": 5.166109811401367, "test_acc": 0.01, "lyapunov": 1.592364840190429, "grad_norm": 0.31050287296978984, "grad_max_sv": 0.18211948983371257, "grad_min_sv": 2.1916040644331514e-12, "grad_condition": 89426467797.39761, "lr": 0.0008345653031794289, "time_sec": 132.1956102848053 }, { "epoch": 41, "train_loss": 4.594321117401123, "train_acc": 0.01546, "test_loss": 7.777395164489746, "test_acc": 0.01, "lyapunov": 1.6293273725168174, "grad_norm": 1.0042516112855135, "grad_max_sv": 0.14036097445059567, "grad_min_sv": 2.5427231651336982e-11, "grad_condition": 81054501201.00836, "lr": 0.0008267103019950526, "time_sec": 132.13326239585876 }, { "epoch": 42, "train_loss": 4.569071527404785, "train_acc": 0.01844, "test_loss": 7.213038313293457, "test_acc": 0.01, "lyapunov": 1.6979200718043101, "grad_norm": 0.26172862173554357, "grad_max_sv": 0.16976843364536762, "grad_min_sv": 1.3973847074078634e-12, "grad_condition": 86625374599.54195, "lr": 0.0008187119948743447, "time_sec": 132.11792135238647 }, { "epoch": 43, "train_loss": 4.558605685272217, "train_acc": 0.01936, "test_loss": 7.291248056030273, "test_acc": 0.01, "lyapunov": 1.6884295074531184, "grad_norm": 0.28281726127535384, "grad_max_sv": 0.16570937782526016, "grad_min_sv": 1.422441962513273e-12, "grad_condition": 88001604691.41785, "lr": 0.000810573890139155, "time_sec": 132.1009702682495 }, { "epoch": 44, "train_loss": 4.560630667114258, "train_acc": 0.01868, "test_loss": 7.16728485031128, "test_acc": 0.01, "lyapunov": 1.686604334875141, "grad_norm": 0.28505793697030324, "grad_max_sv": 0.15897216144949197, "grad_min_sv": 1.4942365308149637e-12, "grad_condition": 86276532282.80447, "lr": 0.0008022995574311873, "time_sec": 132.1154272556305 }, { "epoch": 45, "train_loss": 4.5725548426818845, "train_acc": 0.0188, "test_loss": 7.126261402893066, "test_acc": 0.01, "lyapunov": 1.686247174087388, "grad_norm": 0.235009326711948, "grad_max_sv": 0.15716111175715924, "grad_min_sv": 7.169276878089038e-13, "grad_condition": 108521610164.79031, "lr": 0.0007938926261462363, "time_sec": 132.11932492256165 }, { "epoch": 46, "train_loss": 4.583313959960938, "train_acc": 0.0172, "test_loss": 5.289773531341552, "test_acc": 0.01, "lyapunov": 1.698270396198458, "grad_norm": 0.313539150382163, "grad_max_sv": 0.16240414716303347, "grad_min_sv": 6.375463347288685e-13, "grad_condition": 111380569067.90488, "lr": 0.0007853567838422158, "time_sec": 132.14860010147095 }, { "epoch": 47, "train_loss": 4.578197394866943, "train_acc": 0.01782, "test_loss": 6.591432273864746, "test_acc": 0.01, "lyapunov": 1.6831631639119609, "grad_norm": 0.2604809257680144, "grad_max_sv": 0.15823213588446378, "grad_min_sv": 1.3005127228431431e-12, "grad_condition": 88272206869.29628, "lr": 0.0007766957746216719, "time_sec": 132.12520599365234 }, { "epoch": 48, "train_loss": 4.578674370269775, "train_acc": 0.01816, "test_loss": 5.157715400695801, "test_acc": 0.01, "lyapunov": 1.6778625536452778, "grad_norm": 0.36451993025813884, "grad_max_sv": 0.16272996473126114, "grad_min_sv": 2.5139523132342427e-12, "grad_condition": 93980395518.9741, "lr": 0.0007679133974894982, "time_sec": 132.10149908065796 }, { "epoch": 49, "train_loss": 4.558167927093506, "train_acc": 0.0207, "test_loss": 5.5524071670532225, "test_acc": 0.01, "lyapunov": 1.654131231710429, "grad_norm": 0.26398153340032604, "grad_max_sv": 0.15602914486080408, "grad_min_sv": 8.142784605144219e-11, "grad_condition": 49953288517.76509, "lr": 0.000759013504686565, "time_sec": 132.14293909072876 }, { "epoch": 50, "train_loss": 4.556328114318847, "train_acc": 0.02032, "test_loss": 5.053372247314453, "test_acc": 0.01, "lyapunov": 1.658374283319849, "grad_norm": 0.24338078400550828, "grad_max_sv": 0.1512946780771017, "grad_min_sv": 2.964903017923289e-12, "grad_condition": 67110635284.64429, "lr": 0.0007499999999999998, "time_sec": 132.1664924621582 }, { "epoch": 51, "train_loss": 4.570141744995118, "train_acc": 0.01988, "test_loss": 5.131472052001953, "test_acc": 0.01, "lyapunov": 1.6845884472512833, "grad_norm": 0.2817728093100986, "grad_max_sv": 0.13915783632546663, "grad_min_sv": 1.7209330912965342e-12, "grad_condition": 70074791169.44548, "lr": 0.0007408768370508575, "time_sec": 132.25617241859436 }, { "epoch": 52, "train_loss": 4.574759218902588, "train_acc": 0.01936, "test_loss": 5.048821273803711, "test_acc": 0.01, "lyapunov": 1.6568556862414037, "grad_norm": 0.2134662683751272, "grad_max_sv": 0.13759722150862216, "grad_min_sv": 1.421003107907492e-12, "grad_condition": 75951660314.10495, "lr": 0.0007316480175599307, "time_sec": 132.24415564537048 }, { "epoch": 53, "train_loss": 4.578046445617676, "train_acc": 0.01878, "test_loss": 5.305573741149902, "test_acc": 0.01, "lyapunov": 1.6395436802788463, "grad_norm": 0.20939237447265202, "grad_max_sv": 0.13288239240646363, "grad_min_sv": 8.329158668790625e-13, "grad_condition": 89438685434.2227, "lr": 0.0007223175895924635, "time_sec": 132.20375537872314 }, { "epoch": 54, "train_loss": 4.581330629272461, "train_acc": 0.0165, "test_loss": 5.532207501983643, "test_acc": 0.01, "lyapunov": 1.6444858135774618, "grad_norm": 0.2762560677540659, "grad_max_sv": 0.12445617569610476, "grad_min_sv": 3.912145951191304e-12, "grad_condition": 83557962455.66768, "lr": 0.0007128896457825361, "time_sec": 132.15107369422913 }, { "epoch": 55, "train_loss": 4.581049518737793, "train_acc": 0.01652, "test_loss": 5.197387743377686, "test_acc": 0.01, "lyapunov": 1.6384336021550172, "grad_norm": 0.23390564725407778, "grad_max_sv": 0.1323490994051099, "grad_min_sv": 6.793781517885129e-13, "grad_condition": 88731637332.26297, "lr": 0.0007033683215378998, "time_sec": 132.17300724983215 }, { "epoch": 56, "train_loss": 4.584884506378174, "train_acc": 0.01634, "test_loss": 6.454191752624512, "test_acc": 0.01, "lyapunov": 1.6743981499806084, "grad_norm": 0.25387218343472684, "grad_max_sv": 0.13131952080875636, "grad_min_sv": 5.318952729656952e-13, "grad_condition": 95324952785.9041, "lr": 0.0006937577932260512, "time_sec": 132.16189765930176 }, { "epoch": 57, "train_loss": 4.586065352630615, "train_acc": 0.01452, "test_loss": 6.120808155822754, "test_acc": 0.01, "lyapunov": 1.635638156815258, "grad_norm": 0.19075779973568727, "grad_max_sv": 0.10836047828197479, "grad_min_sv": 3.0117655839699465e-13, "grad_condition": 89022659140.15048, "lr": 0.0006840622763423388, "time_sec": 132.1572346687317 }, { "epoch": 58, "train_loss": 4.587811795196533, "train_acc": 0.01474, "test_loss": 5.800351502990723, "test_acc": 0.01, "lyapunov": 1.6200943285851832, "grad_norm": 0.23045480693280587, "grad_max_sv": 0.10783510617911815, "grad_min_sv": 1.62684212425452e-13, "grad_condition": 94564165099.07333, "lr": 0.0006742860236609073, "time_sec": 132.15808749198914 }, { "epoch": 59, "train_loss": 4.591301085662842, "train_acc": 0.01376, "test_loss": 5.996090186309814, "test_acc": 0.01, "lyapunov": 1.6170085330143609, "grad_norm": 0.1857451149070646, "grad_max_sv": 0.10361974723637105, "grad_min_sv": 1.6122890156067053e-13, "grad_condition": 91694547176.55017, "lr": 0.0006644333233692913, "time_sec": 132.1711368560791 }, { "epoch": 60, "train_loss": 4.585452033386231, "train_acc": 0.01522, "test_loss": 5.83253670501709, "test_acc": 0.01, "lyapunov": 1.6162819191622917, "grad_norm": 0.27013125926112547, "grad_max_sv": 0.10345460344105958, "grad_min_sv": 2.5520667445480586e-13, "grad_condition": 86471116288.19133, "lr": 0.0006545084971874734, "time_sec": 132.12959480285645 }, { "epoch": 61, "train_loss": 4.575745923614502, "train_acc": 0.01574, "test_loss": 5.912968054962159, "test_acc": 0.01, "lyapunov": 1.6168097483227626, "grad_norm": 0.19203323317006551, "grad_max_sv": 0.1045845141634345, "grad_min_sv": 2.8391874312669906e-13, "grad_condition": 84748109291.00053, "lr": 0.0006445158984722354, "time_sec": 132.1811854839325 }, { "epoch": 62, "train_loss": 4.581840614318848, "train_acc": 0.01504, "test_loss": 5.784942044067383, "test_acc": 0.01, "lyapunov": 1.6041824201793622, "grad_norm": 0.18322487540118004, "grad_max_sv": 0.11089323591440917, "grad_min_sv": 2.605932741312656e-13, "grad_condition": 91338998422.90005, "lr": 0.0006344599103076324, "time_sec": 132.1614978313446 }, { "epoch": 63, "train_loss": 4.60023887878418, "train_acc": 0.01528, "test_loss": 5.64439457244873, "test_acc": 0.01, "lyapunov": 1.6233063558178484, "grad_norm": 0.2113660918385516, "grad_max_sv": 0.10892452355474233, "grad_min_sv": 2.537344721436935e-13, "grad_condition": 90408295734.5693, "lr": 0.0006243449435824269, "time_sec": 132.14256119728088 }, { "epoch": 64, "train_loss": 4.589049236907959, "train_acc": 0.01542, "test_loss": 5.874572355651855, "test_acc": 0.01, "lyapunov": 1.6047841283061621, "grad_norm": 0.18184052006950477, "grad_max_sv": 0.10828140377998352, "grad_min_sv": 2.791036279353835e-13, "grad_condition": 88102791154.87807, "lr": 0.0006141754350553275, "time_sec": 132.15559458732605 }, { "epoch": 65, "train_loss": 4.5660726802062985, "train_acc": 0.01638, "test_loss": 5.8140344772338866, "test_acc": 0.01, "lyapunov": 1.5915922386871884, "grad_norm": 0.19423334716784915, "grad_max_sv": 0.10693365205079317, "grad_min_sv": 3.330885965231205e-13, "grad_condition": 83112992316.30193, "lr": 0.0006039558454088793, "time_sec": 132.18004989624023 }, { "epoch": 66, "train_loss": 4.580396204833985, "train_acc": 0.01542, "test_loss": 5.797694694519043, "test_acc": 0.01, "lyapunov": 1.5965009342374095, "grad_norm": 0.2125232867000169, "grad_max_sv": 0.10570351034402847, "grad_min_sv": 2.978146282169481e-13, "grad_condition": 85693424811.33855, "lr": 0.000593690657292862, "time_sec": 132.2843222618103 }, { "epoch": 67, "train_loss": 4.573282337646484, "train_acc": 0.01564, "test_loss": 5.954542552185059, "test_acc": 0.01, "lyapunov": 1.601048025938556, "grad_norm": 0.18603658324598782, "grad_max_sv": 0.10089892633259297, "grad_min_sv": 3.469332375289147e-13, "grad_condition": 80778127108.38254, "lr": 0.0005833843733580507, "time_sec": 132.31548929214478 }, { "epoch": 68, "train_loss": 4.571360148773193, "train_acc": 0.0161, "test_loss": 5.669797957611084, "test_acc": 0.01, "lyapunov": 1.5947835719798837, "grad_norm": 0.20014910112057685, "grad_max_sv": 0.105499835498631, "grad_min_sv": 9.770913933804e-13, "grad_condition": 66387740803.896385, "lr": 0.0005730415142812054, "time_sec": 132.14850521087646 }, { "epoch": 69, "train_loss": 4.578122979125976, "train_acc": 0.01662, "test_loss": 6.221010691070557, "test_acc": 0.01, "lyapunov": 1.6033955156955573, "grad_norm": 0.30693039018142426, "grad_max_sv": 0.11157863736152648, "grad_min_sv": 8.756002305516403e-13, "grad_condition": 80609250127.91284, "lr": 0.0005626666167821517, "time_sec": 132.37923741340637 }, { "epoch": 70, "train_loss": 4.565648191833496, "train_acc": 0.01792, "test_loss": 5.099743925476075, "test_acc": 0.01, "lyapunov": 1.6167474094864047, "grad_norm": 0.22355495861014546, "grad_max_sv": 0.1181858729571104, "grad_min_sv": 4.5336824184788683e-13, "grad_condition": 88479511676.05211, "lr": 0.0005522642316338265, "time_sec": 132.16482520103455 }, { "epoch": 71, "train_loss": 4.5823839192199705, "train_acc": 0.01686, "test_loss": 5.610829375457763, "test_acc": 0.01, "lyapunov": 1.640915547795308, "grad_norm": 0.21533848262037789, "grad_max_sv": 0.10482716094702482, "grad_min_sv": 2.352225111137488e-13, "grad_condition": 88706026678.10991, "lr": 0.0005418389216661573, "time_sec": 132.1553201675415 }, { "epoch": 72, "train_loss": 4.586939775238037, "train_acc": 0.01644, "test_loss": 5.6766823959350585, "test_acc": 0.01, "lyapunov": 1.6386277257938824, "grad_norm": 0.21193209754597628, "grad_max_sv": 0.09875305313616992, "grad_min_sv": 3.8445128177488697e-13, "grad_condition": 80890057907.66025, "lr": 0.0005313952597646563, "time_sec": 132.1702263355255 }, { "epoch": 73, "train_loss": 4.565450923156738, "train_acc": 0.01786, "test_loss": 5.090951374053955, "test_acc": 0.01, "lyapunov": 1.5904299654924046, "grad_norm": 0.19354037031175023, "grad_max_sv": 0.10569104105234146, "grad_min_sv": 4.874789243593624e-13, "grad_condition": 80729120343.229, "lr": 0.0005209378268645994, "time_sec": 132.16868782043457 }, { "epoch": 74, "train_loss": 4.5504186448669435, "train_acc": 0.0181, "test_loss": 5.612113465881348, "test_acc": 0.01, "lyapunov": 1.5932684325806015, "grad_norm": 0.2020325382395806, "grad_max_sv": 0.1039424953982234, "grad_min_sv": 1.1594278629870026e-12, "grad_condition": 62545889757.239746, "lr": 0.0005104712099416781, "time_sec": 132.14726519584656 }, { "epoch": 75, "train_loss": 4.5482193190002445, "train_acc": 0.01858, "test_loss": 6.069068190002441, "test_acc": 0.01, "lyapunov": 1.604267351767596, "grad_norm": 0.2266064763923867, "grad_max_sv": 0.11460568010807037, "grad_min_sv": 1.7911878418656585e-12, "grad_condition": 63236708994.86294, "lr": 0.0004999999999999996, "time_sec": 132.14808058738708 }, { "epoch": 76, "train_loss": 4.547421706695556, "train_acc": 0.01796, "test_loss": 5.810434713745117, "test_acc": 0.01, "lyapunov": 1.6127760651166483, "grad_norm": 0.21661099340887846, "grad_max_sv": 0.11015285402536393, "grad_min_sv": 1.6610576221168998e-12, "grad_condition": 56473316901.58356, "lr": 0.0004895287900583212, "time_sec": 132.38169169425964 }, { "epoch": 77, "train_loss": 4.5509974664306645, "train_acc": 0.02, "test_loss": 5.662685046386719, "test_acc": 0.01, "lyapunov": 1.6085883635084341, "grad_norm": 0.22829542556288998, "grad_max_sv": 0.11323911305516958, "grad_min_sv": 1.2826856675589158e-12, "grad_condition": 59045967769.00034, "lr": 0.0004790621731353997, "time_sec": 132.19757294654846 }, { "epoch": 78, "train_loss": 4.551352957153321, "train_acc": 0.01882, "test_loss": 5.566857955932617, "test_acc": 0.01, "lyapunov": 1.6337723820410726, "grad_norm": 0.25602140985448185, "grad_max_sv": 0.11203370597213506, "grad_min_sv": 1.3258904637988123e-12, "grad_condition": 62071250445.38745, "lr": 0.000468604740235343, "time_sec": 132.21045851707458 }, { "epoch": 79, "train_loss": 4.545634266510009, "train_acc": 0.01956, "test_loss": 5.292388404846191, "test_acc": 0.01, "lyapunov": 1.633863453365043, "grad_norm": 0.261991339098316, "grad_max_sv": 0.11294185262013343, "grad_min_sv": 2.2926638646691538e-12, "grad_condition": 57437613489.9528, "lr": 0.00045816107833384175, "time_sec": 132.16106390953064 }, { "epoch": 80, "train_loss": 4.544438370513916, "train_acc": 0.02008, "test_loss": 5.594520863342285, "test_acc": 0.01, "lyapunov": 1.6360818525714338, "grad_norm": 0.27680249132769946, "grad_max_sv": 0.12154058534651994, "grad_min_sv": 4.6932727855827e-12, "grad_condition": 38848618049.80592, "lr": 0.0004477357683661729, "time_sec": 132.17013382911682 }, { "epoch": 81, "train_loss": 4.539229464416504, "train_acc": 0.02094, "test_loss": 5.203748289489746, "test_acc": 0.01, "lyapunov": 1.6401681241476933, "grad_norm": 0.2346300301923333, "grad_max_sv": 0.11762278378009797, "grad_min_sv": 4.245260345659918e-12, "grad_condition": 45140986862.910706, "lr": 0.00043733338321784746, "time_sec": 132.1922423839569 }, { "epoch": 82, "train_loss": 4.511806388244629, "train_acc": 0.02256, "test_loss": 5.1750801635742185, "test_acc": 0.01, "lyapunov": 1.6131305651896446, "grad_norm": 0.21894630317091804, "grad_max_sv": 0.11400092151015997, "grad_min_sv": 1.204121461777062e-11, "grad_condition": 37883001192.43938, "lr": 0.0004269584857187939, "time_sec": 132.2294306755066 }, { "epoch": 83, "train_loss": 4.560598617706299, "train_acc": 0.01922, "test_loss": 5.039254272460938, "test_acc": 0.01, "lyapunov": 1.6179730105583014, "grad_norm": 0.6818929560069714, "grad_max_sv": 0.10932031758129597, "grad_min_sv": 3.5758800721917905e-11, "grad_condition": 41961243110.78183, "lr": 0.0004166156266419484, "time_sec": 132.16398668289185 }, { "epoch": 84, "train_loss": 4.538027311553955, "train_acc": 0.02012, "test_loss": 5.358105621337891, "test_acc": 0.01, "lyapunov": 1.630713469841901, "grad_norm": 0.23515180969917246, "grad_max_sv": 0.11126796789467334, "grad_min_sv": 3.733440409242942e-12, "grad_condition": 42021389131.16902, "lr": 0.0004063093427071373, "time_sec": 132.17217254638672 }, { "epoch": 85, "train_loss": 4.533066810150147, "train_acc": 0.02142, "test_loss": 5.210582428741455, "test_acc": 0.01, "lyapunov": 1.6099314771954665, "grad_norm": 0.23743119261123188, "grad_max_sv": 0.11509178727865219, "grad_min_sv": 9.24621530124588e-12, "grad_condition": 33409415784.932446, "lr": 0.0003960441545911199, "time_sec": 132.18297863006592 }, { "epoch": 86, "train_loss": 4.514812325439453, "train_acc": 0.02338, "test_loss": 5.010178847503662, "test_acc": 0.01, "lyapunov": 1.5926586319418514, "grad_norm": 0.2162543490750504, "grad_max_sv": 0.1109484301880002, "grad_min_sv": 4.5705949216622454e-10, "grad_condition": 11504727044.022625, "lr": 0.0003858245649446718, "time_sec": 132.147221326828 }, { "epoch": 87, "train_loss": 4.511024246826172, "train_acc": 0.022, "test_loss": 5.345004454040527, "test_acc": 0.01, "lyapunov": 1.5887958646735267, "grad_norm": 0.25657197110027863, "grad_max_sv": 0.1051843574270606, "grad_min_sv": 1.705161448824656e-10, "grad_condition": 25039598073.63558, "lr": 0.00037565505641757235, "time_sec": 132.14885830879211 }, { "epoch": 88, "train_loss": 4.505899262237548, "train_acc": 0.02334, "test_loss": 4.936904384613037, "test_acc": 0.01, "lyapunov": 1.6046001039197684, "grad_norm": 0.24194115234056338, "grad_max_sv": 0.11062774620950222, "grad_min_sv": 8.66749245303117e-11, "grad_condition": 18998356971.070953, "lr": 0.00036554008969236695, "time_sec": 132.13108325004578 }, { "epoch": 89, "train_loss": 4.509913777923584, "train_acc": 0.02288, "test_loss": 4.863644284057617, "test_acc": 0.01, "lyapunov": 1.6005188049867636, "grad_norm": 0.2399799817677917, "grad_max_sv": 0.10860499612490457, "grad_min_sv": 6.798252102655834e-11, "grad_condition": 18908436070.961212, "lr": 0.0003554841015277638, "time_sec": 132.194641828537 }, { "epoch": 90, "train_loss": 4.537508490905762, "train_acc": 0.02064, "test_loss": 5.445182901763916, "test_acc": 0.01, "lyapunov": 1.5926521418954405, "grad_norm": 0.1984924919711564, "grad_max_sv": 0.1050485922023654, "grad_min_sv": 7.577653377773176e-12, "grad_condition": 30774293544.0844, "lr": 0.000345491502812526, "time_sec": 132.17840719223022 }, { "epoch": 91, "train_loss": 4.521757569274902, "train_acc": 0.02238, "test_loss": 5.262060061645508, "test_acc": 0.01, "lyapunov": 1.5892650910350672, "grad_norm": 0.2847263318092328, "grad_max_sv": 0.10287641081959009, "grad_min_sv": 1.91736922530795e-10, "grad_condition": 18967974102.564293, "lr": 0.0003355666766307081, "time_sec": 132.18149828910828 }, { "epoch": 92, "train_loss": 4.519360184631347, "train_acc": 0.02082, "test_loss": 5.320795262908936, "test_acc": 0.01, "lyapunov": 1.5871959750914513, "grad_norm": 0.2370639034610865, "grad_max_sv": 0.10874731410294772, "grad_min_sv": 7.319739596956258e-12, "grad_condition": 27639015872.358166, "lr": 0.00032571397633909225, "time_sec": 132.22724723815918 }, { "epoch": 93, "train_loss": 4.512343827972412, "train_acc": 0.022, "test_loss": 5.345669583129883, "test_acc": 0.01, "lyapunov": 1.5883484478191952, "grad_norm": 0.23157908229447258, "grad_max_sv": 0.10562088992446661, "grad_min_sv": 1.2009558277386558e-11, "grad_condition": 16084905305.476273, "lr": 0.00031593772365766094, "time_sec": 132.24062776565552 }, { "epoch": 94, "train_loss": 4.507626133422852, "train_acc": 0.02282, "test_loss": 5.232546983337403, "test_acc": 0.01, "lyapunov": 1.582219293355332, "grad_norm": 0.25414870293495084, "grad_max_sv": 0.10162105709314347, "grad_min_sv": 1.5387781568668625e-11, "grad_condition": 19577209942.564514, "lr": 0.0003062422067739483, "time_sec": 132.21938920021057 }, { "epoch": 95, "train_loss": 4.5046430790710446, "train_acc": 0.02322, "test_loss": 5.702656979370118, "test_acc": 0.01, "lyapunov": 1.5933423502670834, "grad_norm": 0.22296672954904517, "grad_max_sv": 0.10369365382939577, "grad_min_sv": 1.464815680454453e-11, "grad_condition": 19604050143.141273, "lr": 0.00029663167846209965, "time_sec": 132.21640634536743 }, { "epoch": 96, "train_loss": 4.50480010559082, "train_acc": 0.02282, "test_loss": 5.597961514282226, "test_acc": 0.01, "lyapunov": 1.583764209771705, "grad_norm": 0.25490663774480726, "grad_max_sv": 0.10260288586723618, "grad_min_sv": 1.5525958737926244e-11, "grad_condition": 16728424588.234934, "lr": 0.00028711035421746345, "time_sec": 132.1660978794098 }, { "epoch": 97, "train_loss": 4.469037200622559, "train_acc": 0.02894, "test_loss": 5.864905759429932, "test_acc": 0.01, "lyapunov": 1.5917478577255288, "grad_norm": 0.23870917284644627, "grad_max_sv": 0.12171203531324863, "grad_min_sv": 1.4733043387116664e-09, "grad_condition": 1570381038.4230928, "lr": 0.00027768241040753615, "time_sec": 132.178719997406 }, { "epoch": 98, "train_loss": 4.470558769683838, "train_acc": 0.02786, "test_loss": 6.108024346923828, "test_acc": 0.01, "lyapunov": 1.5934783141021533, "grad_norm": 0.30827407557184827, "grad_max_sv": 0.12690354958176614, "grad_min_sv": 1.3345814640474545e-09, "grad_condition": 2937579113.826585, "lr": 0.00026835198244006903, "time_sec": 132.1512405872345 }, { "epoch": 99, "train_loss": 4.484580178527832, "train_acc": 0.02542, "test_loss": 5.846526190185547, "test_acc": 0.01, "lyapunov": 1.5788978844347512, "grad_norm": 0.221869552528174, "grad_max_sv": 0.11516296844929456, "grad_min_sv": 6.437623919727277e-10, "grad_condition": 3127665808.238943, "lr": 0.0002591231629491421, "time_sec": 132.13360047340393 }, { "epoch": 100, "train_loss": 4.483458242340088, "train_acc": 0.0259, "test_loss": 5.841338038635254, "test_acc": 0.01, "lyapunov": 1.5934071232900595, "grad_norm": 0.27882300961773687, "grad_max_sv": 0.11602762639522553, "grad_min_sv": 7.004058964700434e-10, "grad_condition": 3782223950.51213, "lr": 0.0002499999999999997, "time_sec": 132.2558717727661 }, { "epoch": 101, "train_loss": 4.499455378265381, "train_acc": 0.02344, "test_loss": 5.443247247314453, "test_acc": 0.01, "lyapunov": 1.5859141483941042, "grad_norm": 0.25072615175177326, "grad_max_sv": 0.11183246672153473, "grad_min_sv": 1.6060449399156376e-10, "grad_condition": 6795488555.526062, "lr": 0.00024098649531343477, "time_sec": 132.28790807724 }, { "epoch": 102, "train_loss": 4.49708987487793, "train_acc": 0.02284, "test_loss": 5.607777552032471, "test_acc": 0.01, "lyapunov": 1.5908644315226914, "grad_norm": 0.22348474047746483, "grad_max_sv": 0.11046325713396073, "grad_min_sv": 3.8719351463923063e-10, "grad_condition": 6001916881.77612, "lr": 0.0002320866025105016, "time_sec": 132.18588161468506 }, { "epoch": 103, "train_loss": 4.4955732382202145, "train_acc": 0.0236, "test_loss": 5.745177990722656, "test_acc": 0.01, "lyapunov": 1.5917734240022157, "grad_norm": 0.2534263836701249, "grad_max_sv": 0.110052939504385, "grad_min_sv": 2.750547882733342e-10, "grad_condition": 9464587786.428852, "lr": 0.0002233042253783278, "time_sec": 132.16262555122375 }, { "epoch": 104, "train_loss": 4.501874127349853, "train_acc": 0.02266, "test_loss": 5.61523842163086, "test_acc": 0.01, "lyapunov": 1.58528883255961, "grad_norm": 0.27420737869929585, "grad_max_sv": 0.10906471610069275, "grad_min_sv": 2.0978145145694022e-10, "grad_condition": 9953736672.96781, "lr": 0.000214643216157784, "time_sec": 132.20356059074402 }, { "epoch": 105, "train_loss": 4.527709134521484, "train_acc": 0.02124, "test_loss": 5.809187103271484, "test_acc": 0.01, "lyapunov": 1.5925516539522449, "grad_norm": 0.23170044660415676, "grad_max_sv": 0.1055134791880846, "grad_min_sv": 7.825866377728172e-11, "grad_condition": 26017131256.645947, "lr": 0.00020610737385376332, "time_sec": 132.20340204238892 }, { "epoch": 106, "train_loss": 4.538254840545655, "train_acc": 0.02052, "test_loss": 5.702211804962158, "test_acc": 0.01, "lyapunov": 1.5994793835198482, "grad_norm": 0.22739631788820852, "grad_max_sv": 0.10190589521080255, "grad_min_sv": 2.392879430639463e-12, "grad_condition": 41858905566.539444, "lr": 0.00019770044256881242, "time_sec": 132.2257125377655 }, { "epoch": 107, "train_loss": 4.537451904602051, "train_acc": 0.01914, "test_loss": 5.932393156433106, "test_acc": 0.01, "lyapunov": 1.5854461083326803, "grad_norm": 0.21156136855576158, "grad_max_sv": 0.09718370195478201, "grad_min_sv": 2.1334573155528867e-12, "grad_condition": 44438773786.1716, "lr": 0.0001894261098608447, "time_sec": 132.20696210861206 }, { "epoch": 108, "train_loss": 4.54288639175415, "train_acc": 0.01946, "test_loss": 6.020662310791016, "test_acc": 0.01, "lyapunov": 1.5982869247646283, "grad_norm": 0.22336362248783215, "grad_max_sv": 0.0942000387236476, "grad_min_sv": 2.070612785490142e-12, "grad_condition": 38681493255.63291, "lr": 0.000181288005125655, "time_sec": 132.15775275230408 }, { "epoch": 109, "train_loss": 4.539118989257813, "train_acc": 0.02004, "test_loss": 5.875737568664551, "test_acc": 0.01, "lyapunov": 1.597143233889509, "grad_norm": 0.24209283453668126, "grad_max_sv": 0.09231847468599881, "grad_min_sv": 2.4290148967334254e-12, "grad_condition": 41122755985.59834, "lr": 0.0001732896980049473, "time_sec": 132.2014491558075 }, { "epoch": 110, "train_loss": 4.533240603179932, "train_acc": 0.02078, "test_loss": 6.020731507873535, "test_acc": 0.01, "lyapunov": 1.5895807243064237, "grad_norm": 0.24031990384630442, "grad_max_sv": 0.09458559956401587, "grad_min_sv": 4.9697159162748165e-12, "grad_condition": 34976084384.10825, "lr": 0.00016543469682057076, "time_sec": 132.15150785446167 }, { "epoch": 111, "train_loss": 4.518356960906982, "train_acc": 0.02294, "test_loss": 5.969912101745606, "test_acc": 0.01, "lyapunov": 1.604492220122491, "grad_norm": 0.22602265116800407, "grad_max_sv": 0.09987993091344834, "grad_min_sv": 2.419991108871221e-10, "grad_condition": 19549830485.2588, "lr": 0.00015772644703565552, "time_sec": 132.23562288284302 }, { "epoch": 112, "train_loss": 4.52961797088623, "train_acc": 0.02194, "test_loss": 5.610896324157715, "test_acc": 0.01, "lyapunov": 1.6014201195953448, "grad_norm": 0.24431543872984524, "grad_max_sv": 0.09510019868612289, "grad_min_sv": 1.6583184662959947e-11, "grad_condition": 24172749617.446175, "lr": 0.00015016832974331713, "time_sec": 132.2202250957489 }, { "epoch": 113, "train_loss": 4.534737938232422, "train_acc": 0.02108, "test_loss": 5.882650997924805, "test_acc": 0.01, "lyapunov": 1.6089779333690244, "grad_norm": 0.2408463440419859, "grad_max_sv": 0.09545416701585055, "grad_min_sv": 8.265506817575693e-12, "grad_condition": 26886346060.009724, "lr": 0.00014276366018359834, "time_sec": 132.39671301841736 }, { "epoch": 114, "train_loss": 4.528099235992432, "train_acc": 0.0216, "test_loss": 6.349718654632569, "test_acc": 0.01, "lyapunov": 1.6125300259846251, "grad_norm": 0.24308443287212356, "grad_max_sv": 0.09617761392146348, "grad_min_sv": 2.4579975111898598e-11, "grad_condition": 33881398145.36089, "lr": 0.00013551568628929425, "time_sec": 132.3225646018982 }, { "epoch": 115, "train_loss": 4.519340593109131, "train_acc": 0.02402, "test_loss": 6.121589573669434, "test_acc": 0.01, "lyapunov": 1.6377504332291195, "grad_norm": 0.2592364007942639, "grad_max_sv": 0.09955059625208378, "grad_min_sv": 9.771481077080514e-11, "grad_condition": 10355098029.396868, "lr": 0.00012842758726130276, "time_sec": 132.17340803146362 }, { "epoch": 116, "train_loss": 4.532410475921631, "train_acc": 0.02288, "test_loss": 6.244934426879883, "test_acc": 0.01, "lyapunov": 1.666187497660937, "grad_norm": 0.31169546460365094, "grad_max_sv": 0.09843376744538546, "grad_min_sv": 5.1638096920723736e-11, "grad_condition": 18012362556.947014, "lr": 0.0001215024721741218, "time_sec": 132.24165844917297 }, { "epoch": 117, "train_loss": 4.535684629211426, "train_acc": 0.0223, "test_loss": 6.586191843414307, "test_acc": 0.01, "lyapunov": 1.6899945476780767, "grad_norm": 0.3135195405807995, "grad_max_sv": 0.10071753729134798, "grad_min_sv": 7.336645736394951e-11, "grad_condition": 12673080594.516361, "lr": 0.00011474337861210538, "time_sec": 132.23825097084045 }, { "epoch": 118, "train_loss": 4.546351953430176, "train_acc": 0.02212, "test_loss": 6.257575799560547, "test_acc": 0.01, "lyapunov": 1.7288513323839974, "grad_norm": 0.41941424039533404, "grad_max_sv": 0.09607745744287968, "grad_min_sv": 7.789500681913805e-11, "grad_condition": 16545952885.282751, "lr": 0.00010815327133708009, "time_sec": 132.21766591072083 }, { "epoch": 119, "train_loss": 4.531073229370117, "train_acc": 0.02256, "test_loss": 6.456183740997314, "test_acc": 0.01, "lyapunov": 1.6964583756673672, "grad_norm": 0.25613400920512375, "grad_max_sv": 0.09485051818192006, "grad_min_sv": 4.685287637259971e-11, "grad_condition": 12061244650.910728, "lr": 0.00010173504098790182, "time_sec": 132.30614709854126 }, { "epoch": 120, "train_loss": 4.541061541137696, "train_acc": 0.0237, "test_loss": 6.413670517730713, "test_acc": 0.01, "lyapunov": 1.739644906709871, "grad_norm": 0.3693183435156443, "grad_max_sv": 0.09833505425194744, "grad_min_sv": 3.894246489996689e-11, "grad_condition": 17507367358.884224, "lr": 9.549150281252629e-05, "time_sec": 132.18320536613464 }, { "epoch": 121, "train_loss": 4.5607890040588375, "train_acc": 0.0232, "test_loss": 6.3454551567077635, "test_acc": 0.01, "lyapunov": 1.8264712491608641, "grad_norm": 0.8551675055665584, "grad_max_sv": 0.1001248000189662, "grad_min_sv": 3.8870165434796247e-10, "grad_condition": 11774673434.16497, "lr": 8.942539543314794e-05, "time_sec": 132.19883823394775 }, { "epoch": 122, "train_loss": 4.561086259918213, "train_acc": 0.02154, "test_loss": 5.992345477294922, "test_acc": 0.01, "lyapunov": 1.802467906566532, "grad_norm": 0.35207234081524835, "grad_max_sv": 0.09587623235711362, "grad_min_sv": 3.822705043577684e-10, "grad_condition": 17845122251.05708, "lr": 8.353937964495024e-05, "time_sec": 132.44755220413208 }, { "epoch": 123, "train_loss": 4.573194706115722, "train_acc": 0.02058, "test_loss": 5.8545154296875, "test_acc": 0.01, "lyapunov": 1.816409704020566, "grad_norm": 0.3735027051691648, "grad_max_sv": 0.09373153795404505, "grad_min_sv": 2.715693798334913e-11, "grad_condition": 28875711989.57364, "lr": 7.783603724899243e-05, "time_sec": 132.26207613945007 }, { "epoch": 124, "train_loss": 4.572661248168945, "train_acc": 0.02148, "test_loss": 5.896555422973633, "test_acc": 0.01, "lyapunov": 1.8480512553163806, "grad_norm": 0.3134804302549242, "grad_max_sv": 0.09899624399840831, "grad_min_sv": 1.2754484528129877e-10, "grad_condition": 31805856694.423676, "lr": 7.231786991974666e-05, "time_sec": 132.45608854293823 }, { "epoch": 125, "train_loss": 4.580600358886719, "train_acc": 0.02084, "test_loss": 5.708856204223633, "test_acc": 0.01, "lyapunov": 1.8661305547675209, "grad_norm": 0.5029799512519317, "grad_max_sv": 0.10123962573707104, "grad_min_sv": 1.8373754739270858e-11, "grad_condition": 32052285848.35261, "lr": 6.698729810778072e-05, "time_sec": 132.43874192237854 }, { "epoch": 126, "train_loss": 4.609690670166016, "train_acc": 0.01856, "test_loss": 5.770978012084961, "test_acc": 0.01, "lyapunov": 1.9074160238665998, "grad_norm": 1.9260693563122895, "grad_max_sv": 0.08174233604597703, "grad_min_sv": 5.527462332474612e-11, "grad_condition": 24363510202.6125, "lr": 6.184665997806817e-05, "time_sec": 132.24991106987 }, { "epoch": 127, "train_loss": 4.640943519897461, "train_acc": 0.01876, "test_loss": 5.077701470947265, "test_acc": 0.01, "lyapunov": 1.9559716467967119, "grad_norm": 1.0457106969740626, "grad_max_sv": 0.09646339530616928, "grad_min_sv": 3.4253201033677874e-10, "grad_condition": 17416671105.52501, "lr": 5.6898210384392595e-05, "time_sec": 132.16351675987244 }, { "epoch": 128, "train_loss": 4.598363189086914, "train_acc": 0.02078, "test_loss": 4.975116259765625, "test_acc": 0.01, "lyapunov": 1.8845891751291808, "grad_norm": 0.8220120863964331, "grad_max_sv": 0.08199532476752439, "grad_min_sv": 8.623996275121066e-10, "grad_condition": 9056773581.269657, "lr": 5.214411988029363e-05, "time_sec": 132.3097848892212 }, { "epoch": 129, "train_loss": 4.541455926513672, "train_acc": 0.0247, "test_loss": 5.7549523315429685, "test_acc": 0.01, "lyapunov": 1.8803200340636856, "grad_norm": 0.2569299215166405, "grad_max_sv": 0.10282012969255447, "grad_min_sv": 1.0507987653726909e-09, "grad_condition": 9769165472.089832, "lr": 4.7586473766990294e-05, "time_sec": 132.27577376365662 }, { "epoch": 130, "train_loss": 4.584647702636719, "train_acc": 0.02022, "test_loss": 5.332480350494385, "test_acc": 0.01, "lyapunov": 1.901323552326778, "grad_norm": 0.3548472872087693, "grad_max_sv": 0.1086544806137681, "grad_min_sv": 9.814503552650124e-11, "grad_condition": 22478674485.849125, "lr": 4.32272711786996e-05, "time_sec": 132.3002369403839 }, { "epoch": 131, "train_loss": 4.581521871185303, "train_acc": 0.02126, "test_loss": 5.6270052955627445, "test_acc": 0.01, "lyapunov": 1.9170096432766341, "grad_norm": 0.21502212949334182, "grad_max_sv": 0.10107578802853823, "grad_min_sv": 4.709314182512565e-12, "grad_condition": 28702045833.35929, "lr": 3.906842420574966e-05, "time_sec": 132.58341455459595 }, { "epoch": 132, "train_loss": 4.603923379821778, "train_acc": 0.02086, "test_loss": 5.753756982421875, "test_acc": 0.01, "lyapunov": 2.0209065084262274, "grad_norm": 0.24096511248455096, "grad_max_sv": 0.09993877708911895, "grad_min_sv": 7.1246287590231335e-12, "grad_condition": 29623139032.43003, "lr": 3.5111757055874305e-05, "time_sec": 132.31662130355835 }, { "epoch": 133, "train_loss": 4.622827220458984, "train_acc": 0.02166, "test_loss": 5.880264813232422, "test_acc": 0.01, "lyapunov": 2.0902158723157993, "grad_norm": 0.37428368144939567, "grad_max_sv": 0.09831619988790408, "grad_min_sv": 4.434330920707163e-12, "grad_condition": 32791799106.98709, "lr": 3.1359005254054254e-05, "time_sec": 132.16932916641235 }, { "epoch": 134, "train_loss": 4.6172026605224605, "train_acc": 0.02178, "test_loss": 5.7553314712524415, "test_acc": 0.01, "lyapunov": 2.0609848694423274, "grad_norm": 1.1257846952613533, "grad_max_sv": 0.09743457045406104, "grad_min_sv": 3.0741354169823606e-11, "grad_condition": 13593193192.516785, "lr": 2.7811814881259484e-05, "time_sec": 132.19739365577698 }, { "epoch": 135, "train_loss": 4.635151025238037, "train_acc": 0.021, "test_loss": 5.5024827880859375, "test_acc": 0.01, "lyapunov": 1.9769353912309613, "grad_norm": 2.02772923429031, "grad_max_sv": 0.07839736734087524, "grad_min_sv": 3.7352801946025573e-10, "grad_condition": 6440628915.387049, "lr": 2.4471741852423218e-05, "time_sec": 132.1603286266327 }, { "epoch": 136, "train_loss": 4.68249575958252, "train_acc": 0.0219, "test_loss": 5.25179546508789, "test_acc": 0.01, "lyapunov": 2.0190668633526854, "grad_norm": 1.6997169038698898, "grad_max_sv": 0.08753072819376939, "grad_min_sv": 1.2251687187667402e-09, "grad_condition": 432467715.9748623, "lr": 2.1340251233966362e-05, "time_sec": 132.14581847190857 }, { "epoch": 137, "train_loss": 4.631195866546631, "train_acc": 0.02544, "test_loss": 5.392911587524414, "test_acc": 0.01, "lyapunov": 1.9715384879075657, "grad_norm": 0.7892430119447663, "grad_max_sv": 0.10768030200561043, "grad_min_sv": 1.7614047353271475e-09, "grad_condition": 109282059.02686039, "lr": 1.8418716601170932e-05, "time_sec": 132.1871361732483 }, { "epoch": 138, "train_loss": 4.587350132141113, "train_acc": 0.02568, "test_loss": 5.4693435791015625, "test_acc": 0.01, "lyapunov": 1.991891508821941, "grad_norm": 0.7469521916290953, "grad_max_sv": 0.11756768673658372, "grad_min_sv": 1.9356462725657374e-09, "grad_condition": 1022350892.4888865, "lr": 1.570841943568445e-05, "time_sec": 132.11142563819885 }, { "epoch": 139, "train_loss": 4.577352908630371, "train_acc": 0.02708, "test_loss": 5.601054759979248, "test_acc": 0.01, "lyapunov": 1.9843372856564534, "grad_norm": 0.8085739729926078, "grad_max_sv": 0.12083102430333384, "grad_min_sv": 1.96632062201673e-09, "grad_condition": 76824680.74466217, "lr": 1.3210548563419845e-05, "time_sec": 132.16676545143127 }, { "epoch": 140, "train_loss": 4.552192511444092, "train_acc": 0.02732, "test_loss": 5.383674153137207, "test_acc": 0.01, "lyapunov": 1.9721098985818342, "grad_norm": 0.6793156974859339, "grad_max_sv": 0.12086031896079703, "grad_min_sv": 1.9605524922258888e-09, "grad_condition": 123266932.04338643, "lr": 1.0926199633097203e-05, "time_sec": 132.13540196418762 }, { "epoch": 141, "train_loss": 4.551412692871094, "train_acc": 0.02748, "test_loss": 5.406689046478271, "test_acc": 0.01, "lyapunov": 1.9343544891118394, "grad_norm": 0.6725109238271549, "grad_max_sv": 0.11751907898869832, "grad_min_sv": 1.9861858326650564e-09, "grad_condition": 74216850.21639355, "lr": 8.856374635655688e-06, "time_sec": 132.12982821464539 }, { "epoch": 142, "train_loss": 4.727527248229981, "train_acc": 0.01824, "test_loss": 5.770706779479981, "test_acc": 0.01, "lyapunov": 2.350969208475879, "grad_norm": 2.282933232543126, "grad_max_sv": 0.11755687685454178, "grad_min_sv": 1.4490837774683643e-09, "grad_condition": 631119004.4434631, "lr": 7.001981464747503e-06, "time_sec": 132.14570784568787 }, { "epoch": 143, "train_loss": 4.774733398284912, "train_acc": 0.01748, "test_loss": 5.42293524093628, "test_acc": 0.01, "lyapunov": 2.5337743533541786, "grad_norm": 3.084857123459247, "grad_max_sv": 0.08506426704443584, "grad_min_sv": 1.0878406072247764e-09, "grad_condition": 95670235.35140035, "lr": 5.3638335185058295e-06, "time_sec": 132.17597699165344 }, { "epoch": 144, "train_loss": 4.801961855010986, "train_acc": 0.01764, "test_loss": 5.572767419433593, "test_acc": 0.01, "lyapunov": 2.5992656010191153, "grad_norm": 2.2910220858954014, "grad_max_sv": 0.14899966653709953, "grad_min_sv": 2.0148015595278023e-09, "grad_condition": 176782893.45203692, "lr": 3.942649342761114e-06, "time_sec": 132.12091755867004 }, { "epoch": 145, "train_loss": 4.850462348022461, "train_acc": 0.02024, "test_loss": 5.516320917510987, "test_acc": 0.01, "lyapunov": 2.7130372066936834, "grad_norm": 1.0265954725835216, "grad_max_sv": 0.21464332040486625, "grad_min_sv": 3.1526066665652634e-09, "grad_condition": 97161987.48706797, "lr": 2.7390523158633524e-06, "time_sec": 132.0690953731537 }, { "epoch": 146, "train_loss": 4.856118622894287, "train_acc": 0.02, "test_loss": 5.461014266967774, "test_acc": 0.01, "lyapunov": 2.718469413040239, "grad_norm": 1.0099887200055417, "grad_max_sv": 0.15561392254603562, "grad_min_sv": 2.2754747437366604e-09, "grad_condition": 1019144627.7729056, "lr": 1.7535703752478133e-06, "time_sec": 132.11823773384094 }, { "epoch": 147, "train_loss": 4.924606959075928, "train_acc": 0.01686, "test_loss": 20.649002047729493, "test_acc": 0.01, "lyapunov": 2.6374005685986766, "grad_norm": 3.1423913582004523, "grad_max_sv": 0.21941849166760222, "grad_min_sv": 3.0307538921017438e-09, "grad_condition": 120403007.5867976, "lr": 9.866357858642196e-07, "time_sec": 132.07725739479065 }, { "epoch": 148, "train_loss": 4.767027478179932, "train_acc": 0.01794, "test_loss": 5.494908865356446, "test_acc": 0.01, "lyapunov": 2.1720430088774934, "grad_norm": 3.0001678190775194, "grad_max_sv": 0.06730101421089785, "grad_min_sv": 5.6080486708198344e-11, "grad_condition": 32628105419.335045, "lr": 4.38584950570808e-07, "time_sec": 132.16628646850586 }, { "epoch": 149, "train_loss": 4.725253110198975, "train_acc": 0.01852, "test_loss": 5.4529930709838865, "test_acc": 0.01, "lyapunov": 2.1247258430246805, "grad_norm": 2.425421227254264, "grad_max_sv": 0.06302208096294634, "grad_min_sv": 8.06056723307697e-12, "grad_condition": 24980400399.38557, "lr": 1.096582625772501e-07, "time_sec": 132.17798447608948 }, { "epoch": 150, "train_loss": 4.724624121398926, "train_acc": 0.01896, "test_loss": 5.454324950408935, "test_acc": 0.01, "lyapunov": 2.1117066599219045, "grad_norm": 2.2782652512729027, "grad_max_sv": 0.06824387344677234, "grad_min_sv": 1.3984562009526476e-11, "grad_condition": 35779591216.93815, "lr": 0.0, "time_sec": 132.24787974357605 } ], "16": [ { "epoch": 1, "train_loss": 5.052905302276612, "train_acc": 0.01584, "test_loss": 4.867012271118164, "test_acc": 0.0108, "lyapunov": 2.5116785645789808, "grad_norm": 5.121741212106656, "grad_max_sv": 4.439184683561325, "grad_min_sv": 8.58994061270213e-08, "grad_condition": 81112713.35007669, "lr": 0.0009998903417374227, "time_sec": 177.38097023963928 }, { "epoch": 2, "train_loss": 4.7834703578186035, "train_acc": 0.0185, "test_loss": 4.856568830871582, "test_acc": 0.0105, "lyapunov": 2.04087689069226, "grad_norm": 3.485253038009916, "grad_max_sv": 2.8998831868171693, "grad_min_sv": 5.773870767437905e-08, "grad_condition": 487880276.00022805, "lr": 0.0009995614150494292, "time_sec": 177.40509605407715 }, { "epoch": 3, "train_loss": 4.663032297821045, "train_acc": 0.01814, "test_loss": 4.829788903808594, "test_acc": 0.01, "lyapunov": 1.8697960974310366, "grad_norm": 2.5433134222817766, "grad_max_sv": 1.7969021894054094, "grad_min_sv": 3.7302616086586385e-08, "grad_condition": 424272904.7057018, "lr": 0.0009990133642141358, "time_sec": 177.55998063087463 }, { "epoch": 4, "train_loss": 4.580566212463379, "train_acc": 0.01816, "test_loss": 5.0227375442504885, "test_acc": 0.01, "lyapunov": 1.7420489681346336, "grad_norm": 1.5123120559078784, "grad_max_sv": 1.0997331857681274, "grad_min_sv": 2.3435378404546015e-08, "grad_condition": 50550380.27519056, "lr": 0.0009982464296247522, "time_sec": 177.36285305023193 }, { "epoch": 5, "train_loss": 4.571687319335937, "train_acc": 0.0169, "test_loss": 4.605651480102539, "test_acc": 0.01, "lyapunov": 1.7220315366144985, "grad_norm": 1.03184611340308, "grad_max_sv": 0.7467024937272072, "grad_min_sv": 9.665682879938559e-09, "grad_condition": 55185094270.727005, "lr": 0.0009972609476841367, "time_sec": 177.37269806861877 }, { "epoch": 6, "train_loss": 4.555875413513184, "train_acc": 0.01516, "test_loss": 4.674408260345459, "test_acc": 0.01, "lyapunov": 1.7398752916194593, "grad_norm": 0.9957876060665515, "grad_max_sv": 0.5100040049292147, "grad_min_sv": 2.519896859816943e-10, "grad_condition": 106528792765.2457, "lr": 0.000996057350657239, "time_sec": 177.46758604049683 }, { "epoch": 7, "train_loss": 4.543562595672608, "train_acc": 0.01678, "test_loss": 4.860989706420899, "test_acc": 0.01, "lyapunov": 1.7311897963818992, "grad_norm": 0.6570743063224779, "grad_max_sv": 0.5500264666974545, "grad_min_sv": 1.8619091907383225e-09, "grad_condition": 101307067487.53836, "lr": 0.000994636166481494, "time_sec": 177.4092240333557 }, { "epoch": 8, "train_loss": 4.546422679748535, "train_acc": 0.01748, "test_loss": 4.704587471008301, "test_acc": 0.01, "lyapunov": 1.7199046867887686, "grad_norm": 0.6503196899352705, "grad_max_sv": 0.4841625154018402, "grad_min_sv": 1.3860141552013199e-09, "grad_condition": 92427076016.0824, "lr": 0.0009929980185352525, "time_sec": 177.34343218803406 }, { "epoch": 9, "train_loss": 4.555562373046875, "train_acc": 0.01632, "test_loss": 4.984462910461426, "test_acc": 0.01, "lyapunov": 1.7168824087323435, "grad_norm": 0.4710924143848028, "grad_max_sv": 0.3569773003458977, "grad_min_sv": 2.9924371274558933e-12, "grad_condition": 163638150611.22946, "lr": 0.0009911436253643444, "time_sec": 177.2937033176422 }, { "epoch": 10, "train_loss": 4.572519063873291, "train_acc": 0.01446, "test_loss": 4.622131011962891, "test_acc": 0.01, "lyapunov": 1.6881294174267507, "grad_norm": 0.5058537650400963, "grad_max_sv": 0.36440472304821014, "grad_min_sv": 6.516127066976764e-13, "grad_condition": 259926216911.04242, "lr": 0.0009890738003669028, "time_sec": 177.31165838241577 }, { "epoch": 11, "train_loss": 4.565913163909912, "train_acc": 0.01558, "test_loss": 5.445963431549072, "test_acc": 0.01, "lyapunov": 1.6539141406183657, "grad_norm": 0.48047604578041114, "grad_max_sv": 0.3803807333111763, "grad_min_sv": 9.42464814059806e-13, "grad_condition": 226641538861.88174, "lr": 0.00098678945143658, "time_sec": 177.28680086135864 }, { "epoch": 12, "train_loss": 4.585704666290283, "train_acc": 0.01426, "test_loss": 5.591514777374267, "test_acc": 0.01, "lyapunov": 1.6391262849578467, "grad_norm": 0.3984247324953335, "grad_max_sv": 0.32813584208488467, "grad_min_sv": 9.868289842027034e-13, "grad_condition": 205156435878.04105, "lr": 0.0009842915805643154, "time_sec": 177.34117722511292 }, { "epoch": 13, "train_loss": 4.604436149597168, "train_acc": 0.01222, "test_loss": 4.690793671417237, "test_acc": 0.01, "lyapunov": 1.641747108810698, "grad_norm": 0.3654356558343784, "grad_max_sv": 0.2650721728801727, "grad_min_sv": 2.5128712845214346e-14, "grad_condition": 259015002047.89975, "lr": 0.000981581283398829, "time_sec": 177.3893666267395 }, { "epoch": 14, "train_loss": 4.607583849945068, "train_acc": 0.01194, "test_loss": 4.637583544921875, "test_acc": 0.01, "lyapunov": 1.647905475953046, "grad_norm": 0.3152206467371112, "grad_max_sv": 0.24337820373475552, "grad_min_sv": 2.2884600952186276e-19, "grad_condition": 243378149152.73965, "lr": 0.0009786597487660333, "time_sec": 177.42928194999695 }, { "epoch": 15, "train_loss": 4.609895180664062, "train_acc": 0.01204, "test_loss": 4.618253812408447, "test_acc": 0.01, "lyapunov": 1.631026401239283, "grad_norm": 0.2910629294744733, "grad_max_sv": 0.25453653037548063, "grad_min_sv": 1.096334686408586e-14, "grad_condition": 251632031244.05, "lr": 0.0009755282581475766, "time_sec": 177.26571369171143 }, { "epoch": 16, "train_loss": 4.620552892456055, "train_acc": 0.01092, "test_loss": 4.829088508605957, "test_acc": 0.01, "lyapunov": 1.6514442287137747, "grad_norm": 0.32315656842976964, "grad_max_sv": 0.2540007773786783, "grad_min_sv": 2.6148553957350966e-15, "grad_condition": 253349213677.79898, "lr": 0.0009721881851187403, "time_sec": 177.23212313652039 }, { "epoch": 17, "train_loss": 4.645780512695312, "train_acc": 0.01148, "test_loss": 5.213332609558106, "test_acc": 0.0118, "lyapunov": 1.7068933586940132, "grad_norm": 0.4780888546414525, "grad_max_sv": 0.33272466212511065, "grad_min_sv": 1.1442340742877327e-13, "grad_condition": 310520393785.63025, "lr": 0.0009686409947459456, "time_sec": 177.3003396987915 }, { "epoch": 18, "train_loss": 4.643788212127686, "train_acc": 0.01072, "test_loss": 4.7405077087402345, "test_acc": 0.01, "lyapunov": 1.700578610305591, "grad_norm": 0.4623759718719876, "grad_max_sv": 0.36730299033224584, "grad_min_sv": 3.818205128193156e-15, "grad_condition": 365867778353.78564, "lr": 0.0009648882429441254, "time_sec": 177.37098169326782 }, { "epoch": 19, "train_loss": 4.6578716897583, "train_acc": 0.0106, "test_loss": 5.001485794830322, "test_acc": 0.01, "lyapunov": 1.7619636241737229, "grad_norm": 0.5961977275221398, "grad_max_sv": 0.3942902203649282, "grad_min_sv": 2.946577326860146e-13, "grad_condition": 343308843771.1844, "lr": 0.00096093157579425, "time_sec": 177.48300218582153 }, { "epoch": 20, "train_loss": 4.671879530639648, "train_acc": 0.00988, "test_loss": 4.9071829193115235, "test_acc": 0.01, "lyapunov": 1.8025801248867492, "grad_norm": 0.5059310784067265, "grad_max_sv": 0.3557112220674753, "grad_min_sv": 1.5333297747627812e-13, "grad_condition": 328969482461.7643, "lr": 0.0009567727288213001, "time_sec": 177.32300353050232 }, { "epoch": 21, "train_loss": 4.653441105194092, "train_acc": 0.0101, "test_loss": 5.037871252441406, "test_acc": 0.01, "lyapunov": 1.7085216252700142, "grad_norm": 0.3698981456336605, "grad_max_sv": 0.32922359369695187, "grad_min_sv": 2.0854029706572434e-14, "grad_condition": 323091955093.61206, "lr": 0.0009524135262330095, "time_sec": 177.3196620941162 }, { "epoch": 22, "train_loss": 4.632678106536865, "train_acc": 0.01074, "test_loss": 5.238784426116943, "test_acc": 0.01, "lyapunov": 1.6952984226329246, "grad_norm": 0.4241090659984796, "grad_max_sv": 0.386181453615427, "grad_min_sv": 2.802362135740985e-14, "grad_condition": 377561785396.401, "lr": 0.0009478558801197061, "time_sec": 177.29510116577148 }, { "epoch": 23, "train_loss": 4.638225617523194, "train_acc": 0.01138, "test_loss": 5.275448854064941, "test_acc": 0.01, "lyapunov": 1.6717191449821454, "grad_norm": 0.4690453217532838, "grad_max_sv": 0.36180934831500056, "grad_min_sv": 7.689419929357006e-14, "grad_condition": 343504771054.1229, "lr": 0.000943101789615607, "time_sec": 177.27985095977783 }, { "epoch": 24, "train_loss": 4.645476407775879, "train_acc": 0.01184, "test_loss": 5.105841419219971, "test_acc": 0.01, "lyapunov": 1.6884696520198033, "grad_norm": 0.46211885946676406, "grad_max_sv": 0.41755540743470193, "grad_min_sv": 3.2064806913220934e-13, "grad_condition": 342942332027.1542, "lr": 0.0009381533400219313, "time_sec": 177.25587034225464 }, { "epoch": 25, "train_loss": 4.6320624351501465, "train_acc": 0.0119, "test_loss": 6.030343013000488, "test_acc": 0.01, "lyapunov": 1.707195217042323, "grad_norm": 0.5021589283462617, "grad_max_sv": 0.39102165041840636, "grad_min_sv": 5.243264004713223e-13, "grad_condition": 307511385553.97986, "lr": 0.0009330127018922189, "time_sec": 177.37623739242554 }, { "epoch": 26, "train_loss": 4.612996809234619, "train_acc": 0.0124, "test_loss": 4.7069967758178715, "test_acc": 0.01, "lyapunov": 1.6614662732004815, "grad_norm": 0.41182683188165653, "grad_max_sv": 0.36811394318938256, "grad_min_sv": 1.8671300799803038e-13, "grad_condition": 326597103772.6738, "lr": 0.000927682130080253, "time_sec": 177.34338855743408 }, { "epoch": 27, "train_loss": 4.615120216217041, "train_acc": 0.01294, "test_loss": 5.169810830688476, "test_acc": 0.01, "lyapunov": 1.6869621197585865, "grad_norm": 0.48352542649856634, "grad_max_sv": 0.40701944530010226, "grad_min_sv": 2.212590997783025e-13, "grad_condition": 351263915868.759, "lr": 0.0009221639627510072, "time_sec": 177.37520146369934 }, { "epoch": 28, "train_loss": 4.618173647613525, "train_acc": 0.0121, "test_loss": 4.701211013793945, "test_acc": 0.01, "lyapunov": 1.6625224543959283, "grad_norm": 0.49633059160738635, "grad_max_sv": 0.42104807291179897, "grad_min_sv": 8.098768546668247e-14, "grad_condition": 390777126515.4154, "lr": 0.0009164606203550494, "time_sec": 177.30147242546082 }, { "epoch": 29, "train_loss": 4.620836652526855, "train_acc": 0.01168, "test_loss": 5.855577803039551, "test_acc": 0.01, "lyapunov": 1.6738867168231388, "grad_norm": 0.46837018531534874, "grad_max_sv": 0.41829773411154747, "grad_min_sv": 6.839261746330108e-14, "grad_condition": 396621981755.1995, "lr": 0.0009105746045668516, "time_sec": 177.59404516220093 }, { "epoch": 30, "train_loss": 4.620147025604248, "train_acc": 0.01212, "test_loss": 5.105264408111572, "test_acc": 0.0024, "lyapunov": 1.6637281100158496, "grad_norm": 0.5269676291306111, "grad_max_sv": 0.4443404793739319, "grad_min_sv": 4.246975380253858e-14, "grad_condition": 429585177175.7853, "lr": 0.0009045084971874733, "time_sec": 177.3182647228241 }, { "epoch": 31, "train_loss": 4.6263528985595705, "train_acc": 0.01214, "test_loss": 4.881978817749023, "test_acc": 0.01, "lyapunov": 1.679152080774917, "grad_norm": 0.4813838001178168, "grad_max_sv": 0.44175935424864293, "grad_min_sv": 7.640593233486203e-14, "grad_condition": 412963565609.7972, "lr": 0.0008982649590120977, "time_sec": 177.52869391441345 }, { "epoch": 32, "train_loss": 4.64666208404541, "train_acc": 0.01024, "test_loss": 4.607140179443359, "test_acc": 0.01, "lyapunov": 1.6733192260308034, "grad_norm": 0.9644658562133654, "grad_max_sv": 0.32155169621109964, "grad_min_sv": 4.501243792038921e-14, "grad_condition": 307022698703.9159, "lr": 0.0008918467286629196, "time_sec": 177.55723929405212 }, { "epoch": 33, "train_loss": 4.629158392181396, "train_acc": 0.01256, "test_loss": 4.610281867980957, "test_acc": 0.01, "lyapunov": 1.7062030826383234, "grad_norm": 0.8603320661340712, "grad_max_sv": 0.3315905283205211, "grad_min_sv": 1.30026839163971e-13, "grad_condition": 311972159847.4972, "lr": 0.0008852566213878943, "time_sec": 177.52309370040894 }, { "epoch": 34, "train_loss": 4.61046769607544, "train_acc": 0.01252, "test_loss": 4.61788650970459, "test_acc": 0.01, "lyapunov": 1.6976071282116043, "grad_norm": 0.49261012177272534, "grad_max_sv": 0.3965699575841427, "grad_min_sv": 1.5454696301012257e-13, "grad_condition": 361671513434.2426, "lr": 0.000878497527825878, "time_sec": 177.35865092277527 }, { "epoch": 35, "train_loss": 4.610115225982666, "train_acc": 0.0133, "test_loss": 4.610134786224365, "test_acc": 0.01, "lyapunov": 1.7059512098731897, "grad_norm": 0.6359621148942639, "grad_max_sv": 0.38861413495615127, "grad_min_sv": 4.932618749060156e-13, "grad_condition": 303490840826.2363, "lr": 0.000871572412738697, "time_sec": 177.262850522995 }, { "epoch": 36, "train_loss": 4.599939749145507, "train_acc": 0.01366, "test_loss": 4.967366139221191, "test_acc": 0.01, "lyapunov": 1.6910303544510357, "grad_norm": 0.48781695526823965, "grad_max_sv": 0.3771605670452118, "grad_min_sv": 1.087613697669073e-12, "grad_condition": 257003832809.76837, "lr": 0.0008644843137107055, "time_sec": 177.29217314720154 }, { "epoch": 37, "train_loss": 4.5619960546875, "train_acc": 0.01694, "test_loss": 4.731475791931152, "test_acc": 0.01, "lyapunov": 1.6942788399089024, "grad_norm": 0.5025968244527356, "grad_max_sv": 0.3710522945970297, "grad_min_sv": 1.7366462838151458e-12, "grad_condition": 182613054683.41757, "lr": 0.0008572363398164014, "time_sec": 177.32313704490662 }, { "epoch": 38, "train_loss": 4.565163485412597, "train_acc": 0.01702, "test_loss": 4.821879299926758, "test_acc": 0.01, "lyapunov": 1.7136198645052703, "grad_norm": 0.3647367948752072, "grad_max_sv": 0.2595147430896759, "grad_min_sv": 8.982830963644869e-13, "grad_condition": 165264606800.54236, "lr": 0.0008498316702566826, "time_sec": 177.30079579353333 }, { "epoch": 39, "train_loss": 4.564778382873535, "train_acc": 0.01674, "test_loss": 4.7682116500854494, "test_acc": 0.01, "lyapunov": 1.717852655579062, "grad_norm": 0.3050778193964112, "grad_max_sv": 0.23688307516276835, "grad_min_sv": 7.061831886877416e-13, "grad_condition": 158702297955.0819, "lr": 0.0008422735529643442, "time_sec": 177.48431873321533 }, { "epoch": 40, "train_loss": 4.5591833352661135, "train_acc": 0.0181, "test_loss": 4.824417631530761, "test_acc": 0.01, "lyapunov": 1.7331721334506178, "grad_norm": 0.3159273980899205, "grad_max_sv": 0.2037038005888462, "grad_min_sv": 9.425467893049303e-13, "grad_condition": 137011838971.33943, "lr": 0.0008345653031794289, "time_sec": 177.31830286979675 }, { "epoch": 41, "train_loss": 4.578043832092285, "train_acc": 0.01756, "test_loss": 4.636139833068848, "test_acc": 0.01, "lyapunov": 1.8264592937801196, "grad_norm": 0.3694732916545973, "grad_max_sv": 0.18727784380316734, "grad_min_sv": 5.982392141838314e-13, "grad_condition": 126511514412.27226, "lr": 0.0008267103019950526, "time_sec": 177.335711479187 }, { "epoch": 42, "train_loss": 4.673806926269531, "train_acc": 0.01194, "test_loss": 4.6080057914733885, "test_acc": 0.01, "lyapunov": 1.9006618404632334, "grad_norm": 1.9332134687963871, "grad_max_sv": 0.11263461007879413, "grad_min_sv": 3.077567965127664e-13, "grad_condition": 84300063979.57101, "lr": 0.0008187119948743447, "time_sec": 177.32483506202698 }, { "epoch": 43, "train_loss": 4.688161468811035, "train_acc": 0.01068, "test_loss": 4.629961785125732, "test_acc": 0.01, "lyapunov": 1.7131454627532179, "grad_norm": 0.6010997717026842, "grad_max_sv": 0.29899735348299145, "grad_min_sv": 2.479182783007377e-09, "grad_condition": 66211640983.312706, "lr": 0.000810573890139155, "time_sec": 177.3025574684143 }, { "epoch": 44, "train_loss": 4.646988244628906, "train_acc": 0.0095, "test_loss": 4.6228884521484375, "test_acc": 0.01, "lyapunov": 1.5909017861041876, "grad_norm": 0.3503759029299944, "grad_max_sv": 0.2046256795525551, "grad_min_sv": 3.5303733441678653e-14, "grad_condition": 197873606364.90146, "lr": 0.0008022995574311873, "time_sec": 177.30037641525269 }, { "epoch": 45, "train_loss": 4.643654596862793, "train_acc": 0.00948, "test_loss": 4.658484869384766, "test_acc": 0.01, "lyapunov": 1.5862659612275145, "grad_norm": 0.2656233273924739, "grad_max_sv": 0.17473686374723912, "grad_min_sv": 1.813760877293352e-16, "grad_condition": 174705104463.56973, "lr": 0.0007938926261462363, "time_sec": 177.3814389705658 }, { "epoch": 46, "train_loss": 4.64409400894165, "train_acc": 0.0089, "test_loss": 4.812335470581055, "test_acc": 0.01, "lyapunov": 1.590341107619693, "grad_norm": 0.2648745471846797, "grad_max_sv": 0.16318325139582157, "grad_min_sv": 9.479088537998935e-17, "grad_condition": 163165251374.67862, "lr": 0.0007853567838422158, "time_sec": 177.3781590461731 }, { "epoch": 47, "train_loss": 4.643036758270264, "train_acc": 0.00928, "test_loss": 4.609914025878906, "test_acc": 0.01, "lyapunov": 1.5894581573393645, "grad_norm": 0.2691116464860412, "grad_max_sv": 0.15965580381453037, "grad_min_sv": 1.0509738482436128e-46, "grad_condition": 159655803814.53036, "lr": 0.0007766957746216719, "time_sec": 177.31791877746582 }, { "epoch": 48, "train_loss": 4.642327072753906, "train_acc": 0.00992, "test_loss": 4.8127995941162105, "test_acc": 0.01, "lyapunov": 1.5860872100991057, "grad_norm": 0.23492399170085265, "grad_max_sv": 0.1611787799745798, "grad_min_sv": 6.216856363016735e-39, "grad_condition": 161178779974.57983, "lr": 0.0007679133974894982, "time_sec": 177.36284637451172 }, { "epoch": 49, "train_loss": 4.642729123077393, "train_acc": 0.00984, "test_loss": 4.621463303375244, "test_acc": 0.01, "lyapunov": 1.591500211859603, "grad_norm": 0.21793856766380534, "grad_max_sv": 0.15185034908354283, "grad_min_sv": 2.264801692824062e-26, "grad_condition": 151850349083.53925, "lr": 0.000759013504686565, "time_sec": 177.32554411888123 }, { "epoch": 50, "train_loss": 4.643996462554932, "train_acc": 0.0102, "test_loss": 4.609245301818848, "test_acc": 0.01, "lyapunov": 1.5983945966681556, "grad_norm": 0.22457837692293584, "grad_max_sv": 0.15547131709754466, "grad_min_sv": 0.0, "grad_condition": 155471317097.54468, "lr": 0.0007499999999999998, "time_sec": 177.34761261940002 }, { "epoch": 51, "train_loss": 4.6476463407897946, "train_acc": 0.0094, "test_loss": 4.637005358123779, "test_acc": 0.01, "lyapunov": 1.608639404291997, "grad_norm": 0.22991701525164646, "grad_max_sv": 0.14587618354707957, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 145876183547.07956, "lr": 0.0007408768370508575, "time_sec": 177.40973281860352 }, { "epoch": 52, "train_loss": 4.643522353057861, "train_acc": 0.0091, "test_loss": 4.635898374176025, "test_acc": 0.01, "lyapunov": 1.5934445269577338, "grad_norm": 0.2512821617756961, "grad_max_sv": 0.11034320006147028, "grad_min_sv": 4.951726746617114e-32, "grad_condition": 110343200061.47026, "lr": 0.0007316480175599307, "time_sec": 177.36693692207336 }, { "epoch": 53, "train_loss": 4.652315429840088, "train_acc": 0.00954, "test_loss": 4.609224298095703, "test_acc": 0.01, "lyapunov": 1.634396403951718, "grad_norm": 0.5467593180422932, "grad_max_sv": 0.09123059632256628, "grad_min_sv": 2.430316909663535e-15, "grad_condition": 90896353773.23637, "lr": 0.0007223175895924635, "time_sec": 177.31507325172424 }, { "epoch": 54, "train_loss": 4.651325719604492, "train_acc": 0.00994, "test_loss": 4.626620025634765, "test_acc": 0.01, "lyapunov": 1.611309678048429, "grad_norm": 0.2940157240002703, "grad_max_sv": 0.13391106240451336, "grad_min_sv": 3.421636554179791e-13, "grad_condition": 110883017208.70781, "lr": 0.0007128896457825361, "time_sec": 177.39624953269958 }, { "epoch": 55, "train_loss": 4.64362153503418, "train_acc": 0.00934, "test_loss": 4.62131148147583, "test_acc": 0.01, "lyapunov": 1.5918327890088797, "grad_norm": 0.17460806885429525, "grad_max_sv": 0.08889081897214055, "grad_min_sv": 1.944495872420277e-15, "grad_condition": 88670543660.1524, "lr": 0.0007033683215378998, "time_sec": 177.32203340530396 }, { "epoch": 56, "train_loss": 4.644567786254883, "train_acc": 0.00952, "test_loss": 4.62790345993042, "test_acc": 0.01, "lyapunov": 1.5998888466974048, "grad_norm": 0.16766781878427695, "grad_max_sv": 0.07534359227865935, "grad_min_sv": 6.543167764955624e-20, "grad_condition": 75343581885.12659, "lr": 0.0006937577932260512, "time_sec": 177.3884792327881 }, { "epoch": 57, "train_loss": 4.644828259429931, "train_acc": 0.00976, "test_loss": 4.606487982940674, "test_acc": 0.01, "lyapunov": 1.5974730362977518, "grad_norm": 0.1793373629191484, "grad_max_sv": 0.07966042589396238, "grad_min_sv": 6.23405577303343e-15, "grad_condition": 78875044427.86894, "lr": 0.0006840622763423388, "time_sec": 177.43391919136047 }, { "epoch": 58, "train_loss": 4.644080760650635, "train_acc": 0.0091, "test_loss": 4.625753155517578, "test_acc": 0.01, "lyapunov": 1.6024256923314555, "grad_norm": 0.2678862199559515, "grad_max_sv": 0.06979989502578973, "grad_min_sv": 2.271738328433089e-16, "grad_condition": 69772902566.56038, "lr": 0.0006742860236609073, "time_sec": 177.34277653694153 }, { "epoch": 59, "train_loss": 4.642539700622558, "train_acc": 0.0104, "test_loss": 4.606066676330566, "test_acc": 0.01, "lyapunov": 1.5953022006832425, "grad_norm": 0.18186171250969738, "grad_max_sv": 0.052746226685121654, "grad_min_sv": 0.0, "grad_condition": 52746226685.12166, "lr": 0.0006644333233692913, "time_sec": 177.2813150882721 }, { "epoch": 60, "train_loss": 4.643028160400391, "train_acc": 0.0096, "test_loss": 4.606985287475586, "test_acc": 0.01, "lyapunov": 1.5944073910603438, "grad_norm": 0.16605928285367347, "grad_max_sv": 0.04408669015392661, "grad_min_sv": 0.0, "grad_condition": 44086690153.926605, "lr": 0.0006545084971874734, "time_sec": 177.34340691566467 }, { "epoch": 61, "train_loss": 4.641566214599609, "train_acc": 0.00942, "test_loss": 4.6096303787231445, "test_acc": 0.01, "lyapunov": 1.5902936217730002, "grad_norm": 0.17097577525317767, "grad_max_sv": 0.048659399058669804, "grad_min_sv": 0.0, "grad_condition": 48659399058.6698, "lr": 0.0006445158984722354, "time_sec": 177.41231846809387 }, { "epoch": 62, "train_loss": 4.643437232666016, "train_acc": 0.00904, "test_loss": 4.614830825805664, "test_acc": 0.01, "lyapunov": 1.597925158717748, "grad_norm": 0.17398079786227064, "grad_max_sv": 0.04662688081152737, "grad_min_sv": 0.0, "grad_condition": 46626880811.52737, "lr": 0.0006344599103076324, "time_sec": 177.41233468055725 }, { "epoch": 63, "train_loss": 4.64204384475708, "train_acc": 0.01014, "test_loss": 4.608532351684571, "test_acc": 0.01, "lyapunov": 1.591071292567436, "grad_norm": 0.18148049003675806, "grad_max_sv": 0.03887187172658742, "grad_min_sv": 0.0, "grad_condition": 38871871726.58742, "lr": 0.0006243449435824269, "time_sec": 177.32782816886902 }, { "epoch": 64, "train_loss": 4.642362080993652, "train_acc": 0.00976, "test_loss": 4.605919379425049, "test_acc": 0.01, "lyapunov": 1.59339769935364, "grad_norm": 0.16947785318867856, "grad_max_sv": 0.04678878029808402, "grad_min_sv": 0.0, "grad_condition": 46788780298.08402, "lr": 0.0006141754350553275, "time_sec": 177.36176109313965 }, { "epoch": 65, "train_loss": 4.64135870513916, "train_acc": 0.0098, "test_loss": 4.6061177238464355, "test_acc": 0.01, "lyapunov": 1.5889410545758884, "grad_norm": 0.200660646453697, "grad_max_sv": 0.052430361462756994, "grad_min_sv": 0.0, "grad_condition": 52430361462.75699, "lr": 0.0006039558454088793, "time_sec": 177.57254838943481 }, { "epoch": 66, "train_loss": 4.6474862211608885, "train_acc": 0.00968, "test_loss": 4.605675552368164, "test_acc": 0.01, "lyapunov": 1.6025549606289096, "grad_norm": 0.24193311739345152, "grad_max_sv": 0.06446847971528769, "grad_min_sv": 8.023691354480991e-14, "grad_condition": 58142616242.219055, "lr": 0.000593690657292862, "time_sec": 177.27647042274475 }, { "epoch": 67, "train_loss": 4.6455588671875, "train_acc": 0.00932, "test_loss": 4.608942795562744, "test_acc": 0.01, "lyapunov": 1.6029961197577474, "grad_norm": 0.5642775506276186, "grad_max_sv": 0.06661056466400624, "grad_min_sv": 4.989178535200188e-27, "grad_condition": 66610564664.00575, "lr": 0.0005833843733580507, "time_sec": 177.30575489997864 }, { "epoch": 68, "train_loss": 4.6422839654541015, "train_acc": 0.00948, "test_loss": 4.613675955200195, "test_acc": 0.01, "lyapunov": 1.5871542494010438, "grad_norm": 0.40260870408483307, "grad_max_sv": 0.06906388867646455, "grad_min_sv": 2.943967978666477e-19, "grad_condition": 69063862019.90744, "lr": 0.0005730415142812054, "time_sec": 177.3839509487152 }, { "epoch": 69, "train_loss": 4.641787251281738, "train_acc": 0.0095, "test_loss": 4.605676875305176, "test_acc": 0.01, "lyapunov": 1.5912645625336397, "grad_norm": 0.34254968614340625, "grad_max_sv": 0.04287184816785157, "grad_min_sv": 0.0, "grad_condition": 42871848167.85156, "lr": 0.0005626666167821517, "time_sec": 177.32984590530396 }, { "epoch": 70, "train_loss": 4.651252772827148, "train_acc": 0.00948, "test_loss": 4.605676740264893, "test_acc": 0.01, "lyapunov": 1.6005148091889403, "grad_norm": 0.32314191918702384, "grad_max_sv": 0.07503386735916137, "grad_min_sv": 1.515944273746056e-14, "grad_condition": 72060515877.79199, "lr": 0.0005522642316338265, "time_sec": 177.35727500915527 }, { "epoch": 71, "train_loss": 4.642202633666992, "train_acc": 0.00952, "test_loss": 4.60564603805542, "test_acc": 0.01, "lyapunov": 1.5934118678807603, "grad_norm": 0.19098601600212814, "grad_max_sv": 0.04769439417868852, "grad_min_sv": 0.0, "grad_condition": 47694394178.68852, "lr": 0.0005418389216661573, "time_sec": 177.31805086135864 }, { "epoch": 72, "train_loss": 4.643372284545898, "train_acc": 0.01042, "test_loss": 4.605551630401611, "test_acc": 0.01, "lyapunov": 1.6024812432506201, "grad_norm": 0.1850692588702891, "grad_max_sv": 0.029727647779509425, "grad_min_sv": 0.0, "grad_condition": 29727647779.509422, "lr": 0.0005313952597646563, "time_sec": 177.26796555519104 }, { "epoch": 73, "train_loss": 4.640834873046875, "train_acc": 0.01012, "test_loss": 4.605487160491943, "test_acc": 0.01, "lyapunov": 1.5882229832432153, "grad_norm": 0.18526548732293277, "grad_max_sv": 0.037329256813973186, "grad_min_sv": 0.0, "grad_condition": 37329256813.97318, "lr": 0.0005209378268645994, "time_sec": 177.25225377082825 }, { "epoch": 74, "train_loss": 4.64209197479248, "train_acc": 0.00906, "test_loss": 4.605482194519043, "test_acc": 0.01, "lyapunov": 1.5956125628307958, "grad_norm": 0.19272835899448448, "grad_max_sv": 0.03931440911255777, "grad_min_sv": 0.0, "grad_condition": 39314409112.55777, "lr": 0.0005104712099416781, "time_sec": 177.2522575855255 }, { "epoch": 75, "train_loss": 4.646220574035644, "train_acc": 0.00904, "test_loss": 4.605418196105957, "test_acc": 0.01, "lyapunov": 1.6149345593684166, "grad_norm": 0.18848455976917208, "grad_max_sv": 0.03723890888504684, "grad_min_sv": 0.0, "grad_condition": 37238908885.04684, "lr": 0.0004999999999999996, "time_sec": 177.2818944454193 }, { "epoch": 76, "train_loss": 4.648384475402832, "train_acc": 0.00998, "test_loss": 4.6053966011047365, "test_acc": 0.01, "lyapunov": 1.6287647842446251, "grad_norm": 1.8057917745549752, "grad_max_sv": 0.029743389310897327, "grad_min_sv": 3.7199142558296474e-21, "grad_condition": 29743389301.013134, "lr": 0.0004895287900583212, "time_sec": 177.26618552207947 }, { "epoch": 77, "train_loss": 4.721213637390137, "train_acc": 0.00964, "test_loss": 4.6436636322021485, "test_acc": 0.01, "lyapunov": 2.058074002985454, "grad_norm": 3.091860129305993, "grad_max_sv": 0.054268574403249656, "grad_min_sv": 8.376052745740116e-34, "grad_condition": 54268574403.24966, "lr": 0.0004790621731353997, "time_sec": 177.27104544639587 }, { "epoch": 78, "train_loss": 4.721108419342041, "train_acc": 0.0102, "test_loss": 4.665742019653321, "test_acc": 0.01, "lyapunov": 2.0632075443292215, "grad_norm": 0.16746757148328467, "grad_max_sv": 0.05550560392439365, "grad_min_sv": 2.1720126197034665e-45, "grad_condition": 55505603924.393654, "lr": 0.000468604740235343, "time_sec": 177.2460799217224 }, { "epoch": 79, "train_loss": 4.748111321258545, "train_acc": 0.00948, "test_loss": 4.609986500549317, "test_acc": 0.01, "lyapunov": 2.195971542307178, "grad_norm": 0.24040083874318255, "grad_max_sv": 0.05709849054073857, "grad_min_sv": 1.4965270295518628e-39, "grad_condition": 57098490540.73856, "lr": 0.00045816107833384175, "time_sec": 177.27070450782776 }, { "epoch": 80, "train_loss": 4.7519070631408695, "train_acc": 0.0117, "test_loss": 4.627280041503906, "test_acc": 0.01, "lyapunov": 2.2188175566056194, "grad_norm": 0.8805430521303074, "grad_max_sv": 0.057838325266129684, "grad_min_sv": 1.5422340573742856e-42, "grad_condition": 57838325266.129684, "lr": 0.0004477357683661729, "time_sec": 177.29695653915405 }, { "epoch": 81, "train_loss": 4.677329037322998, "train_acc": 0.00938, "test_loss": 4.61901457901001, "test_acc": 0.01, "lyapunov": 1.7923584527066907, "grad_norm": 0.8776582765129182, "grad_max_sv": 0.04953184952028096, "grad_min_sv": 3.503246160812043e-47, "grad_condition": 49531849520.28096, "lr": 0.00043733338321784746, "time_sec": 177.28252363204956 }, { "epoch": 82, "train_loss": 4.649648946685791, "train_acc": 0.00968, "test_loss": 4.616988354492188, "test_acc": 0.01, "lyapunov": 1.636922500627425, "grad_norm": 1.3865972070708266, "grad_max_sv": 0.01087386254221201, "grad_min_sv": 0.0, "grad_condition": 10873862542.21201, "lr": 0.0004269584857187939, "time_sec": 177.24314332008362 }, { "epoch": 83, "train_loss": 4.642039197845459, "train_acc": 0.00996, "test_loss": 4.614689962768555, "test_acc": 0.01, "lyapunov": 1.5991996630378391, "grad_norm": 1.3716621678192378, "grad_max_sv": 0.018109424225986003, "grad_min_sv": 0.0, "grad_condition": 18109424225.986004, "lr": 0.0004166156266419484, "time_sec": 177.229647397995 }, { "epoch": 84, "train_loss": 4.641844508972168, "train_acc": 0.00878, "test_loss": 4.617015579223633, "test_acc": 0.01, "lyapunov": 1.60060031792087, "grad_norm": 1.3175623049235154, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004063093427071373, "time_sec": 177.2538447380066 }, { "epoch": 85, "train_loss": 4.643175181274414, "train_acc": 0.0094, "test_loss": 4.614698597717285, "test_acc": 0.01, "lyapunov": 1.6059161156339719, "grad_norm": 1.2845631564383488, "grad_max_sv": 0.008081613527610897, "grad_min_sv": 0.0, "grad_condition": 8081613527.610898, "lr": 0.0003960441545911199, "time_sec": 177.20055627822876 }, { "epoch": 86, "train_loss": 4.643574464263916, "train_acc": 0.0098, "test_loss": 4.614707907104492, "test_acc": 0.01, "lyapunov": 1.6075664575752395, "grad_norm": 1.4187544153998444, "grad_max_sv": 0.00905034514144063, "grad_min_sv": 0.0, "grad_condition": 9050345141.440632, "lr": 0.0003858245649446718, "time_sec": 177.21315360069275 }, { "epoch": 87, "train_loss": 4.694294710845948, "train_acc": 0.00954, "test_loss": 4.623233102416992, "test_acc": 0.01, "lyapunov": 1.9175829625190677, "grad_norm": 4.082558395603232, "grad_max_sv": 0.02438779656608254, "grad_min_sv": 6.337662028039815e-35, "grad_condition": 24387796566.082542, "lr": 0.00037565505641757235, "time_sec": 177.25639843940735 }, { "epoch": 88, "train_loss": 4.717588612060547, "train_acc": 0.01098, "test_loss": 4.654013455200196, "test_acc": 0.01, "lyapunov": 2.087744262822144, "grad_norm": 0.17835559132091938, "grad_max_sv": 0.07744973180815577, "grad_min_sv": 2.3523356446513927e-16, "grad_condition": 77434631231.10988, "lr": 0.00036554008969236695, "time_sec": 177.38599228858948 }, { "epoch": 89, "train_loss": 4.734110566711426, "train_acc": 0.0155, "test_loss": 4.653230757141113, "test_acc": 0.01, "lyapunov": 2.1995491454058596, "grad_norm": 0.13356986466644585, "grad_max_sv": 0.0670669173821807, "grad_min_sv": 2.875717693613099e-34, "grad_condition": 67066917382.18069, "lr": 0.0003554841015277638, "time_sec": 177.2775719165802 }, { "epoch": 90, "train_loss": 4.692502493743897, "train_acc": 0.01608, "test_loss": 4.685703827667236, "test_acc": 0.01, "lyapunov": 2.1217137315998906, "grad_norm": 0.18454505411948288, "grad_max_sv": 0.09909263849258423, "grad_min_sv": 9.485088852608362e-15, "grad_condition": 98142092685.66644, "lr": 0.000345491502812526, "time_sec": 177.33423161506653 }, { "epoch": 91, "train_loss": 4.689375361785888, "train_acc": 0.01532, "test_loss": 5.054153802490235, "test_acc": 0.01, "lyapunov": 2.080054032528187, "grad_norm": 0.5188803350503319, "grad_max_sv": 0.1383956030011177, "grad_min_sv": 3.288818752125065e-14, "grad_condition": 133990904819.13261, "lr": 0.0003355666766307081, "time_sec": 177.33309030532837 }, { "epoch": 92, "train_loss": 4.63797587173462, "train_acc": 0.01862, "test_loss": 4.71228084487915, "test_acc": 0.01, "lyapunov": 2.1218495975674876, "grad_norm": 0.6784268973745995, "grad_max_sv": 0.1671210890635848, "grad_min_sv": 7.533849064621124e-14, "grad_condition": 156896122443.4754, "lr": 0.00032571397633909225, "time_sec": 177.35465455055237 }, { "epoch": 93, "train_loss": 4.629223160095215, "train_acc": 0.0201, "test_loss": 4.768279981994629, "test_acc": 0.01, "lyapunov": 2.231684987807213, "grad_norm": 0.2698404719461384, "grad_max_sv": 0.1522567519918084, "grad_min_sv": 2.610390891244236e-13, "grad_condition": 128146800497.54839, "lr": 0.00031593772365766094, "time_sec": 177.41608834266663 }, { "epoch": 94, "train_loss": 4.672454256744385, "train_acc": 0.0155, "test_loss": 4.625922811889648, "test_acc": 0.01, "lyapunov": 2.0642213479942066, "grad_norm": 1.2838784932252858, "grad_max_sv": 0.1068689662408179, "grad_min_sv": 3.5497216486826963e-13, "grad_condition": 81702903527.8157, "lr": 0.0003062422067739483, "time_sec": 177.35895490646362 }, { "epoch": 95, "train_loss": 4.682060436248779, "train_acc": 0.01154, "test_loss": 5.053488528442383, "test_acc": 0.01, "lyapunov": 1.908135286377519, "grad_norm": 1.423394417746509, "grad_max_sv": 0.06458842717497518, "grad_min_sv": 2.2284196585027795e-14, "grad_condition": 62761299140.91392, "lr": 0.00029663167846209965, "time_sec": 177.43999791145325 }, { "epoch": 96, "train_loss": 4.64783102355957, "train_acc": 0.0158, "test_loss": 5.105888792419433, "test_acc": 0.01, "lyapunov": 1.9445471297139707, "grad_norm": 0.21161345330658576, "grad_max_sv": 0.09921222645789385, "grad_min_sv": 5.191301724766352e-14, "grad_condition": 94303871341.31389, "lr": 0.00028711035421746345, "time_sec": 177.3871088027954 }, { "epoch": 97, "train_loss": 4.619986424102783, "train_acc": 0.01798, "test_loss": 4.954860754394531, "test_acc": 0.01, "lyapunov": 1.9772856226357658, "grad_norm": 0.22380684108271168, "grad_max_sv": 0.10661779213696718, "grad_min_sv": 6.269415747523095e-14, "grad_condition": 100907105733.10144, "lr": 0.00027768241040753615, "time_sec": 177.3668417930603 }, { "epoch": 98, "train_loss": 4.708672041168213, "train_acc": 0.01462, "test_loss": 5.008634625244141, "test_acc": 0.01, "lyapunov": 2.0945300257114496, "grad_norm": 1.4979433862072131, "grad_max_sv": 0.09214200942307252, "grad_min_sv": 8.393969521570709e-14, "grad_condition": 84461106378.82773, "lr": 0.00026835198244006903, "time_sec": 177.33356857299805 }, { "epoch": 99, "train_loss": 4.692991460723877, "train_acc": 0.01672, "test_loss": 4.888367279052734, "test_acc": 0.01, "lyapunov": 2.20108045184094, "grad_norm": 0.385891368064135, "grad_max_sv": 0.11020931415259838, "grad_min_sv": 4.014219483338492e-13, "grad_condition": 88357297169.3239, "lr": 0.0002591231629491421, "time_sec": 177.36116933822632 }, { "epoch": 100, "train_loss": 4.679412184295654, "train_acc": 0.01748, "test_loss": 4.801361751556397, "test_acc": 0.01, "lyapunov": 2.1626759752288196, "grad_norm": 0.29188655689728976, "grad_max_sv": 0.10528047941625118, "grad_min_sv": 7.079886157137732e-13, "grad_condition": 70271036997.56067, "lr": 0.0002499999999999997, "time_sec": 177.36359167099 }, { "epoch": 101, "train_loss": 4.670090843048095, "train_acc": 0.01908, "test_loss": 4.845812666320801, "test_acc": 0.01, "lyapunov": 2.191265623282898, "grad_norm": 0.2721459181488543, "grad_max_sv": 0.11140938717871904, "grad_min_sv": 9.673542537562727e-13, "grad_condition": 69811952897.07645, "lr": 0.00024098649531343477, "time_sec": 177.350919008255 }, { "epoch": 102, "train_loss": 4.7038639653015135, "train_acc": 0.01622, "test_loss": 4.827154957580566, "test_acc": 0.01, "lyapunov": 2.236257368036548, "grad_norm": 0.37089976502154626, "grad_max_sv": 0.10384687632322312, "grad_min_sv": 6.884885540002143e-13, "grad_condition": 72812162645.31807, "lr": 0.0002320866025105016, "time_sec": 177.35117840766907 }, { "epoch": 103, "train_loss": 4.815245042877197, "train_acc": 0.01124, "test_loss": 4.606607830810547, "test_acc": 0.01, "lyapunov": 2.2844167551421144, "grad_norm": 4.100047695451907, "grad_max_sv": 0.05260885274793026, "grad_min_sv": 1.3802032362544088e-13, "grad_condition": 46932354731.69929, "lr": 0.0002233042253783278, "time_sec": 177.36591219902039 }, { "epoch": 104, "train_loss": 4.874257210388183, "train_acc": 0.0107, "test_loss": 4.615321169281006, "test_acc": 0.01, "lyapunov": 2.5303738708691217, "grad_norm": 4.641557506783305, "grad_max_sv": 0.04989699286900873, "grad_min_sv": 6.455291206487273e-16, "grad_condition": 49867710747.47777, "lr": 0.000214643216157784, "time_sec": 177.35230231285095 }, { "epoch": 105, "train_loss": 4.723299936981201, "train_acc": 0.01176, "test_loss": 4.638908140563965, "test_acc": 0.01, "lyapunov": 2.0839424148544934, "grad_norm": 1.355378299816155, "grad_max_sv": 0.07086729909481657, "grad_min_sv": 3.4057078840793797e-16, "grad_condition": 70843059990.87044, "lr": 0.00020610737385376332, "time_sec": 177.27781128883362 }, { "epoch": 106, "train_loss": 4.7231269412231445, "train_acc": 0.01514, "test_loss": 4.6237520652771, "test_acc": 0.01, "lyapunov": 2.1920783269740736, "grad_norm": 0.23046249442621652, "grad_max_sv": 0.08427620781585574, "grad_min_sv": 2.6872672205060264e-14, "grad_condition": 82259478658.28171, "lr": 0.00019770044256881242, "time_sec": 177.32385993003845 }, { "epoch": 107, "train_loss": 4.718143957061767, "train_acc": 0.01406, "test_loss": 6.732960067749024, "test_acc": 0.01, "lyapunov": 2.1179436051937017, "grad_norm": 2.388318428417535, "grad_max_sv": 0.06378129383232674, "grad_min_sv": 4.2658139494079437e-14, "grad_condition": 60789693053.35014, "lr": 0.0001894261098608447, "time_sec": 177.3540232181549 }, { "epoch": 108, "train_loss": 4.714431188049317, "train_acc": 0.01334, "test_loss": 4.613714739990234, "test_acc": 0.01, "lyapunov": 2.1213468349803133, "grad_norm": 2.8791461854741613, "grad_max_sv": 0.07117215000674204, "grad_min_sv": 1.694507032491845e-13, "grad_condition": 60059951698.86328, "lr": 0.000181288005125655, "time_sec": 177.47124576568604 }, { "epoch": 109, "train_loss": 4.721813513946533, "train_acc": 0.01472, "test_loss": 4.676416804504394, "test_acc": 0.01, "lyapunov": 2.25968545111244, "grad_norm": 2.212408550707043, "grad_max_sv": 0.07278494546897427, "grad_min_sv": 3.1126578738112443e-13, "grad_condition": 57077814227.08296, "lr": 0.0001732896980049473, "time_sec": 177.3752965927124 }, { "epoch": 110, "train_loss": 4.620515478363037, "train_acc": 0.0199, "test_loss": 4.849770021820069, "test_acc": 0.01, "lyapunov": 2.1241518365757543, "grad_norm": 0.4180712607860875, "grad_max_sv": 0.11002402473702984, "grad_min_sv": 1.172731082199846e-12, "grad_condition": 61549668598.997536, "lr": 0.00016543469682057076, "time_sec": 177.33867812156677 }, { "epoch": 111, "train_loss": 4.623785068969727, "train_acc": 0.0175, "test_loss": 4.637153623199463, "test_acc": 0.01, "lyapunov": 2.0509809773901235, "grad_norm": 0.8463969572958269, "grad_max_sv": 0.11101528165804334, "grad_min_sv": 1.87112152381424e-12, "grad_condition": 53576443216.59273, "lr": 0.00015772644703565552, "time_sec": 177.3645510673523 }, { "epoch": 112, "train_loss": 4.6054680319213865, "train_acc": 0.01996, "test_loss": 4.732485404968262, "test_acc": 0.01, "lyapunov": 1.9695151327820994, "grad_norm": 0.286979599544395, "grad_max_sv": 0.11297413185238839, "grad_min_sv": 1.5087152961486214e-12, "grad_condition": 66174816958.725464, "lr": 0.00015016832974331713, "time_sec": 177.3794810771942 }, { "epoch": 113, "train_loss": 4.6047257371520995, "train_acc": 0.021, "test_loss": 4.738913871765137, "test_acc": 0.01, "lyapunov": 2.0082323267636704, "grad_norm": 0.34791771509662284, "grad_max_sv": 0.11338779628276825, "grad_min_sv": 1.4891821340656678e-12, "grad_condition": 59376578972.79028, "lr": 0.00014276366018359834, "time_sec": 177.3533172607422 }, { "epoch": 114, "train_loss": 4.588227640686035, "train_acc": 0.02222, "test_loss": 4.73422000579834, "test_acc": 0.01, "lyapunov": 2.009492777497567, "grad_norm": 0.35363950275472883, "grad_max_sv": 0.1159886697307229, "grad_min_sv": 1.90550844743669e-12, "grad_condition": 54207670472.89293, "lr": 0.00013551568628929425, "time_sec": 177.36692142486572 }, { "epoch": 115, "train_loss": 4.6900716258239745, "train_acc": 0.01612, "test_loss": 4.658303358459473, "test_acc": 0.01, "lyapunov": 2.135267421412651, "grad_norm": 1.3246217912641853, "grad_max_sv": 0.10598969534124456, "grad_min_sv": 1.3219100092920473e-12, "grad_condition": 61126734552.39955, "lr": 0.00012842758726130276, "time_sec": 177.3328320980072 }, { "epoch": 116, "train_loss": 4.786548847961426, "train_acc": 0.01006, "test_loss": 4.61871778717041, "test_acc": 0.01, "lyapunov": 2.3106003911293986, "grad_norm": 0.20288682229149946, "grad_max_sv": 0.07976289726793766, "grad_min_sv": 9.703750835778777e-14, "grad_condition": 73480681043.72867, "lr": 0.0001215024721741218, "time_sec": 177.3196315765381 }, { "epoch": 117, "train_loss": 4.737495873718261, "train_acc": 0.00978, "test_loss": 5.255185474395752, "test_acc": 0.01, "lyapunov": 2.141355973680306, "grad_norm": 1.2090832667169469, "grad_max_sv": 0.06462649000441803, "grad_min_sv": 4.712035785133647e-14, "grad_condition": 61562797934.37225, "lr": 0.00011474337861210538, "time_sec": 177.3440716266632 }, { "epoch": 118, "train_loss": 4.7640791331481935, "train_acc": 0.01042, "test_loss": 4.606605186462402, "test_acc": 0.01, "lyapunov": 2.2581872031511856, "grad_norm": 1.4638342931368784, "grad_max_sv": 0.06105093636777751, "grad_min_sv": 3.379161065598181e-14, "grad_condition": 58851399772.93186, "lr": 0.00010815327133708009, "time_sec": 177.32141637802124 }, { "epoch": 119, "train_loss": 4.764838110656738, "train_acc": 0.01, "test_loss": 4.609263079833984, "test_acc": 0.01, "lyapunov": 2.2616506915568086, "grad_norm": 1.5774818313640573, "grad_max_sv": 0.05949288122285177, "grad_min_sv": 9.459326270127109e-15, "grad_condition": 58897801267.18583, "lr": 0.00010173504098790182, "time_sec": 177.3150999546051 }, { "epoch": 120, "train_loss": 4.745092378540039, "train_acc": 0.00954, "test_loss": 4.691408560180664, "test_acc": 0.01, "lyapunov": 2.1814588677242894, "grad_norm": 0.9224368099956493, "grad_max_sv": 0.06503358271721853, "grad_min_sv": 6.0891251611874775e-15, "grad_condition": 64617582544.06616, "lr": 9.549150281252629e-05, "time_sec": 177.2845914363861 }, { "epoch": 121, "train_loss": 4.715786669311523, "train_acc": 0.00966, "test_loss": 4.7921840202331545, "test_acc": 0.01, "lyapunov": 2.0026006262625575, "grad_norm": 9.006667150025358, "grad_max_sv": 0.008544169525441167, "grad_min_sv": 2.554875264407016e-15, "grad_condition": 8406179861.052277, "lr": 8.942539543314794e-05, "time_sec": 177.5404670238495 }, { "epoch": 122, "train_loss": 4.728659786224365, "train_acc": 0.01478, "test_loss": 4.716466751098633, "test_acc": 0.01, "lyapunov": 2.2308361682745503, "grad_norm": 2.3677820237911122, "grad_max_sv": 0.08329055261057261, "grad_min_sv": 5.30326773979997e-14, "grad_condition": 78769851023.79935, "lr": 8.353937964495024e-05, "time_sec": 177.3092577457428 }, { "epoch": 123, "train_loss": 4.741206109161377, "train_acc": 0.01406, "test_loss": 4.632773582458496, "test_acc": 0.01, "lyapunov": 2.229069578982985, "grad_norm": 3.8848615316118043, "grad_max_sv": 0.07590833908627041, "grad_min_sv": 3.6579889540451006e-14, "grad_condition": 72297092377.36781, "lr": 7.783603724899243e-05, "time_sec": 177.35984468460083 }, { "epoch": 124, "train_loss": 4.9050667370605465, "train_acc": 0.0107, "test_loss": 4.692931840515136, "test_acc": 0.01, "lyapunov": 2.5950029045724503, "grad_norm": 8.40683796480657, "grad_max_sv": 0.020135342784899812, "grad_min_sv": 1.1905984424824726e-14, "grad_condition": 19073293863.494404, "lr": 7.231786991974666e-05, "time_sec": 177.38076376914978 }, { "epoch": 125, "train_loss": 4.918515665893555, "train_acc": 0.01042, "test_loss": 4.800165419769287, "test_acc": 0.01, "lyapunov": 2.6619165169308556, "grad_norm": 9.502093865016478, "grad_max_sv": 0.0075993670089607775, "grad_min_sv": 1.2921884398822422e-14, "grad_condition": 6651468556.477142, "lr": 6.698729810778072e-05, "time_sec": 177.32155227661133 }, { "epoch": 126, "train_loss": 4.9456257382202145, "train_acc": 0.0101, "test_loss": 4.7986811172485355, "test_acc": 0.01, "lyapunov": 2.735420986209684, "grad_norm": 9.875822964888467, "grad_max_sv": 2.0739924829859918e-08, "grad_min_sv": 1.5032395739436103e-20, "grad_condition": 20739.924347962224, "lr": 6.184665997806817e-05, "time_sec": 177.3872947692871 }, { "epoch": 127, "train_loss": 4.886805105133057, "train_acc": 0.01126, "test_loss": 4.686759169006348, "test_acc": 0.01, "lyapunov": 2.63063982624532, "grad_norm": 7.634737807457953, "grad_max_sv": 0.027599985009449268, "grad_min_sv": 1.635026756284981e-14, "grad_condition": 25865594145.297913, "lr": 5.6898210384392595e-05, "time_sec": 177.42079973220825 }, { "epoch": 128, "train_loss": 4.948583959960938, "train_acc": 0.01006, "test_loss": 4.721134532165527, "test_acc": 0.01, "lyapunov": 2.7480261216078268, "grad_norm": 9.950271022813126, "grad_max_sv": 1.1180130898673368e-08, "grad_min_sv": 9.511312933176111e-21, "grad_condition": 11180.130536020879, "lr": 5.214411988029363e-05, "time_sec": 177.41947960853577 }, { "epoch": 129, "train_loss": 4.9554425132751465, "train_acc": 0.0104, "test_loss": 4.75336584854126, "test_acc": 0.01, "lyapunov": 2.751198763127827, "grad_norm": 9.975110420091031, "grad_max_sv": 0.0031297963534476316, "grad_min_sv": 4.913090963459592e-16, "grad_condition": 3069475100.3614955, "lr": 4.7586473766990294e-05, "time_sec": 177.42596411705017 }, { "epoch": 130, "train_loss": 4.96307178024292, "train_acc": 0.01048, "test_loss": 4.728824792480469, "test_acc": 0.01, "lyapunov": 2.754974961585706, "grad_norm": 9.999999996542677, "grad_max_sv": 6.772306379056181e-09, "grad_min_sv": 1.446285168596469e-20, "grad_condition": 6772.306171552807, "lr": 4.32272711786996e-05, "time_sec": 177.44565844535828 }, { "epoch": 131, "train_loss": 4.956811699676513, "train_acc": 0.0093, "test_loss": 4.750110374450683, "test_acc": 0.01, "lyapunov": 2.7515772535368, "grad_norm": 10.000000073356507, "grad_max_sv": 5.959159604055491e-09, "grad_min_sv": 1.476098261934064e-20, "grad_condition": 5959.1593520792685, "lr": 3.906842420574966e-05, "time_sec": 177.42677664756775 }, { "epoch": 132, "train_loss": 4.9561549958801265, "train_acc": 0.01016, "test_loss": 5.696090490722656, "test_acc": 0.01, "lyapunov": 2.7502345179048038, "grad_norm": 9.999999973626117, "grad_max_sv": 7.992252583702286e-09, "grad_min_sv": 2.4784692224406337e-20, "grad_condition": 7992.2521699460685, "lr": 3.5111757055874305e-05, "time_sec": 177.4220016002655 }, { "epoch": 133, "train_loss": 4.857832619476318, "train_acc": 0.01246, "test_loss": 4.677371379089355, "test_acc": 0.01, "lyapunov": 2.512646475411437, "grad_norm": 7.117012627349442, "grad_max_sv": 0.031855909609874486, "grad_min_sv": 1.649919424059889e-14, "grad_condition": 30285643652.368275, "lr": 3.1359005254054254e-05, "time_sec": 177.3773238658905 }, { "epoch": 134, "train_loss": 4.68506044845581, "train_acc": 0.01548, "test_loss": 4.609123469543457, "test_acc": 0.01, "lyapunov": 2.1184186959815454, "grad_norm": 1.9204167306730333, "grad_max_sv": 0.09412179148760884, "grad_min_sv": 4.6394519786537835e-14, "grad_condition": 89429686329.23029, "lr": 2.7811814881259484e-05, "time_sec": 177.34491610527039 }, { "epoch": 135, "train_loss": 4.681999072875977, "train_acc": 0.01576, "test_loss": 4.83034912109375, "test_acc": 0.01, "lyapunov": 2.150207258551322, "grad_norm": 1.143763847197843, "grad_max_sv": 0.10519317688898003, "grad_min_sv": 5.07688327121443e-14, "grad_condition": 99689376270.31213, "lr": 2.4471741852423218e-05, "time_sec": 177.33815479278564 }, { "epoch": 136, "train_loss": 4.695164921264649, "train_acc": 0.01672, "test_loss": 4.654338619232178, "test_acc": 0.01, "lyapunov": 2.2090382295496322, "grad_norm": 1.1474803627472534, "grad_max_sv": 0.11123525651727122, "grad_min_sv": 9.495798219714258e-14, "grad_condition": 102782907554.42734, "lr": 2.1340251233966362e-05, "time_sec": 177.36866855621338 }, { "epoch": 137, "train_loss": 4.692152431335449, "train_acc": 0.01646, "test_loss": 4.81933528137207, "test_acc": 0.01, "lyapunov": 2.2094227846931007, "grad_norm": 0.6303897036424283, "grad_max_sv": 0.11831559501588344, "grad_min_sv": 8.349289767505628e-14, "grad_condition": 109746710531.71823, "lr": 1.8418716601170932e-05, "time_sec": 177.3661823272705 }, { "epoch": 138, "train_loss": 4.6894233569335935, "train_acc": 0.01706, "test_loss": 4.791972970581055, "test_acc": 0.01, "lyapunov": 2.2000036544507116, "grad_norm": 2.1899555272870477, "grad_max_sv": 0.09350968728547274, "grad_min_sv": 4.120797655506886e-14, "grad_condition": 88843401487.6287, "lr": 1.570841943568445e-05, "time_sec": 177.3641233444214 }, { "epoch": 139, "train_loss": 4.694636091156005, "train_acc": 0.0159, "test_loss": 4.829331467437744, "test_acc": 0.01, "lyapunov": 2.215796913942108, "grad_norm": 0.9784986049838148, "grad_max_sv": 0.12486231978982687, "grad_min_sv": 1.0247936181848821e-13, "grad_condition": 113419375367.18208, "lr": 1.3210548563419845e-05, "time_sec": 177.35728001594543 }, { "epoch": 140, "train_loss": 4.694870633392334, "train_acc": 0.01644, "test_loss": 4.815142876434326, "test_acc": 0.01, "lyapunov": 2.217364390487866, "grad_norm": 1.2916272628863348, "grad_max_sv": 0.11291685290662548, "grad_min_sv": 5.3537487011776554e-14, "grad_condition": 106360741194.21178, "lr": 1.0926199633097203e-05, "time_sec": 177.3576626777649 }, { "epoch": 141, "train_loss": 4.677861398468018, "train_acc": 0.0173, "test_loss": 4.815771765899658, "test_acc": 0.01, "lyapunov": 2.1779102489466555, "grad_norm": 0.8766949577062909, "grad_max_sv": 0.12149501488558231, "grad_min_sv": 8.143102612255778e-14, "grad_condition": 111956733978.91446, "lr": 8.856374635655688e-06, "time_sec": 177.35283827781677 }, { "epoch": 142, "train_loss": 4.686267812042236, "train_acc": 0.01684, "test_loss": 4.823100394439697, "test_acc": 0.01, "lyapunov": 2.227254505962362, "grad_norm": 0.5331148714010232, "grad_max_sv": 0.1205288675238089, "grad_min_sv": 8.176555294007943e-14, "grad_condition": 111062530094.41301, "lr": 7.001981464747503e-06, "time_sec": 177.35118770599365 }, { "epoch": 143, "train_loss": 4.692831365509033, "train_acc": 0.01716, "test_loss": 4.897853678894043, "test_acc": 0.01, "lyapunov": 2.2571963544391913, "grad_norm": 0.6114897960642978, "grad_max_sv": 0.12478593328297125, "grad_min_sv": 8.340670293644858e-14, "grad_condition": 115479694388.34305, "lr": 5.3638335185058295e-06, "time_sec": 177.36120533943176 }, { "epoch": 144, "train_loss": 4.70658299621582, "train_acc": 0.0171, "test_loss": 4.83040984954834, "test_acc": 0.01, "lyapunov": 2.287657803586682, "grad_norm": 0.9510676579378554, "grad_max_sv": 0.1171010570952277, "grad_min_sv": 6.361800175176714e-14, "grad_condition": 109355119446.73831, "lr": 3.942649342761114e-06, "time_sec": 177.34865474700928 }, { "epoch": 145, "train_loss": 4.701995197296142, "train_acc": 0.0173, "test_loss": 4.613565782165527, "test_acc": 0.01, "lyapunov": 2.264257175233358, "grad_norm": 0.8111639031310902, "grad_max_sv": 0.11689584073509067, "grad_min_sv": 7.425262413111732e-14, "grad_condition": 108241392397.88205, "lr": 2.7390523158633524e-06, "time_sec": 177.34988021850586 }, { "epoch": 146, "train_loss": 4.698547594909668, "train_acc": 0.01698, "test_loss": 4.831944055175781, "test_acc": 0.01, "lyapunov": 2.264427444209223, "grad_norm": 0.7687759810394293, "grad_max_sv": 0.11922218743320086, "grad_min_sv": 7.928289197503764e-14, "grad_condition": 110429208233.33487, "lr": 1.7535703752478133e-06, "time_sec": 177.375305891037 }, { "epoch": 147, "train_loss": 4.703107703094482, "train_acc": 0.01644, "test_loss": 4.832024374389649, "test_acc": 0.01, "lyapunov": 2.262833438565969, "grad_norm": 0.8980427547431384, "grad_max_sv": 0.12822539806609132, "grad_min_sv": 9.266738943909007e-14, "grad_condition": 117774825403.93326, "lr": 9.866357858642196e-07, "time_sec": 177.37703728675842 }, { "epoch": 148, "train_loss": 4.694877036437989, "train_acc": 0.01716, "test_loss": 4.741145161437989, "test_acc": 0.01, "lyapunov": 2.2374743762833385, "grad_norm": 1.2386113783762993, "grad_max_sv": 0.13271797422266368, "grad_min_sv": 9.874739286162734e-14, "grad_condition": 121226456943.3418, "lr": 4.38584950570808e-07, "time_sec": 177.3770706653595 }, { "epoch": 149, "train_loss": 4.691502552185058, "train_acc": 0.0184, "test_loss": 4.9060412048339845, "test_acc": 0.01, "lyapunov": 2.2420086558822474, "grad_norm": 1.0935576324459544, "grad_max_sv": 0.1251808095059495, "grad_min_sv": 7.87008918289173e-14, "grad_condition": 115742557747.01627, "lr": 1.096582625772501e-07, "time_sec": 177.38786363601685 }, { "epoch": 150, "train_loss": 4.682859961853027, "train_acc": 0.0175, "test_loss": 4.898887846374512, "test_acc": 0.01, "lyapunov": 2.2194432437877216, "grad_norm": 0.9410314426818256, "grad_max_sv": 0.12126885750057496, "grad_min_sv": 7.283089248142724e-14, "grad_condition": 113197772104.82927, "lr": 0.0, "time_sec": 177.3536741733551 } ] } }