{ "vanilla": { "4": [ { "epoch": 1, "train_loss": 1.87523081199646, "train_acc": 0.3904, "test_loss": 1.3005033981323242, "test_acc": 0.538, "lyapunov": null, "grad_norm": 7.167065437345997, "grad_max_sv": 6.2841449797153475, "grad_min_sv": 2.820393511626662e-07, "grad_condition": 22637653.325481158, "lr": 0.0009997532801828658, "time_sec": 17.83638072013855 }, { "epoch": 2, "train_loss": 1.330778917236328, "train_acc": 0.53242, "test_loss": 1.3051589399337769, "test_acc": 0.5299, "lyapunov": null, "grad_norm": 5.684293544168513, "grad_max_sv": 4.961454087495804, "grad_min_sv": 2.2011614504435783e-07, "grad_condition": 23000049.3006949, "lr": 0.0009990133642141358, "time_sec": 15.308318853378296 }, { "epoch": 3, "train_loss": 1.1224762370300292, "train_acc": 0.59994, "test_loss": 1.1229688482284546, "test_acc": 0.6085, "lyapunov": null, "grad_norm": 4.767601837094887, "grad_max_sv": 4.13027862906456, "grad_min_sv": 1.9442289698190506e-07, "grad_condition": 21218061.296424918, "lr": 0.00099778098230154, "time_sec": 15.306547403335571 }, { "epoch": 4, "train_loss": 0.9929985418510437, "train_acc": 0.6506, "test_loss": 1.0345463452339172, "test_acc": 0.6476, "lyapunov": null, "grad_norm": 4.154534311876162, "grad_max_sv": 3.4217750519514083, "grad_min_sv": 1.738904227721605e-07, "grad_condition": 19945043.08817544, "lr": 0.000996057350657239, "time_sec": 15.302969694137573 }, { "epoch": 5, "train_loss": 0.8976026094818115, "train_acc": 0.68438, "test_loss": 0.8756585054397583, "test_acc": 0.6914, "lyapunov": null, "grad_norm": 3.6333960771107905, "grad_max_sv": 2.9354925364255906, "grad_min_sv": 1.6106242668456615e-07, "grad_condition": 18489046.232839655, "lr": 0.0009938441702975688, "time_sec": 15.317728281021118 }, { "epoch": 6, "train_loss": 0.8413557116317749, "train_acc": 0.70288, "test_loss": 1.0890468210220337, "test_acc": 0.6361, "lyapunov": null, "grad_norm": 3.416502916483722, "grad_max_sv": 2.8772784233093263, "grad_min_sv": 1.524946609876565e-07, "grad_condition": 19017545.32666207, "lr": 0.0009911436253643444, "time_sec": 15.30530047416687 }, { "epoch": 7, "train_loss": 0.780380486125946, "train_acc": 0.72624, "test_loss": 0.7749503490447998, "test_acc": 0.7328, "lyapunov": null, "grad_norm": 3.046069709126096, "grad_max_sv": 2.3629971712827684, "grad_min_sv": 1.380081055657456e-07, "grad_condition": 17149009.230771504, "lr": 0.0009879583809693736, "time_sec": 15.307675838470459 }, { "epoch": 8, "train_loss": 0.7390781346511841, "train_acc": 0.7414, "test_loss": 0.7958005157470703, "test_acc": 0.7277, "lyapunov": null, "grad_norm": 2.7435338958916513, "grad_max_sv": 2.05181370973587, "grad_min_sv": 1.2932217341443675e-07, "grad_condition": 16036517.768211821, "lr": 0.0009842915805643154, "time_sec": 15.307319641113281 }, { "epoch": 9, "train_loss": 0.7052495925521851, "train_acc": 0.75274, "test_loss": 1.0447007677078246, "test_acc": 0.6745, "lyapunov": null, "grad_norm": 2.552586529905072, "grad_max_sv": 2.0337040573358536, "grad_min_sv": 1.2101497901539914e-07, "grad_condition": 16963155.872520845, "lr": 0.0009801468428384714, "time_sec": 15.290063619613647 }, { "epoch": 10, "train_loss": 0.6694383864402771, "train_acc": 0.76588, "test_loss": 0.9462176066398621, "test_acc": 0.6842, "lyapunov": null, "grad_norm": 2.3520331395340692, "grad_max_sv": 1.7684333354234696, "grad_min_sv": 1.1190378259584577e-07, "grad_condition": 15955738.307438832, "lr": 0.0009755282581475767, "time_sec": 15.305615901947021 }, { "epoch": 11, "train_loss": 0.6340117832756043, "train_acc": 0.77878, "test_loss": 0.7613432981491088, "test_acc": 0.7377, "lyapunov": null, "grad_norm": 2.164571307713442, "grad_max_sv": 1.7057331085205079, "grad_min_sv": 1.0792852087604387e-07, "grad_condition": 15783530.208328355, "lr": 0.0009704403844771127, "time_sec": 15.29656457901001 }, { "epoch": 12, "train_loss": 0.6060477030181884, "train_acc": 0.78728, "test_loss": 0.7971237164974213, "test_acc": 0.729, "lyapunov": null, "grad_norm": 1.993298876301324, "grad_max_sv": 1.514353270828724, "grad_min_sv": 1.009763655801521e-07, "grad_condition": 14944755.026175302, "lr": 0.0009648882429441257, "time_sec": 15.30236530303955 }, { "epoch": 13, "train_loss": 0.5870892490005493, "train_acc": 0.79524, "test_loss": 0.8448094959259034, "test_acc": 0.7127, "lyapunov": null, "grad_norm": 1.8629217723116693, "grad_max_sv": 1.3949483826756477, "grad_min_sv": 9.635141964281502e-08, "grad_condition": 14581029.38399595, "lr": 0.0009588773128419905, "time_sec": 15.315025806427002 }, { "epoch": 14, "train_loss": 0.5539195073699951, "train_acc": 0.80644, "test_loss": 0.7561563467979431, "test_acc": 0.7394, "lyapunov": null, "grad_norm": 1.6986166991338625, "grad_max_sv": 1.245494757592678, "grad_min_sv": 8.711651755533012e-08, "grad_condition": 14401234.8235637, "lr": 0.0009524135262330098, "time_sec": 15.308890104293823 }, { "epoch": 15, "train_loss": 0.5333379591941834, "train_acc": 0.8143, "test_loss": 0.6968033623695373, "test_acc": 0.7569, "lyapunov": null, "grad_norm": 1.5656089916965232, "grad_max_sv": 1.1909169003367424, "grad_min_sv": 8.488269482853639e-08, "grad_condition": 14106351.27298153, "lr": 0.0009455032620941839, "time_sec": 15.311123609542847 }, { "epoch": 16, "train_loss": 0.5167095581436157, "train_acc": 0.82042, "test_loss": 0.849514400100708, "test_acc": 0.7133, "lyapunov": null, "grad_norm": 1.496171987836298, "grad_max_sv": 1.0258999049663544, "grad_min_sv": 8.006283778172473e-08, "grad_condition": 12841377.110361751, "lr": 0.0009381533400219318, "time_sec": 15.310609817504883 }, { "epoch": 17, "train_loss": 0.49894729826927187, "train_acc": 0.8262, "test_loss": 0.7154086270809173, "test_acc": 0.7552, "lyapunov": null, "grad_norm": 1.3884031919720434, "grad_max_sv": 0.9819801226258278, "grad_min_sv": 7.953692726658801e-08, "grad_condition": 12477520.833613167, "lr": 0.0009303710135019719, "time_sec": 15.301868200302124 }, { "epoch": 18, "train_loss": 0.4833205630302429, "train_acc": 0.83074, "test_loss": 0.8212436129570008, "test_acc": 0.7372, "lyapunov": null, "grad_norm": 1.322943153444315, "grad_max_sv": 0.9954353883862496, "grad_min_sv": 7.706266931251094e-08, "grad_condition": 12928888.561653998, "lr": 0.0009221639627510076, "time_sec": 15.304028987884521 }, { "epoch": 19, "train_loss": 0.46378349807739255, "train_acc": 0.8371, "test_loss": 0.6447551451683045, "test_acc": 0.789, "lyapunov": null, "grad_norm": 1.231933968586028, "grad_max_sv": 0.7683330580592156, "grad_min_sv": 6.892571695615856e-08, "grad_condition": 11194075.895721275, "lr": 0.000913540287137281, "time_sec": 15.304960489273071 }, { "epoch": 20, "train_loss": 0.44474551233291626, "train_acc": 0.84504, "test_loss": 0.6990101715087891, "test_acc": 0.7693, "lyapunov": null, "grad_norm": 1.1785280692983833, "grad_max_sv": 0.8134334728121757, "grad_min_sv": 6.934622298615523e-08, "grad_condition": 11771827.214910198, "lr": 0.0009045084971874739, "time_sec": 15.309978008270264 }, { "epoch": 21, "train_loss": 0.4328971823978424, "train_acc": 0.8493, "test_loss": 0.605803295135498, "test_acc": 0.7971, "lyapunov": null, "grad_norm": 1.1010893792673297, "grad_max_sv": 0.74788568764925, "grad_min_sv": 6.635127869358826e-08, "grad_condition": 11337903.371089932, "lr": 0.0008950775061878452, "time_sec": 15.304766416549683 }, { "epoch": 22, "train_loss": 0.42013943620681765, "train_acc": 0.85398, "test_loss": 0.6351155483245849, "test_acc": 0.7873, "lyapunov": null, "grad_norm": 1.050275059187082, "grad_max_sv": 0.733056052774191, "grad_min_sv": 6.172693325368073e-08, "grad_condition": 11926578.893480929, "lr": 0.0008852566213878947, "time_sec": 15.304250001907349 }, { "epoch": 23, "train_loss": 0.4068706720542908, "train_acc": 0.85872, "test_loss": 0.6962938892364502, "test_acc": 0.7771, "lyapunov": null, "grad_norm": 1.0041008989601972, "grad_max_sv": 0.6977266952395439, "grad_min_sv": 6.174876086006975e-08, "grad_condition": 11375115.065625418, "lr": 0.0008750555348152298, "time_sec": 15.29546570777893 }, { "epoch": 24, "train_loss": 0.3927080359458923, "train_acc": 0.86198, "test_loss": 0.6316822688102722, "test_acc": 0.797, "lyapunov": null, "grad_norm": 0.9591057928108919, "grad_max_sv": 0.6601924143731595, "grad_min_sv": 5.981677704269828e-08, "grad_condition": 10958128.320144685, "lr": 0.0008644843137107057, "time_sec": 15.319843292236328 }, { "epoch": 25, "train_loss": 0.37991392849445343, "train_acc": 0.8662, "test_loss": 0.7685016389846802, "test_acc": 0.7528, "lyapunov": null, "grad_norm": 0.9185108543931831, "grad_max_sv": 0.5813446715474129, "grad_min_sv": 5.7562914257403006e-08, "grad_condition": 10132723.13073414, "lr": 0.0008535533905932737, "time_sec": 15.314316272735596 }, { "epoch": 26, "train_loss": 0.3740078569984436, "train_acc": 0.86904, "test_loss": 0.6302923937797547, "test_acc": 0.7894, "lyapunov": null, "grad_norm": 0.896823092741051, "grad_max_sv": 0.5897809371352196, "grad_min_sv": 5.612208120453488e-08, "grad_condition": 10555219.724126566, "lr": 0.0008422735529643444, "time_sec": 15.295911312103271 }, { "epoch": 27, "train_loss": 0.35986615454673765, "train_acc": 0.8722, "test_loss": 0.5293433817148209, "test_acc": 0.8255, "lyapunov": null, "grad_norm": 0.8414160526480361, "grad_max_sv": 0.5433246113359929, "grad_min_sv": 5.460546566027347e-08, "grad_condition": 10029361.12551422, "lr": 0.0008306559326618259, "time_sec": 15.296611309051514 }, { "epoch": 28, "train_loss": 0.34749350198745727, "train_acc": 0.87846, "test_loss": 0.6013012096405029, "test_acc": 0.8077, "lyapunov": null, "grad_norm": 0.8012028361027335, "grad_max_sv": 0.5324302047491074, "grad_min_sv": 5.343053706141632e-08, "grad_condition": 9995030.902296156, "lr": 0.0008187119948743449, "time_sec": 15.314170122146606 }, { "epoch": 29, "train_loss": 0.33312201313018797, "train_acc": 0.88212, "test_loss": 0.5545183982849121, "test_acc": 0.8162, "lyapunov": null, "grad_norm": 0.7852771005330633, "grad_max_sv": 0.5164767228066921, "grad_min_sv": 5.198521888516439e-08, "grad_condition": 10107248.49432898, "lr": 0.0008064535268264883, "time_sec": 15.311892986297607 }, { "epoch": 30, "train_loss": 0.3230313647842407, "train_acc": 0.88538, "test_loss": 0.658975659275055, "test_acc": 0.7951, "lyapunov": null, "grad_norm": 0.7620779575769897, "grad_max_sv": 0.5038670122623443, "grad_min_sv": 5.0398949014152095e-08, "grad_condition": 10038873.739317197, "lr": 0.0007938926261462367, "time_sec": 15.305739402770996 }, { "epoch": 31, "train_loss": 0.318023904876709, "train_acc": 0.88796, "test_loss": 0.6099616609573364, "test_acc": 0.8127, "lyapunov": null, "grad_norm": 0.7501021639283835, "grad_max_sv": 0.48214229866862296, "grad_min_sv": 5.136175964537415e-08, "grad_condition": 9343056.264591306, "lr": 0.0007810416889260654, "time_sec": 15.325766324996948 }, { "epoch": 32, "train_loss": 0.31232675287246703, "train_acc": 0.89082, "test_loss": 0.5936648756027222, "test_acc": 0.8109, "lyapunov": null, "grad_norm": 0.7279129448401558, "grad_max_sv": 0.4431505911052227, "grad_min_sv": 4.812153910904726e-08, "grad_condition": 9245973.275864627, "lr": 0.0007679133974894983, "time_sec": 15.317164897918701 }, { "epoch": 33, "train_loss": 0.29341697571754455, "train_acc": 0.8967, "test_loss": 0.5134524160385132, "test_acc": 0.8357, "lyapunov": null, "grad_norm": 0.6884958324446571, "grad_max_sv": 0.4426784858107567, "grad_min_sv": 4.9337259699910875e-08, "grad_condition": 9173234.108017813, "lr": 0.0007545207078751857, "time_sec": 15.312905311584473 }, { "epoch": 34, "train_loss": 0.2897170938873291, "train_acc": 0.89828, "test_loss": 0.5332132309913635, "test_acc": 0.8335, "lyapunov": null, "grad_norm": 0.6750271636840882, "grad_max_sv": 0.4532689817249775, "grad_min_sv": 4.866335441278125e-08, "grad_condition": 9412153.339201316, "lr": 0.0007408768370508577, "time_sec": 15.313745260238647 }, { "epoch": 35, "train_loss": 0.28602589085578917, "train_acc": 0.89756, "test_loss": 0.6111867341041565, "test_acc": 0.8164, "lyapunov": null, "grad_norm": 0.6693786571127541, "grad_max_sv": 0.4255728892982006, "grad_min_sv": 4.737296563916971e-08, "grad_condition": 9020003.170186436, "lr": 0.0007269952498697734, "time_sec": 15.32437539100647 }, { "epoch": 36, "train_loss": 0.2724088624763489, "train_acc": 0.90408, "test_loss": 0.5054482436180114, "test_acc": 0.8387, "lyapunov": null, "grad_norm": 0.6416324201224461, "grad_max_sv": 0.4291106700897217, "grad_min_sv": 4.6136759568327077e-08, "grad_condition": 9385408.654433403, "lr": 0.0007128896457825364, "time_sec": 15.322253704071045 }, { "epoch": 37, "train_loss": 0.26598569943904876, "train_acc": 0.90576, "test_loss": 0.5292941621780396, "test_acc": 0.8315, "lyapunov": null, "grad_norm": 0.6311835178833255, "grad_max_sv": 0.372799988463521, "grad_min_sv": 4.42526025601353e-08, "grad_condition": 8432960.688056583, "lr": 0.0006985739453173903, "time_sec": 15.330822467803955 }, { "epoch": 38, "train_loss": 0.2548411606884003, "train_acc": 0.90972, "test_loss": 0.5889158064842224, "test_acc": 0.8304, "lyapunov": null, "grad_norm": 0.6075907586779873, "grad_max_sv": 0.40464401319622995, "grad_min_sv": 4.5029356776638e-08, "grad_condition": 9144084.308266882, "lr": 0.0006840622763423391, "time_sec": 15.306779623031616 }, { "epoch": 39, "train_loss": 0.2488733386993408, "train_acc": 0.91114, "test_loss": 0.5380938538551331, "test_acc": 0.8325, "lyapunov": null, "grad_norm": 0.6071846116294305, "grad_max_sv": 0.3960565410554409, "grad_min_sv": 4.6051877067299075e-08, "grad_condition": 8601152.95310002, "lr": 0.0006693689601226458, "time_sec": 15.341014862060547 }, { "epoch": 40, "train_loss": 0.24494112944602967, "train_acc": 0.91272, "test_loss": 0.5513611147403717, "test_acc": 0.8299, "lyapunov": null, "grad_norm": 0.592226155692726, "grad_max_sv": 0.3729955680668354, "grad_min_sv": 4.293505284636012e-08, "grad_condition": 8794710.30872355, "lr": 0.0006545084971874737, "time_sec": 15.389995813369751 }, { "epoch": 41, "train_loss": 0.23727083059310913, "train_acc": 0.9153, "test_loss": 0.516801796245575, "test_acc": 0.8461, "lyapunov": null, "grad_norm": 0.5812900748217327, "grad_max_sv": 0.38579080179333686, "grad_min_sv": 4.4259539766500214e-08, "grad_condition": 8748753.244401883, "lr": 0.0006394955530196147, "time_sec": 15.318362474441528 }, { "epoch": 42, "train_loss": 0.22481181490898133, "train_acc": 0.92022, "test_loss": 0.5416705925941467, "test_acc": 0.8322, "lyapunov": null, "grad_norm": 0.5619779097810216, "grad_max_sv": 0.35356797464191914, "grad_min_sv": 4.2614826689657547e-08, "grad_condition": 8335709.16485816, "lr": 0.0006243449435824273, "time_sec": 15.315505743026733 }, { "epoch": 43, "train_loss": 0.22531912160873413, "train_acc": 0.9199, "test_loss": 0.5833574778556824, "test_acc": 0.8338, "lyapunov": null, "grad_norm": 0.557199013327348, "grad_max_sv": 0.33938006646931174, "grad_min_sv": 4.300346327923421e-08, "grad_condition": 7932422.911212927, "lr": 0.0006090716206982714, "time_sec": 15.32206392288208 }, { "epoch": 44, "train_loss": 0.216223452000618, "train_acc": 0.92378, "test_loss": 0.5012358224868775, "test_acc": 0.8491, "lyapunov": null, "grad_norm": 0.5383308349401124, "grad_max_sv": 0.3396204937249422, "grad_min_sv": 4.201267005399245e-08, "grad_condition": 8110585.992247519, "lr": 0.0005936906572928625, "time_sec": 15.314954042434692 }, { "epoch": 45, "train_loss": 0.21238275866508483, "train_acc": 0.92506, "test_loss": 0.5394745681762695, "test_acc": 0.8426, "lyapunov": null, "grad_norm": 0.5338537929467614, "grad_max_sv": 0.34414798244833944, "grad_min_sv": 4.2673109312829635e-08, "grad_condition": 8155102.629835799, "lr": 0.0005782172325201156, "time_sec": 15.313148975372314 }, { "epoch": 46, "train_loss": 0.2043999564409256, "train_acc": 0.9264, "test_loss": 0.4982535705089569, "test_acc": 0.851, "lyapunov": null, "grad_norm": 0.518001070564685, "grad_max_sv": 0.3181751623749733, "grad_min_sv": 4.258852284166892e-08, "grad_condition": 7586177.211236173, "lr": 0.0005626666167821523, "time_sec": 15.31693696975708 }, { "epoch": 47, "train_loss": 0.19748862716674806, "train_acc": 0.93056, "test_loss": 0.511198134803772, "test_acc": 0.8512, "lyapunov": null, "grad_norm": 0.5066091467854666, "grad_max_sv": 0.3097307480871677, "grad_min_sv": 4.0578768167875976e-08, "grad_condition": 7694719.511876054, "lr": 0.0005470541566592572, "time_sec": 15.311876773834229 }, { "epoch": 48, "train_loss": 0.18840614411354065, "train_acc": 0.93296, "test_loss": 0.5223799973011017, "test_acc": 0.8486, "lyapunov": null, "grad_norm": 0.4947799501006328, "grad_max_sv": 0.32398409508168696, "grad_min_sv": 3.967475805666254e-08, "grad_condition": 8181991.0382896485, "lr": 0.0005313952597646569, "time_sec": 15.324450016021729 }, { "epoch": 49, "train_loss": 0.1852111140346527, "train_acc": 0.93434, "test_loss": 0.5372783863067627, "test_acc": 0.8442, "lyapunov": null, "grad_norm": 0.49013002688624263, "grad_max_sv": 0.3128523100167513, "grad_min_sv": 4.042725132435976e-08, "grad_condition": 7786375.414612537, "lr": 0.0005157053795390643, "time_sec": 15.311121940612793 }, { "epoch": 50, "train_loss": 0.17850845782279967, "train_acc": 0.9363, "test_loss": 0.5162768915176391, "test_acc": 0.8514, "lyapunov": null, "grad_norm": 0.4757476361255021, "grad_max_sv": 0.3146433509886265, "grad_min_sv": 3.966314778836022e-08, "grad_condition": 7931529.673702802, "lr": 0.0005000000000000002, "time_sec": 15.3083016872406 }, { "epoch": 51, "train_loss": 0.17266313230514527, "train_acc": 0.9392, "test_loss": 0.5169307453155517, "test_acc": 0.8514, "lyapunov": null, "grad_norm": 0.47267825902613214, "grad_max_sv": 0.30655047073960306, "grad_min_sv": 3.728870501262804e-08, "grad_condition": 8340291.307145154, "lr": 0.00048429462046093607, "time_sec": 15.306477308273315 }, { "epoch": 52, "train_loss": 0.1663313666152954, "train_acc": 0.94122, "test_loss": 0.5442662063598633, "test_acc": 0.8474, "lyapunov": null, "grad_norm": 0.46294043228921017, "grad_max_sv": 0.31195108480751516, "grad_min_sv": 3.8414651104545784e-08, "grad_condition": 8124213.069898104, "lr": 0.0004686047402353435, "time_sec": 15.31308388710022 }, { "epoch": 53, "train_loss": 0.16149800906658174, "train_acc": 0.94246, "test_loss": 0.580558476114273, "test_acc": 0.8416, "lyapunov": null, "grad_norm": 0.4519494684602909, "grad_max_sv": 0.2916812110692263, "grad_min_sv": 3.7287610199499e-08, "grad_condition": 7889287.089630139, "lr": 0.000452945843340743, "time_sec": 15.30961537361145 }, { "epoch": 54, "train_loss": 0.16166152165412903, "train_acc": 0.94208, "test_loss": 0.5555281185150146, "test_acc": 0.8473, "lyapunov": null, "grad_norm": 0.45553329333157905, "grad_max_sv": 0.2948467206209898, "grad_min_sv": 3.7315171308449634e-08, "grad_condition": 7971105.5751351025, "lr": 0.00043733338321784806, "time_sec": 15.302156925201416 }, { "epoch": 55, "train_loss": 0.1565243923521042, "train_acc": 0.94508, "test_loss": 0.5074358646392823, "test_acc": 0.8554, "lyapunov": null, "grad_norm": 0.4482394365745094, "grad_max_sv": 0.2973413269966841, "grad_min_sv": 3.757956048566768e-08, "grad_condition": 8002347.089848238, "lr": 0.0004217827674798847, "time_sec": 15.313871145248413 }, { "epoch": 56, "train_loss": 0.14638519546031953, "train_acc": 0.94786, "test_loss": 0.4880453747272491, "test_acc": 0.8653, "lyapunov": null, "grad_norm": 0.4314707571224286, "grad_max_sv": 0.2860257361084223, "grad_min_sv": 3.907978447514893e-08, "grad_condition": 7325521.391552436, "lr": 0.00040630934270713783, "time_sec": 15.315257549285889 }, { "epoch": 57, "train_loss": 0.14646475307941437, "train_acc": 0.94766, "test_loss": 0.576962650680542, "test_acc": 0.847, "lyapunov": null, "grad_norm": 0.4344661359835185, "grad_max_sv": 0.27631179951131346, "grad_min_sv": 3.824539080987677e-08, "grad_condition": 7229591.786889655, "lr": 0.000390928379301729, "time_sec": 15.307274341583252 }, { "epoch": 58, "train_loss": 0.13712914622783662, "train_acc": 0.95096, "test_loss": 0.577113539648056, "test_acc": 0.8499, "lyapunov": null, "grad_norm": 0.42148317642657124, "grad_max_sv": 0.2975440930575132, "grad_min_sv": 3.797022123386284e-08, "grad_condition": 7915512.058803884, "lr": 0.0003756550564175727, "time_sec": 15.30914568901062 }, { "epoch": 59, "train_loss": 0.13448802095890044, "train_acc": 0.95234, "test_loss": 0.5032788132190704, "test_acc": 0.8625, "lyapunov": null, "grad_norm": 0.4112977684378401, "grad_max_sv": 0.2814919870346785, "grad_min_sv": 3.85102704836271e-08, "grad_condition": 7377336.951999759, "lr": 0.00036050444698038553, "time_sec": 15.317845106124878 }, { "epoch": 60, "train_loss": 0.13363940123558044, "train_acc": 0.952, "test_loss": 0.5432449889659882, "test_acc": 0.854, "lyapunov": null, "grad_norm": 0.4126784436246539, "grad_max_sv": 0.2804244253784418, "grad_min_sv": 3.7023297405625045e-08, "grad_condition": 7621956.91724248, "lr": 0.00034549150281252655, "time_sec": 15.322251796722412 }, { "epoch": 61, "train_loss": 0.12653651702404023, "train_acc": 0.9556, "test_loss": 0.49968673663139346, "test_acc": 0.8678, "lyapunov": null, "grad_norm": 0.4007355103640766, "grad_max_sv": 0.27012523673474786, "grad_min_sv": 3.795508094484035e-08, "grad_condition": 7141541.257203001, "lr": 0.0003306310398773544, "time_sec": 15.314436435699463 }, { "epoch": 62, "train_loss": 0.12188665760755539, "train_acc": 0.9566, "test_loss": 0.5593991501808167, "test_acc": 0.8565, "lyapunov": null, "grad_norm": 0.3921398359098778, "grad_max_sv": 0.27338829450309277, "grad_min_sv": 3.639061785243314e-08, "grad_condition": 7584044.263979311, "lr": 0.00031593772365766127, "time_sec": 15.302758693695068 }, { "epoch": 63, "train_loss": 0.1223608536529541, "train_acc": 0.95622, "test_loss": 0.5149862161636353, "test_acc": 0.8612, "lyapunov": null, "grad_norm": 0.39447951861080405, "grad_max_sv": 0.2628227811306715, "grad_min_sv": 3.7084175330548416e-08, "grad_condition": 7085494.638547185, "lr": 0.0003014260546826097, "time_sec": 15.300389051437378 }, { "epoch": 64, "train_loss": 0.11717436948299408, "train_acc": 0.95768, "test_loss": 0.5029231981754303, "test_acc": 0.8645, "lyapunov": null, "grad_norm": 0.3837842917710247, "grad_max_sv": 0.2503308400511742, "grad_min_sv": 3.676226967286311e-08, "grad_condition": 6852674.209660569, "lr": 0.0002871103542174637, "time_sec": 15.306849479675293 }, { "epoch": 65, "train_loss": 0.1104171419763565, "train_acc": 0.96138, "test_loss": 0.5105278373241424, "test_acc": 0.8621, "lyapunov": null, "grad_norm": 0.37324824392122696, "grad_max_sv": 0.24798878654837608, "grad_min_sv": 3.5933988673519934e-08, "grad_condition": 6928104.161500673, "lr": 0.0002730047501302267, "time_sec": 15.306128978729248 }, { "epoch": 66, "train_loss": 0.11005497314453125, "train_acc": 0.9604, "test_loss": 0.5454881217956543, "test_acc": 0.8593, "lyapunov": null, "grad_norm": 0.3740796827280413, "grad_max_sv": 0.25094335451722144, "grad_min_sv": 3.760543059172505e-08, "grad_condition": 6680130.259128613, "lr": 0.00025912316294914234, "time_sec": 15.311371803283691 }, { "epoch": 67, "train_loss": 0.1054667473077774, "train_acc": 0.96206, "test_loss": 0.5242725006103516, "test_acc": 0.8654, "lyapunov": null, "grad_norm": 0.368892738378212, "grad_max_sv": 0.25266984924674035, "grad_min_sv": 3.633599621188921e-08, "grad_condition": 7013352.02049877, "lr": 0.0002454792921248144, "time_sec": 15.30515193939209 }, { "epoch": 68, "train_loss": 0.10004293047904968, "train_acc": 0.96412, "test_loss": 0.5743433611869811, "test_acc": 0.8538, "lyapunov": null, "grad_norm": 0.3572601369548122, "grad_max_sv": 0.24928448162972927, "grad_min_sv": 3.5534662101710524e-08, "grad_condition": 7054160.907809177, "lr": 0.00023208660251050164, "time_sec": 15.31411099433899 }, { "epoch": 69, "train_loss": 0.09898206293821335, "train_acc": 0.96434, "test_loss": 0.5453432657718659, "test_acc": 0.8647, "lyapunov": null, "grad_norm": 0.3575462219401736, "grad_max_sv": 0.22338325902819633, "grad_min_sv": 3.5619033011968784e-08, "grad_condition": 6388845.433191194, "lr": 0.00021895831107393473, "time_sec": 15.320244789123535 }, { "epoch": 70, "train_loss": 0.09576731202960015, "train_acc": 0.96662, "test_loss": 0.5289871492862701, "test_acc": 0.8673, "lyapunov": null, "grad_norm": 0.3475548635629844, "grad_max_sv": 0.22887863107025624, "grad_min_sv": 3.558577605922153e-08, "grad_condition": 6520932.801253774, "lr": 0.00020610737385376356, "time_sec": 15.312981367111206 }, { "epoch": 71, "train_loss": 0.09435438349246979, "train_acc": 0.96552, "test_loss": 0.5673801244735718, "test_acc": 0.8597, "lyapunov": null, "grad_norm": 0.35002047617094667, "grad_max_sv": 0.24012817665934563, "grad_min_sv": 3.424292120968175e-08, "grad_condition": 7037803.21914607, "lr": 0.00019354647317351177, "time_sec": 15.323097705841064 }, { "epoch": 72, "train_loss": 0.0899286351108551, "train_acc": 0.96766, "test_loss": 0.5408580667495727, "test_acc": 0.8662, "lyapunov": null, "grad_norm": 0.34100528699001653, "grad_max_sv": 0.22443376183509828, "grad_min_sv": 3.460758826179244e-08, "grad_condition": 6548190.204110672, "lr": 0.0001812880051256552, "time_sec": 15.303936243057251 }, { "epoch": 73, "train_loss": 0.08644640971183777, "train_acc": 0.9696, "test_loss": 0.5231532414436341, "test_acc": 0.8687, "lyapunov": null, "grad_norm": 0.3297853844853395, "grad_max_sv": 0.23831307105720043, "grad_min_sv": 3.648763895469642e-08, "grad_condition": 6564265.399345921, "lr": 0.00016934406733817422, "time_sec": 15.323826313018799 }, { "epoch": 74, "train_loss": 0.08675267961740493, "train_acc": 0.96966, "test_loss": 0.531370454120636, "test_acc": 0.8724, "lyapunov": null, "grad_norm": 0.33474921077291964, "grad_max_sv": 0.23228033129125833, "grad_min_sv": 3.54595965035287e-08, "grad_condition": 6646670.669053013, "lr": 0.0001577264470356557, "time_sec": 15.305448532104492 }, { "epoch": 75, "train_loss": 0.08520255417346954, "train_acc": 0.96946, "test_loss": 0.5489996848106384, "test_acc": 0.8629, "lyapunov": null, "grad_norm": 0.333062577424503, "grad_max_sv": 0.23861498832702638, "grad_min_sv": 3.416034828340742e-08, "grad_condition": 7057996.098654354, "lr": 0.00014644660940672634, "time_sec": 15.307157516479492 }, { "epoch": 76, "train_loss": 0.08347911696434021, "train_acc": 0.97006, "test_loss": 0.5250146618843079, "test_acc": 0.8686, "lyapunov": null, "grad_norm": 0.3315871550000043, "grad_max_sv": 0.23978985324501992, "grad_min_sv": 3.5313697566152766e-08, "grad_condition": 6836692.7541990755, "lr": 0.0001355156862892944, "time_sec": 15.2927827835083 }, { "epoch": 77, "train_loss": 0.08182602140903474, "train_acc": 0.97104, "test_loss": 0.5350998015880585, "test_acc": 0.8704, "lyapunov": null, "grad_norm": 0.3273538350101595, "grad_max_sv": 0.23843283373862506, "grad_min_sv": 3.504422023681286e-08, "grad_condition": 6836027.998268524, "lr": 0.00012494446518477025, "time_sec": 15.317047834396362 }, { "epoch": 78, "train_loss": 0.07884973392605782, "train_acc": 0.9722, "test_loss": 0.543610359621048, "test_acc": 0.869, "lyapunov": null, "grad_norm": 0.318085721614815, "grad_max_sv": 0.2306290850043297, "grad_min_sv": 3.51138401910589e-08, "grad_condition": 6598865.01839647, "lr": 0.00011474337861210548, "time_sec": 15.346408605575562 }, { "epoch": 79, "train_loss": 0.07515444636344909, "train_acc": 0.97302, "test_loss": 0.5453424057006836, "test_acc": 0.8685, "lyapunov": null, "grad_norm": 0.30764732453726595, "grad_max_sv": 0.23328058049082756, "grad_min_sv": 3.4018917194345025e-08, "grad_condition": 6898312.859708968, "lr": 0.00010492249381215483, "time_sec": 15.312849998474121 }, { "epoch": 80, "train_loss": 0.07553981874942779, "train_acc": 0.97342, "test_loss": 0.5447598055839539, "test_acc": 0.8687, "lyapunov": null, "grad_norm": 0.3126827627293077, "grad_max_sv": 0.22440926413983106, "grad_min_sv": 3.5051727831358904e-08, "grad_condition": 6508990.801328001, "lr": 9.549150281252637e-05, "time_sec": 15.31579327583313 }, { "epoch": 81, "train_loss": 0.0691981615459919, "train_acc": 0.9767, "test_loss": 0.6010801038742065, "test_acc": 0.8592, "lyapunov": null, "grad_norm": 0.2964655372784287, "grad_max_sv": 0.20926067158579825, "grad_min_sv": 3.334633209561844e-08, "grad_condition": 6336645.734981732, "lr": 8.645971286271918e-05, "time_sec": 15.311565399169922 }, { "epoch": 82, "train_loss": 0.07134237255096436, "train_acc": 0.97564, "test_loss": 0.5511228674888611, "test_acc": 0.8685, "lyapunov": null, "grad_norm": 0.3035210287863858, "grad_max_sv": 0.2166539143770933, "grad_min_sv": 3.444789098416834e-08, "grad_condition": 6316501.5285459785, "lr": 7.78360372489926e-05, "time_sec": 15.321164846420288 }, { "epoch": 83, "train_loss": 0.06894262619018554, "train_acc": 0.97574, "test_loss": 0.5341768414020538, "test_acc": 0.8666, "lyapunov": null, "grad_norm": 0.3006016750160245, "grad_max_sv": 0.214569428935647, "grad_min_sv": 3.390297984573465e-08, "grad_condition": 6347736.579489769, "lr": 6.962898649802815e-05, "time_sec": 15.31421685218811 }, { "epoch": 84, "train_loss": 0.06843596329629421, "train_acc": 0.97558, "test_loss": 0.5208944204807282, "test_acc": 0.8703, "lyapunov": null, "grad_norm": 0.2931609715468412, "grad_max_sv": 0.2041362512856722, "grad_min_sv": 3.608063616766799e-08, "grad_condition": 5852493.960090882, "lr": 6.184665997806824e-05, "time_sec": 15.313952445983887 }, { "epoch": 85, "train_loss": 0.06798111920118331, "train_acc": 0.97708, "test_loss": 0.5408778586387635, "test_acc": 0.869, "lyapunov": null, "grad_norm": 0.2949462881166867, "grad_max_sv": 0.2191694311797619, "grad_min_sv": 3.3161099466383345e-08, "grad_condition": 6683084.915046187, "lr": 5.449673790581613e-05, "time_sec": 15.323522567749023 }, { "epoch": 86, "train_loss": 0.06374187029123306, "train_acc": 0.97854, "test_loss": 0.534241654920578, "test_acc": 0.8701, "lyapunov": null, "grad_norm": 0.28381214745100436, "grad_max_sv": 0.21770549267530442, "grad_min_sv": 3.4639007706616096e-08, "grad_condition": 6392279.068014438, "lr": 4.758647376699034e-05, "time_sec": 15.312573432922363 }, { "epoch": 87, "train_loss": 0.06471459998726845, "train_acc": 0.97748, "test_loss": 0.5297845101356506, "test_acc": 0.8726, "lyapunov": null, "grad_norm": 0.28897487313019665, "grad_max_sv": 0.19332378804683686, "grad_min_sv": 3.343392815935431e-08, "grad_condition": 5824270.640002059, "lr": 4.112268715800956e-05, "time_sec": 15.310936450958252 }, { "epoch": 88, "train_loss": 0.06347171569228173, "train_acc": 0.97814, "test_loss": 0.5321846860408783, "test_acc": 0.8722, "lyapunov": null, "grad_norm": 0.2861217885894181, "grad_max_sv": 0.18890463691204787, "grad_min_sv": 3.443075908826643e-08, "grad_condition": 5578610.167209303, "lr": 3.511175705587434e-05, "time_sec": 15.30883502960205 }, { "epoch": 89, "train_loss": 0.06456126765966415, "train_acc": 0.97732, "test_loss": 0.5306058297157288, "test_acc": 0.8724, "lyapunov": null, "grad_norm": 0.2911671580013793, "grad_max_sv": 0.20169610902667046, "grad_min_sv": 3.3340199756537456e-08, "grad_condition": 6113921.310843622, "lr": 2.9559615522887284e-05, "time_sec": 15.325217247009277 }, { "epoch": 90, "train_loss": 0.05981739419221878, "train_acc": 0.97936, "test_loss": 0.5510406871795654, "test_acc": 0.8698, "lyapunov": null, "grad_norm": 0.27406962038993515, "grad_max_sv": 0.20393476765602828, "grad_min_sv": 3.436182409721766e-08, "grad_condition": 6006804.61096659, "lr": 2.447174185242324e-05, "time_sec": 15.308394432067871 }, { "epoch": 91, "train_loss": 0.05843851445674896, "train_acc": 0.97988, "test_loss": 0.5369569517612457, "test_acc": 0.8726, "lyapunov": null, "grad_norm": 0.270215680703968, "grad_max_sv": 0.19462423361837863, "grad_min_sv": 3.2800926286213895e-08, "grad_condition": 5976870.852957519, "lr": 1.9853157161528526e-05, "time_sec": 15.312544584274292 }, { "epoch": 92, "train_loss": 0.06141342503786087, "train_acc": 0.9789, "test_loss": 0.5492124430656433, "test_acc": 0.8715, "lyapunov": null, "grad_norm": 0.28355491226552393, "grad_max_sv": 0.20141606461256742, "grad_min_sv": 3.389024190170176e-08, "grad_condition": 6025484.075561702, "lr": 1.570841943568452e-05, "time_sec": 15.318751096725464 }, { "epoch": 93, "train_loss": 0.06185958398580551, "train_acc": 0.9791, "test_loss": 0.5353557282447815, "test_acc": 0.8734, "lyapunov": null, "grad_norm": 0.28019086696986784, "grad_max_sv": 0.20358563121408224, "grad_min_sv": 3.4872499954374805e-08, "grad_condition": 5972181.870711091, "lr": 1.204161903062634e-05, "time_sec": 15.310726404190063 }, { "epoch": 94, "train_loss": 0.061077375268936154, "train_acc": 0.97862, "test_loss": 0.5403136486530304, "test_acc": 0.8726, "lyapunov": null, "grad_norm": 0.27793458972654056, "grad_max_sv": 0.21468139700591565, "grad_min_sv": 3.314470546911252e-08, "grad_condition": 6531953.716980138, "lr": 8.85637463565564e-06, "time_sec": 15.322482585906982 }, { "epoch": 95, "train_loss": 0.059067166829109195, "train_acc": 0.9801, "test_loss": 0.5499792334079743, "test_acc": 0.8706, "lyapunov": null, "grad_norm": 0.2726950869177449, "grad_max_sv": 0.1847312103956938, "grad_min_sv": 3.442832863242984e-08, "grad_condition": 5484378.490748374, "lr": 6.155829702431171e-06, "time_sec": 15.331462860107422 }, { "epoch": 96, "train_loss": 0.058869197854995725, "train_acc": 0.97992, "test_loss": 0.5609679688453675, "test_acc": 0.8699, "lyapunov": null, "grad_norm": 0.2733600212103379, "grad_max_sv": 0.203422649204731, "grad_min_sv": 3.4962690476092464e-08, "grad_condition": 5877045.15462194, "lr": 3.942649342761118e-06, "time_sec": 15.318592071533203 }, { "epoch": 97, "train_loss": 0.05934914319038391, "train_acc": 0.97972, "test_loss": 0.5556031215667725, "test_acc": 0.8687, "lyapunov": null, "grad_norm": 0.2765716324142509, "grad_max_sv": 0.1996933190152049, "grad_min_sv": 3.3284164402402895e-08, "grad_condition": 6129925.740326188, "lr": 2.2190176984600023e-06, "time_sec": 15.329679727554321 }, { "epoch": 98, "train_loss": 0.05874215810537338, "train_acc": 0.97992, "test_loss": 0.5451333051681518, "test_acc": 0.8712, "lyapunov": null, "grad_norm": 0.2696205462857481, "grad_max_sv": 0.19026922769844531, "grad_min_sv": 3.324827377859663e-08, "grad_condition": 5756655.141047328, "lr": 9.866357858642206e-07, "time_sec": 15.31182599067688 }, { "epoch": 99, "train_loss": 0.059339061715602874, "train_acc": 0.98046, "test_loss": 0.5511723966598511, "test_acc": 0.8694, "lyapunov": null, "grad_norm": 0.2722387278016211, "grad_max_sv": 0.17949199080467224, "grad_min_sv": 3.178271090753526e-08, "grad_condition": 5671386.367227938, "lr": 2.467198171342e-07, "time_sec": 15.313301801681519 }, { "epoch": 100, "train_loss": 0.05937783687353134, "train_acc": 0.97908, "test_loss": 0.5341217585086823, "test_acc": 0.8723, "lyapunov": null, "grad_norm": 0.275408042809645, "grad_max_sv": 0.19940215721726418, "grad_min_sv": 3.299201711826072e-08, "grad_condition": 6121670.713258359, "lr": 0.0, "time_sec": 15.337401151657104 } ], "8": [ { "epoch": 1, "train_loss": 2.1551968896484377, "train_acc": 0.2953, "test_loss": 1.8477057243347168, "test_acc": 0.3437, "lyapunov": null, "grad_norm": 8.144943624656428, "grad_max_sv": 7.675079941749573, "grad_min_sv": 2.827612160416493e-07, "grad_condition": 28317355.270070046, "lr": 0.0009997532801828658, "time_sec": 32.46485447883606 }, { "epoch": 2, "train_loss": 1.6082625040054321, "train_acc": 0.42284, "test_loss": 1.6673745800018311, "test_acc": 0.406, "lyapunov": null, "grad_norm": 6.065037474589551, "grad_max_sv": 5.5711340546607975, "grad_min_sv": 2.234880795981553e-07, "grad_condition": 25327173.99046154, "lr": 0.0009990133642141358, "time_sec": 32.39758110046387 }, { "epoch": 3, "train_loss": 1.4377277154159547, "train_acc": 0.48488, "test_loss": 1.5402760635375976, "test_acc": 0.4555, "lyapunov": null, "grad_norm": 5.494687491087257, "grad_max_sv": 4.691517299413681, "grad_min_sv": 1.9618108950680835e-07, "grad_condition": 24150344.903272796, "lr": 0.00099778098230154, "time_sec": 32.400826930999756 }, { "epoch": 4, "train_loss": 1.2879639573669435, "train_acc": 0.53716, "test_loss": 1.8371749683380127, "test_acc": 0.4098, "lyapunov": null, "grad_norm": 4.741620609793776, "grad_max_sv": 4.525534170866012, "grad_min_sv": 1.8297150106150184e-07, "grad_condition": 24870782.059164062, "lr": 0.000996057350657239, "time_sec": 32.39713406562805 }, { "epoch": 5, "train_loss": 1.196011114768982, "train_acc": 0.5717, "test_loss": 1.1917746976852417, "test_acc": 0.5662, "lyapunov": null, "grad_norm": 4.225084445671327, "grad_max_sv": 3.8811924695968627, "grad_min_sv": 1.7304786759098079e-07, "grad_condition": 22788363.03168846, "lr": 0.0009938441702975688, "time_sec": 32.39927625656128 }, { "epoch": 6, "train_loss": 1.1017011584854126, "train_acc": 0.60624, "test_loss": 1.2156044723510742, "test_acc": 0.5524, "lyapunov": null, "grad_norm": 3.8500733224578765, "grad_max_sv": 3.3867243230342865, "grad_min_sv": 1.5910630946081028e-07, "grad_condition": 21517993.207089722, "lr": 0.0009911436253643444, "time_sec": 32.41104435920715 }, { "epoch": 7, "train_loss": 1.019956372566223, "train_acc": 0.63884, "test_loss": 1.0341911317825316, "test_acc": 0.6312, "lyapunov": null, "grad_norm": 3.4050623209558424, "grad_max_sv": 2.8642074435949327, "grad_min_sv": 1.3970929391149411e-07, "grad_condition": 20503012.26948414, "lr": 0.0009879583809693736, "time_sec": 32.39900183677673 }, { "epoch": 8, "train_loss": 0.952932172832489, "train_acc": 0.66154, "test_loss": 0.9561027820587158, "test_acc": 0.6654, "lyapunov": null, "grad_norm": 3.069081296040065, "grad_max_sv": 2.5316490083932877, "grad_min_sv": 1.2806189264580325e-07, "grad_condition": 19934874.23822563, "lr": 0.0009842915805643154, "time_sec": 32.39242911338806 }, { "epoch": 9, "train_loss": 0.8849921081352234, "train_acc": 0.68628, "test_loss": 1.0301121936798097, "test_acc": 0.6342, "lyapunov": null, "grad_norm": 2.63645918277651, "grad_max_sv": 2.232751601934433, "grad_min_sv": 1.2227004724252312e-07, "grad_condition": 18401740.489395566, "lr": 0.0009801468428384714, "time_sec": 32.409496545791626 }, { "epoch": 10, "train_loss": 0.8236279186630249, "train_acc": 0.70854, "test_loss": 0.8807288621902466, "test_acc": 0.682, "lyapunov": null, "grad_norm": 2.300239690915013, "grad_max_sv": 1.9658639460802079, "grad_min_sv": 1.1437598530505966e-07, "grad_condition": 17605252.06510754, "lr": 0.0009755282581475767, "time_sec": 32.40023136138916 }, { "epoch": 11, "train_loss": 0.788265288658142, "train_acc": 0.72186, "test_loss": 0.8550062474250794, "test_acc": 0.6904, "lyapunov": null, "grad_norm": 2.12020034951075, "grad_max_sv": 1.6186737358570098, "grad_min_sv": 1.0332133957291489e-07, "grad_condition": 15780748.729030486, "lr": 0.0009704403844771127, "time_sec": 32.40667533874512 }, { "epoch": 12, "train_loss": 0.7433690148735046, "train_acc": 0.73772, "test_loss": 0.8008458862304687, "test_acc": 0.7171, "lyapunov": null, "grad_norm": 1.8897751819834427, "grad_max_sv": 1.448184822499752, "grad_min_sv": 9.324852872083511e-08, "grad_condition": 15545592.26156075, "lr": 0.0009648882429441257, "time_sec": 32.4004065990448 }, { "epoch": 13, "train_loss": 0.7159804575920105, "train_acc": 0.74844, "test_loss": 0.8449424732208252, "test_acc": 0.7107, "lyapunov": null, "grad_norm": 1.7162684736286458, "grad_max_sv": 1.387939277291298, "grad_min_sv": 9.02613965791943e-08, "grad_condition": 15516859.545498159, "lr": 0.0009588773128419905, "time_sec": 32.39161419868469 }, { "epoch": 14, "train_loss": 0.6710689739608765, "train_acc": 0.7652, "test_loss": 0.8030969514846802, "test_acc": 0.7199, "lyapunov": null, "grad_norm": 1.5415310022642745, "grad_max_sv": 1.124143162369728, "grad_min_sv": 7.788519358342683e-08, "grad_condition": 14586378.513744438, "lr": 0.0009524135262330098, "time_sec": 32.40552067756653 }, { "epoch": 15, "train_loss": 0.6438176040267944, "train_acc": 0.77396, "test_loss": 0.7497868657112121, "test_acc": 0.7401, "lyapunov": null, "grad_norm": 1.4186644873786285, "grad_max_sv": 1.0314671725034714, "grad_min_sv": 7.5272734179066e-08, "grad_condition": 13653093.352212925, "lr": 0.0009455032620941839, "time_sec": 32.40474534034729 }, { "epoch": 16, "train_loss": 0.615869576702118, "train_acc": 0.7829, "test_loss": 0.7672984195709228, "test_acc": 0.7337, "lyapunov": null, "grad_norm": 1.2847059491767132, "grad_max_sv": 0.8981582961976529, "grad_min_sv": 7.069710665774664e-08, "grad_condition": 12774971.99569363, "lr": 0.0009381533400219318, "time_sec": 32.411378145217896 }, { "epoch": 17, "train_loss": 0.5916317593765259, "train_acc": 0.79332, "test_loss": 0.6773865149497986, "test_acc": 0.7673, "lyapunov": null, "grad_norm": 1.1905850089737686, "grad_max_sv": 0.8305475980043411, "grad_min_sv": 6.581527465243652e-08, "grad_condition": 12649477.259974267, "lr": 0.0009303710135019719, "time_sec": 32.40375375747681 }, { "epoch": 18, "train_loss": 0.5710988390541076, "train_acc": 0.80148, "test_loss": 0.6730817820549011, "test_acc": 0.7658, "lyapunov": null, "grad_norm": 1.1184745092261044, "grad_max_sv": 0.8092691361904144, "grad_min_sv": 6.20087442726458e-08, "grad_condition": 13237272.581055809, "lr": 0.0009221639627510076, "time_sec": 32.403624534606934 }, { "epoch": 19, "train_loss": 0.5524461611747742, "train_acc": 0.80704, "test_loss": 0.7162760413169861, "test_acc": 0.7602, "lyapunov": null, "grad_norm": 1.023562615452227, "grad_max_sv": 0.6794823326170445, "grad_min_sv": 5.88299432280337e-08, "grad_condition": 11704217.317878243, "lr": 0.000913540287137281, "time_sec": 32.39382600784302 }, { "epoch": 20, "train_loss": 0.5298428584098815, "train_acc": 0.81452, "test_loss": 0.7450216589927673, "test_acc": 0.752, "lyapunov": null, "grad_norm": 0.9359144343942514, "grad_max_sv": 0.5905756287276744, "grad_min_sv": 5.571528873815623e-08, "grad_condition": 10693233.182217773, "lr": 0.0009045084971874739, "time_sec": 32.40094780921936 }, { "epoch": 21, "train_loss": 0.5077325123977661, "train_acc": 0.82174, "test_loss": 0.63943037815094, "test_acc": 0.7812, "lyapunov": null, "grad_norm": 0.8805285251076611, "grad_max_sv": 0.615053903311491, "grad_min_sv": 5.4429192175575734e-08, "grad_condition": 11327012.575821584, "lr": 0.0008950775061878452, "time_sec": 32.38740086555481 }, { "epoch": 22, "train_loss": 0.4933246819114685, "train_acc": 0.8259, "test_loss": 0.718407027053833, "test_acc": 0.7614, "lyapunov": null, "grad_norm": 0.8303617086611039, "grad_max_sv": 0.5229416653513909, "grad_min_sv": 5.0371477122723717e-08, "grad_condition": 10417728.60900723, "lr": 0.0008852566213878947, "time_sec": 32.404406785964966 }, { "epoch": 23, "train_loss": 0.47660592782020567, "train_acc": 0.83498, "test_loss": 0.6119730060577393, "test_acc": 0.7951, "lyapunov": null, "grad_norm": 0.7772569962051041, "grad_max_sv": 0.5228113703429699, "grad_min_sv": 4.883190189985953e-08, "grad_condition": 10840281.592058718, "lr": 0.0008750555348152298, "time_sec": 32.41756844520569 }, { "epoch": 24, "train_loss": 0.4621484722900391, "train_acc": 0.8354, "test_loss": 0.6255874982833862, "test_acc": 0.7921, "lyapunov": null, "grad_norm": 0.7435129116165293, "grad_max_sv": 0.5028938911855221, "grad_min_sv": 4.940657198915232e-08, "grad_condition": 10262672.7433966, "lr": 0.0008644843137107057, "time_sec": 32.40160775184631 }, { "epoch": 25, "train_loss": 0.44543547362804414, "train_acc": 0.84322, "test_loss": 0.6244046552658081, "test_acc": 0.8003, "lyapunov": null, "grad_norm": 0.7057766135770664, "grad_max_sv": 0.45453565418720243, "grad_min_sv": 4.47153126970079e-08, "grad_condition": 10235918.99223967, "lr": 0.0008535533905932737, "time_sec": 32.397634983062744 }, { "epoch": 26, "train_loss": 0.4291659313964844, "train_acc": 0.85028, "test_loss": 0.586253802204132, "test_acc": 0.8053, "lyapunov": null, "grad_norm": 0.6653011352683553, "grad_max_sv": 0.40432176999747754, "grad_min_sv": 4.4079006933372964e-08, "grad_condition": 9263382.4971398, "lr": 0.0008422735529643444, "time_sec": 32.408364057540894 }, { "epoch": 27, "train_loss": 0.41755434021949767, "train_acc": 0.8537, "test_loss": 0.6190900807380676, "test_acc": 0.8031, "lyapunov": null, "grad_norm": 0.634844213604884, "grad_max_sv": 0.38489293307065964, "grad_min_sv": 4.278397165435877e-08, "grad_condition": 9083713.307072137, "lr": 0.0008306559326618259, "time_sec": 32.3781955242157 }, { "epoch": 28, "train_loss": 0.409987173576355, "train_acc": 0.85588, "test_loss": 0.6381987627029418, "test_acc": 0.7967, "lyapunov": null, "grad_norm": 0.6208575070285024, "grad_max_sv": 0.3849256232380867, "grad_min_sv": 4.156698754087529e-08, "grad_condition": 9343591.955088045, "lr": 0.0008187119948743449, "time_sec": 32.424397468566895 }, { "epoch": 29, "train_loss": 0.39254301443099976, "train_acc": 0.86148, "test_loss": 0.6114391220092773, "test_acc": 0.8072, "lyapunov": null, "grad_norm": 0.5930731028782803, "grad_max_sv": 0.35281661339104176, "grad_min_sv": 3.97135552887562e-08, "grad_condition": 8878121.049382607, "lr": 0.0008064535268264883, "time_sec": 32.40766763687134 }, { "epoch": 30, "train_loss": 0.3785347310256958, "train_acc": 0.86726, "test_loss": 0.6049399808883666, "test_acc": 0.811, "lyapunov": null, "grad_norm": 0.5794796026042499, "grad_max_sv": 0.36831745132803917, "grad_min_sv": 4.032110121343635e-08, "grad_condition": 9212028.38827365, "lr": 0.0007938926261462367, "time_sec": 32.40119290351868 }, { "epoch": 31, "train_loss": 0.3689020803642273, "train_acc": 0.87034, "test_loss": 0.6224831011772156, "test_acc": 0.8103, "lyapunov": null, "grad_norm": 0.5518777770693967, "grad_max_sv": 0.34497435614466665, "grad_min_sv": 3.993250263789605e-08, "grad_condition": 8691890.072923485, "lr": 0.0007810416889260654, "time_sec": 32.42319178581238 }, { "epoch": 32, "train_loss": 0.3600490350532532, "train_acc": 0.87378, "test_loss": 0.6563146770000458, "test_acc": 0.7989, "lyapunov": null, "grad_norm": 0.5344416918727563, "grad_max_sv": 0.3161147892475128, "grad_min_sv": 3.79914633530376e-08, "grad_condition": 8391808.948301231, "lr": 0.0007679133974894983, "time_sec": 32.40037226676941 }, { "epoch": 33, "train_loss": 0.3552369830417633, "train_acc": 0.876, "test_loss": 0.5918597935676575, "test_acc": 0.8191, "lyapunov": null, "grad_norm": 0.5223477954823382, "grad_max_sv": 0.32091905549168587, "grad_min_sv": 3.692389771714488e-08, "grad_condition": 8735655.499988783, "lr": 0.0007545207078751857, "time_sec": 32.39385366439819 }, { "epoch": 34, "train_loss": 0.3357627202987671, "train_acc": 0.88192, "test_loss": 0.6601162696361542, "test_acc": 0.8074, "lyapunov": null, "grad_norm": 0.5010170887656177, "grad_max_sv": 0.3139246258884668, "grad_min_sv": 3.658822085306213e-08, "grad_condition": 8606732.681616401, "lr": 0.0007408768370508577, "time_sec": 32.40888476371765 }, { "epoch": 35, "train_loss": 0.32540871870040894, "train_acc": 0.88428, "test_loss": 0.6114396753549576, "test_acc": 0.8112, "lyapunov": null, "grad_norm": 0.4852002465463357, "grad_max_sv": 0.3033136323094368, "grad_min_sv": 3.599271058973841e-08, "grad_condition": 8499862.031601336, "lr": 0.0007269952498697734, "time_sec": 32.40857720375061 }, { "epoch": 36, "train_loss": 0.32421252524375915, "train_acc": 0.8847, "test_loss": 0.6881836595535278, "test_acc": 0.8116, "lyapunov": null, "grad_norm": 0.47585625371919826, "grad_max_sv": 0.28932417593896387, "grad_min_sv": 3.663087517757902e-08, "grad_condition": 7933220.2527872, "lr": 0.0007128896457825364, "time_sec": 32.39529776573181 }, { "epoch": 37, "train_loss": 0.3108924944496155, "train_acc": 0.88942, "test_loss": 0.7008573976516723, "test_acc": 0.8098, "lyapunov": null, "grad_norm": 0.46276747011208014, "grad_max_sv": 0.2795715734362602, "grad_min_sv": 3.448033547570617e-08, "grad_condition": 8262563.079640454, "lr": 0.0006985739453173903, "time_sec": 32.38434648513794 }, { "epoch": 38, "train_loss": 0.31133034090042117, "train_acc": 0.88992, "test_loss": 0.6698009629249573, "test_acc": 0.81, "lyapunov": null, "grad_norm": 0.4586602799362298, "grad_max_sv": 0.2844005227088928, "grad_min_sv": 3.324500559287458e-08, "grad_condition": 8714467.747357922, "lr": 0.0006840622763423391, "time_sec": 32.396021366119385 }, { "epoch": 39, "train_loss": 0.29518098635673523, "train_acc": 0.89552, "test_loss": 0.7677701180458069, "test_acc": 0.7991, "lyapunov": null, "grad_norm": 0.43830085967668675, "grad_max_sv": 0.2725641973316669, "grad_min_sv": 3.3406064270380397e-08, "grad_condition": 8255466.038533419, "lr": 0.0006693689601226458, "time_sec": 32.40195083618164 }, { "epoch": 40, "train_loss": 0.2831247230243683, "train_acc": 0.89996, "test_loss": 0.6842746494293213, "test_acc": 0.8148, "lyapunov": null, "grad_norm": 0.4331819538283316, "grad_max_sv": 0.26449211575090886, "grad_min_sv": 3.399684476157461e-08, "grad_condition": 7879060.46068686, "lr": 0.0006545084971874737, "time_sec": 32.418256521224976 }, { "epoch": 41, "train_loss": 0.27670828733444214, "train_acc": 0.90256, "test_loss": 0.701638517665863, "test_acc": 0.8105, "lyapunov": null, "grad_norm": 0.42402034759846713, "grad_max_sv": 0.26597036607563496, "grad_min_sv": 3.2260157212249396e-08, "grad_condition": 8290157.649110466, "lr": 0.0006394955530196147, "time_sec": 32.40391206741333 }, { "epoch": 42, "train_loss": 0.26722780378341676, "train_acc": 0.90478, "test_loss": 0.676421770954132, "test_acc": 0.8152, "lyapunov": null, "grad_norm": 0.41593559749987674, "grad_max_sv": 0.26356035731732846, "grad_min_sv": 3.2800773563934625e-08, "grad_condition": 8080555.103613043, "lr": 0.0006243449435824273, "time_sec": 32.413851737976074 }, { "epoch": 43, "train_loss": 0.2611290577888489, "train_acc": 0.9069, "test_loss": 0.7091101724147797, "test_acc": 0.8165, "lyapunov": null, "grad_norm": 0.40890139043798995, "grad_max_sv": 0.2530216708779335, "grad_min_sv": 3.0997858102566053e-08, "grad_condition": 8224218.543131987, "lr": 0.0006090716206982714, "time_sec": 32.60969662666321 }, { "epoch": 44, "train_loss": 0.2530948238658905, "train_acc": 0.90982, "test_loss": 0.6961516171455383, "test_acc": 0.8214, "lyapunov": null, "grad_norm": 0.39919304872434885, "grad_max_sv": 0.24201009832322598, "grad_min_sv": 3.264100985056473e-08, "grad_condition": 7496864.741894746, "lr": 0.0005936906572928625, "time_sec": 32.40188717842102 }, { "epoch": 45, "train_loss": 0.23889887328147888, "train_acc": 0.91386, "test_loss": 0.7265622617721558, "test_acc": 0.8196, "lyapunov": null, "grad_norm": 0.39216552760863915, "grad_max_sv": 0.25172842368483545, "grad_min_sv": 3.196390450099784e-08, "grad_condition": 7939664.340514863, "lr": 0.0005782172325201156, "time_sec": 32.40084266662598 }, { "epoch": 46, "train_loss": 0.23805784145355224, "train_acc": 0.91674, "test_loss": 0.6975640031337738, "test_acc": 0.8226, "lyapunov": null, "grad_norm": 0.3825430754006707, "grad_max_sv": 0.23831223957240583, "grad_min_sv": 2.971923072081495e-08, "grad_condition": 8085204.090791678, "lr": 0.0005626666167821523, "time_sec": 32.42257380485535 }, { "epoch": 47, "train_loss": 0.23282361968994142, "train_acc": 0.91824, "test_loss": 0.6992193672657013, "test_acc": 0.8311, "lyapunov": null, "grad_norm": 0.3814486121413188, "grad_max_sv": 0.23424655832350255, "grad_min_sv": 3.104032040290861e-08, "grad_condition": 7643726.892298067, "lr": 0.0005470541566592572, "time_sec": 32.40861511230469 }, { "epoch": 48, "train_loss": 0.22799833922863005, "train_acc": 0.91886, "test_loss": 0.6951349193096161, "test_acc": 0.8282, "lyapunov": null, "grad_norm": 0.38166215011498245, "grad_max_sv": 0.24571430422365664, "grad_min_sv": 3.0606541878697156e-08, "grad_condition": 8099711.568480073, "lr": 0.0005313952597646569, "time_sec": 32.382601499557495 }, { "epoch": 49, "train_loss": 0.21888560410499572, "train_acc": 0.92208, "test_loss": 0.6775056694984436, "test_acc": 0.8377, "lyapunov": null, "grad_norm": 0.3681781600012364, "grad_max_sv": 0.22858488224446774, "grad_min_sv": 3.0608208811955254e-08, "grad_condition": 7499521.525014189, "lr": 0.0005157053795390643, "time_sec": 32.38293170928955 }, { "epoch": 50, "train_loss": 0.2106206985092163, "train_acc": 0.9252, "test_loss": 0.6563802011966705, "test_acc": 0.8396, "lyapunov": null, "grad_norm": 0.36053809946906845, "grad_max_sv": 0.2215539276599884, "grad_min_sv": 2.9670953960447833e-08, "grad_condition": 7567975.97315415, "lr": 0.0005000000000000002, "time_sec": 32.3891761302948 }, { "epoch": 51, "train_loss": 0.19901366895198822, "train_acc": 0.92832, "test_loss": 0.6814763808727264, "test_acc": 0.837, "lyapunov": null, "grad_norm": 0.3509310663538234, "grad_max_sv": 0.21552756875753404, "grad_min_sv": 3.0066001732720335e-08, "grad_condition": 7264544.488552595, "lr": 0.00048429462046093607, "time_sec": 32.41236758232117 }, { "epoch": 52, "train_loss": 0.19969978581905365, "train_acc": 0.9285, "test_loss": 0.6935202028274536, "test_acc": 0.8339, "lyapunov": null, "grad_norm": 0.3520257382758021, "grad_max_sv": 0.22391790114343166, "grad_min_sv": 3.0129751982244104e-08, "grad_condition": 7509087.830538243, "lr": 0.0004686047402353435, "time_sec": 32.39413237571716 }, { "epoch": 53, "train_loss": 0.19100741683721542, "train_acc": 0.93138, "test_loss": 0.686068691778183, "test_acc": 0.8361, "lyapunov": null, "grad_norm": 0.3426294963785598, "grad_max_sv": 0.22632624246180058, "grad_min_sv": 2.9659243594437613e-08, "grad_condition": 7652635.339128266, "lr": 0.000452945843340743, "time_sec": 32.40613842010498 }, { "epoch": 54, "train_loss": 0.18032077651500703, "train_acc": 0.9362, "test_loss": 0.7067575240373611, "test_acc": 0.8336, "lyapunov": null, "grad_norm": 0.3322012382733825, "grad_max_sv": 0.20586859565228224, "grad_min_sv": 2.850985989510946e-08, "grad_condition": 7314687.938871255, "lr": 0.00043733338321784806, "time_sec": 32.4026734828949 }, { "epoch": 55, "train_loss": 0.17773653375148774, "train_acc": 0.93586, "test_loss": 0.7423279015541077, "test_acc": 0.8264, "lyapunov": null, "grad_norm": 0.3304441924446054, "grad_max_sv": 0.21223607212305068, "grad_min_sv": 2.8433270138350508e-08, "grad_condition": 7539548.749518724, "lr": 0.0004217827674798847, "time_sec": 32.404977560043335 }, { "epoch": 56, "train_loss": 0.17266820957183837, "train_acc": 0.93834, "test_loss": 0.7072871742248535, "test_acc": 0.8362, "lyapunov": null, "grad_norm": 0.3213443005744008, "grad_max_sv": 0.20142054706811904, "grad_min_sv": 2.726542889242012e-08, "grad_condition": 7440941.08660387, "lr": 0.00040630934270713783, "time_sec": 32.39922308921814 }, { "epoch": 57, "train_loss": 0.16320502066612244, "train_acc": 0.9411, "test_loss": 0.7605734568834305, "test_acc": 0.8318, "lyapunov": null, "grad_norm": 0.31657510227372176, "grad_max_sv": 0.20284682027995588, "grad_min_sv": 2.7356661469468692e-08, "grad_condition": 7474082.923928386, "lr": 0.000390928379301729, "time_sec": 32.39910292625427 }, { "epoch": 58, "train_loss": 0.15670019901275634, "train_acc": 0.94476, "test_loss": 0.784366103553772, "test_acc": 0.8311, "lyapunov": null, "grad_norm": 0.30805235096734923, "grad_max_sv": 0.20260103438049554, "grad_min_sv": 2.8483807401613605e-08, "grad_condition": 7164125.0338090565, "lr": 0.0003756550564175727, "time_sec": 32.38076663017273 }, { "epoch": 59, "train_loss": 0.1490273987340927, "train_acc": 0.94576, "test_loss": 0.7455846133232117, "test_acc": 0.8376, "lyapunov": null, "grad_norm": 0.303406267580447, "grad_max_sv": 0.19556450732052327, "grad_min_sv": 2.8112297023596967e-08, "grad_condition": 7040746.144049543, "lr": 0.00036050444698038553, "time_sec": 32.39811587333679 }, { "epoch": 60, "train_loss": 0.14525161782741547, "train_acc": 0.94758, "test_loss": 0.7790617815971375, "test_acc": 0.8344, "lyapunov": null, "grad_norm": 0.30155039989577326, "grad_max_sv": 0.19981648530811072, "grad_min_sv": 2.756223151934023e-08, "grad_condition": 7325326.926472412, "lr": 0.00034549150281252655, "time_sec": 32.389100313186646 }, { "epoch": 61, "train_loss": 0.1412713815355301, "train_acc": 0.94936, "test_loss": 0.7642439495563507, "test_acc": 0.836, "lyapunov": null, "grad_norm": 0.29749874721325253, "grad_max_sv": 0.19452713318169118, "grad_min_sv": 2.9010603075363407e-08, "grad_condition": 6769308.704484415, "lr": 0.0003306310398773544, "time_sec": 32.38328981399536 }, { "epoch": 62, "train_loss": 0.1323081604719162, "train_acc": 0.95234, "test_loss": 0.7581991817474365, "test_acc": 0.8398, "lyapunov": null, "grad_norm": 0.29116698502726973, "grad_max_sv": 0.18757329024374486, "grad_min_sv": 2.7799571622466603e-08, "grad_condition": 6802391.979822846, "lr": 0.00031593772365766127, "time_sec": 32.38175868988037 }, { "epoch": 63, "train_loss": 0.12890920341968537, "train_acc": 0.95402, "test_loss": 0.7480168062210083, "test_acc": 0.8421, "lyapunov": null, "grad_norm": 0.286611612578029, "grad_max_sv": 0.1843133084475994, "grad_min_sv": 2.6867626612414597e-08, "grad_condition": 6929516.973504146, "lr": 0.0003014260546826097, "time_sec": 32.42565321922302 }, { "epoch": 64, "train_loss": 0.1265330140542984, "train_acc": 0.9554, "test_loss": 0.8281557668209076, "test_acc": 0.8301, "lyapunov": null, "grad_norm": 0.2827852267700905, "grad_max_sv": 0.18494715746492146, "grad_min_sv": 2.7603675123444305e-08, "grad_condition": 6836444.701068824, "lr": 0.0002871103542174637, "time_sec": 32.41487503051758 }, { "epoch": 65, "train_loss": 0.1179364563369751, "train_acc": 0.95766, "test_loss": 0.8201508460521698, "test_acc": 0.8301, "lyapunov": null, "grad_norm": 0.27559434018913526, "grad_max_sv": 0.1801072470843792, "grad_min_sv": 2.659138749194767e-08, "grad_condition": 6847688.983849314, "lr": 0.0002730047501302267, "time_sec": 32.39773344993591 }, { "epoch": 66, "train_loss": 0.11676965503931046, "train_acc": 0.9583, "test_loss": 0.8626040154457092, "test_acc": 0.8299, "lyapunov": null, "grad_norm": 0.2739785879338369, "grad_max_sv": 0.181886912509799, "grad_min_sv": 2.726705781164185e-08, "grad_condition": 6765344.039900659, "lr": 0.00025912316294914234, "time_sec": 32.3981568813324 }, { "epoch": 67, "train_loss": 0.1134087336063385, "train_acc": 0.95968, "test_loss": 0.8600147367477416, "test_acc": 0.8307, "lyapunov": null, "grad_norm": 0.27359780558028896, "grad_max_sv": 0.17809443082660437, "grad_min_sv": 2.617720586961525e-08, "grad_condition": 6850097.709154141, "lr": 0.0002454792921248144, "time_sec": 32.39709424972534 }, { "epoch": 68, "train_loss": 0.10615333132266998, "train_acc": 0.96164, "test_loss": 0.7972221804141998, "test_acc": 0.8376, "lyapunov": null, "grad_norm": 0.2659183144921437, "grad_max_sv": 0.18308131918311119, "grad_min_sv": 2.689645892672843e-08, "grad_condition": 6797772.602815667, "lr": 0.00023208660251050164, "time_sec": 32.41845703125 }, { "epoch": 69, "train_loss": 0.10183365075588226, "train_acc": 0.9635, "test_loss": 0.826421448802948, "test_acc": 0.8419, "lyapunov": null, "grad_norm": 0.25781252098700996, "grad_max_sv": 0.16897555273026227, "grad_min_sv": 2.6931133589869206e-08, "grad_condition": 6306456.524677806, "lr": 0.00021895831107393473, "time_sec": 32.397175788879395 }, { "epoch": 70, "train_loss": 0.10107698081731796, "train_acc": 0.96376, "test_loss": 0.8561173896312714, "test_acc": 0.831, "lyapunov": null, "grad_norm": 0.25760306881898437, "grad_max_sv": 0.17646125555038453, "grad_min_sv": 2.669760297280277e-08, "grad_condition": 6679362.317952393, "lr": 0.00020610737385376356, "time_sec": 32.403748512268066 }, { "epoch": 71, "train_loss": 0.09157823500394821, "train_acc": 0.9672, "test_loss": 0.819078180027008, "test_acc": 0.8435, "lyapunov": null, "grad_norm": 0.24819829552233322, "grad_max_sv": 0.1644124612212181, "grad_min_sv": 2.60399903861952e-08, "grad_condition": 6357922.646001594, "lr": 0.00019354647317351177, "time_sec": 32.40361571311951 }, { "epoch": 72, "train_loss": 0.09161295493125915, "train_acc": 0.9674, "test_loss": 0.8579238404273987, "test_acc": 0.8382, "lyapunov": null, "grad_norm": 0.2471838058669454, "grad_max_sv": 0.18323104958981276, "grad_min_sv": 2.6274890752020497e-08, "grad_condition": 7043842.298456557, "lr": 0.0001812880051256552, "time_sec": 32.40220522880554 }, { "epoch": 73, "train_loss": 0.08914089821338654, "train_acc": 0.9689, "test_loss": 0.822793147277832, "test_acc": 0.8428, "lyapunov": null, "grad_norm": 0.24800643716145856, "grad_max_sv": 0.17686894070357084, "grad_min_sv": 2.5135920411756273e-08, "grad_condition": 7047438.025677231, "lr": 0.00016934406733817422, "time_sec": 32.38602375984192 }, { "epoch": 74, "train_loss": 0.08674161068916321, "train_acc": 0.96972, "test_loss": 0.9136243630409241, "test_acc": 0.832, "lyapunov": null, "grad_norm": 0.24475644922641637, "grad_max_sv": 0.1730644192546606, "grad_min_sv": 2.701796373294485e-08, "grad_condition": 6442891.2485314775, "lr": 0.0001577264470356557, "time_sec": 32.388394594192505 }, { "epoch": 75, "train_loss": 0.08695965735673905, "train_acc": 0.96928, "test_loss": 0.8845508131980896, "test_acc": 0.8384, "lyapunov": null, "grad_norm": 0.2459968799202821, "grad_max_sv": 0.17426501363515853, "grad_min_sv": 2.6569961386613273e-08, "grad_condition": 6640201.158479671, "lr": 0.00014644660940672634, "time_sec": 32.41233015060425 }, { "epoch": 76, "train_loss": 0.08056579726457595, "train_acc": 0.97162, "test_loss": 0.8616433102607727, "test_acc": 0.843, "lyapunov": null, "grad_norm": 0.2370989720124241, "grad_max_sv": 0.17729146480560304, "grad_min_sv": 2.568868753272113e-08, "grad_condition": 6934864.636315972, "lr": 0.0001355156862892944, "time_sec": 32.40184926986694 }, { "epoch": 77, "train_loss": 0.0778916252565384, "train_acc": 0.97266, "test_loss": 0.8366258358001709, "test_acc": 0.846, "lyapunov": null, "grad_norm": 0.2285631358810043, "grad_max_sv": 0.15610157009214162, "grad_min_sv": 2.4703725332031468e-08, "grad_condition": 6441768.40822393, "lr": 0.00012494446518477025, "time_sec": 32.39042067527771 }, { "epoch": 78, "train_loss": 0.07181410483896733, "train_acc": 0.97442, "test_loss": 0.8555541298389435, "test_acc": 0.8426, "lyapunov": null, "grad_norm": 0.21751467049933892, "grad_max_sv": 0.15433428399264812, "grad_min_sv": 2.665557081726888e-08, "grad_condition": 5918219.605492928, "lr": 0.00011474337861210548, "time_sec": 32.394978523254395 }, { "epoch": 79, "train_loss": 0.07194108392477036, "train_acc": 0.9751, "test_loss": 0.8495045845985413, "test_acc": 0.8448, "lyapunov": null, "grad_norm": 0.22114745807083974, "grad_max_sv": 0.1569668130017817, "grad_min_sv": 2.5639288958601015e-08, "grad_condition": 6206249.934502038, "lr": 0.00010492249381215483, "time_sec": 32.40589165687561 }, { "epoch": 80, "train_loss": 0.07222781093478203, "train_acc": 0.97412, "test_loss": 0.8713514517307281, "test_acc": 0.8394, "lyapunov": null, "grad_norm": 0.22263796587188234, "grad_max_sv": 0.14711420265957714, "grad_min_sv": 2.5633022726623266e-08, "grad_condition": 5761666.097039051, "lr": 9.549150281252637e-05, "time_sec": 32.37701368331909 }, { "epoch": 81, "train_loss": 0.06728733582258224, "train_acc": 0.97644, "test_loss": 0.8841948908805847, "test_acc": 0.8471, "lyapunov": null, "grad_norm": 0.2167084382178911, "grad_max_sv": 0.150007457844913, "grad_min_sv": 2.4493604877662278e-08, "grad_condition": 6166534.410663934, "lr": 8.645971286271918e-05, "time_sec": 32.398573875427246 }, { "epoch": 82, "train_loss": 0.06532315739750862, "train_acc": 0.97664, "test_loss": 0.8479381636619567, "test_acc": 0.8476, "lyapunov": null, "grad_norm": 0.21360344563146125, "grad_max_sv": 0.14955835351720453, "grad_min_sv": 2.5209754284105657e-08, "grad_condition": 5995150.4945804905, "lr": 7.78360372489926e-05, "time_sec": 32.39670705795288 }, { "epoch": 83, "train_loss": 0.06434115768909454, "train_acc": 0.97796, "test_loss": 0.8688706632614136, "test_acc": 0.8462, "lyapunov": null, "grad_norm": 0.208142142739157, "grad_max_sv": 0.14977061534300445, "grad_min_sv": 2.4894345518333694e-08, "grad_condition": 6089831.719725271, "lr": 6.962898649802815e-05, "time_sec": 32.399760007858276 }, { "epoch": 84, "train_loss": 0.06394571399211883, "train_acc": 0.9776, "test_loss": 0.8629561246871948, "test_acc": 0.8473, "lyapunov": null, "grad_norm": 0.2090274768795119, "grad_max_sv": 0.1535501467064023, "grad_min_sv": 2.6076664383367643e-08, "grad_condition": 5914212.49570628, "lr": 6.184665997806824e-05, "time_sec": 32.38430905342102 }, { "epoch": 85, "train_loss": 0.062020836523771286, "train_acc": 0.97872, "test_loss": 0.875181820678711, "test_acc": 0.8453, "lyapunov": null, "grad_norm": 0.2063308108071089, "grad_max_sv": 0.14753851415589453, "grad_min_sv": 2.432188375145472e-08, "grad_condition": 6144261.18306755, "lr": 5.449673790581613e-05, "time_sec": 32.41748404502869 }, { "epoch": 86, "train_loss": 0.06044566638708115, "train_acc": 0.9789, "test_loss": 0.872238347530365, "test_acc": 0.8476, "lyapunov": null, "grad_norm": 0.20133211072179052, "grad_max_sv": 0.148629211448133, "grad_min_sv": 2.4942497534041762e-08, "grad_condition": 6060679.3216307415, "lr": 4.758647376699034e-05, "time_sec": 32.391072273254395 }, { "epoch": 87, "train_loss": 0.061503240056037904, "train_acc": 0.97832, "test_loss": 0.8733239276885987, "test_acc": 0.8431, "lyapunov": null, "grad_norm": 0.2056722075536268, "grad_max_sv": 0.14386752797290683, "grad_min_sv": 2.4274280185920816e-08, "grad_condition": 5915342.2569472315, "lr": 4.112268715800956e-05, "time_sec": 32.393316984176636 }, { "epoch": 88, "train_loss": 0.057686230409145355, "train_acc": 0.98028, "test_loss": 0.9238866704940796, "test_acc": 0.8441, "lyapunov": null, "grad_norm": 0.19849445098013146, "grad_max_sv": 0.14159611044451595, "grad_min_sv": 2.40493778669304e-08, "grad_condition": 5894624.093493214, "lr": 3.511175705587434e-05, "time_sec": 32.38528490066528 }, { "epoch": 89, "train_loss": 0.05870611476659775, "train_acc": 0.9798, "test_loss": 0.8742481526374817, "test_acc": 0.8481, "lyapunov": null, "grad_norm": 0.20012200731407057, "grad_max_sv": 0.15360670480877162, "grad_min_sv": 2.5219260857411995e-08, "grad_condition": 6191506.157967448, "lr": 2.9559615522887284e-05, "time_sec": 32.393001079559326 }, { "epoch": 90, "train_loss": 0.05783582457482815, "train_acc": 0.9801, "test_loss": 0.8813467388153076, "test_acc": 0.8475, "lyapunov": null, "grad_norm": 0.19996222144489287, "grad_max_sv": 0.1403856192715466, "grad_min_sv": 2.448204212690541e-08, "grad_condition": 5742298.053374326, "lr": 2.447174185242324e-05, "time_sec": 32.38493609428406 }, { "epoch": 91, "train_loss": 0.05505133232176304, "train_acc": 0.9811, "test_loss": 0.8983916495323181, "test_acc": 0.8462, "lyapunov": null, "grad_norm": 0.1922888220223182, "grad_max_sv": 0.13430234417319298, "grad_min_sv": 2.4953015476114616e-08, "grad_condition": 5451203.641164561, "lr": 1.9853157161528526e-05, "time_sec": 32.399288177490234 }, { "epoch": 92, "train_loss": 0.05489971268892288, "train_acc": 0.98124, "test_loss": 0.8997103338241577, "test_acc": 0.843, "lyapunov": null, "grad_norm": 0.1914882132186981, "grad_max_sv": 0.13863548981025814, "grad_min_sv": 2.579038138605938e-08, "grad_condition": 5398596.905280545, "lr": 1.570841943568452e-05, "time_sec": 32.40613651275635 }, { "epoch": 93, "train_loss": 0.05393671277284622, "train_acc": 0.9816, "test_loss": 0.8570820412635803, "test_acc": 0.847, "lyapunov": null, "grad_norm": 0.19247907609747256, "grad_max_sv": 0.14507245384156703, "grad_min_sv": 2.4785522878545406e-08, "grad_condition": 5879853.769356969, "lr": 1.204161903062634e-05, "time_sec": 32.38154458999634 }, { "epoch": 94, "train_loss": 0.05565428542852402, "train_acc": 0.98092, "test_loss": 0.8699159992218017, "test_acc": 0.8494, "lyapunov": null, "grad_norm": 0.1950428660443827, "grad_max_sv": 0.15786617370322348, "grad_min_sv": 2.5128920544403855e-08, "grad_condition": 6342900.039114647, "lr": 8.85637463565564e-06, "time_sec": 32.408872842788696 }, { "epoch": 95, "train_loss": 0.0554716275537014, "train_acc": 0.98074, "test_loss": 0.8724354814529419, "test_acc": 0.848, "lyapunov": null, "grad_norm": 0.1953551453056335, "grad_max_sv": 0.14595830552279948, "grad_min_sv": 2.4523609010174142e-08, "grad_condition": 6097998.471070435, "lr": 6.155829702431171e-06, "time_sec": 32.37954640388489 }, { "epoch": 96, "train_loss": 0.055670329051017764, "train_acc": 0.98156, "test_loss": 0.8982214247703553, "test_acc": 0.8452, "lyapunov": null, "grad_norm": 0.19496196662820392, "grad_max_sv": 0.1501585453748703, "grad_min_sv": 2.5934764646962095e-08, "grad_condition": 5869735.378663734, "lr": 3.942649342761118e-06, "time_sec": 32.4021053314209 }, { "epoch": 97, "train_loss": 0.05344248455762863, "train_acc": 0.9813, "test_loss": 0.9114454601287841, "test_acc": 0.8468, "lyapunov": null, "grad_norm": 0.19018664442063118, "grad_max_sv": 0.14032225906848908, "grad_min_sv": 2.502056415387699e-08, "grad_condition": 5745975.090099884, "lr": 2.2190176984600023e-06, "time_sec": 32.38188123703003 }, { "epoch": 98, "train_loss": 0.053135186285972594, "train_acc": 0.9819, "test_loss": 0.869631242275238, "test_acc": 0.8508, "lyapunov": null, "grad_norm": 0.18824134211058935, "grad_max_sv": 0.13075507152825594, "grad_min_sv": 2.4252965857840536e-08, "grad_condition": 5397614.905736231, "lr": 9.866357858642206e-07, "time_sec": 32.386441230773926 }, { "epoch": 99, "train_loss": 0.05097491117954254, "train_acc": 0.983, "test_loss": 0.8943203839302063, "test_acc": 0.8483, "lyapunov": null, "grad_norm": 0.18445756568932634, "grad_max_sv": 0.13804081929847598, "grad_min_sv": 2.4356519201518267e-08, "grad_condition": 5702871.134726013, "lr": 2.467198171342e-07, "time_sec": 32.405375480651855 }, { "epoch": 100, "train_loss": 0.05390245022058487, "train_acc": 0.9809, "test_loss": 0.871891166973114, "test_acc": 0.8498, "lyapunov": null, "grad_norm": 0.1935152752615153, "grad_max_sv": 0.14720266554504632, "grad_min_sv": 2.436729609200938e-08, "grad_condition": 6104513.732861901, "lr": 0.0, "time_sec": 32.40170097351074 } ], "12": [ { "epoch": 1, "train_loss": 2.4167917232513427, "train_acc": 0.21668, "test_loss": 2.5600556365966796, "test_acc": 0.1426, "lyapunov": null, "grad_norm": 8.183371300480916, "grad_max_sv": 7.386911773681641, "grad_min_sv": 2.415331181282454e-07, "grad_condition": 30373000.643941343, "lr": 0.0009997532801828658, "time_sec": 49.45663261413574 }, { "epoch": 2, "train_loss": 1.9079357604217528, "train_acc": 0.31534, "test_loss": 2.481009757232666, "test_acc": 0.1736, "lyapunov": null, "grad_norm": 6.225007320887903, "grad_max_sv": 6.023341983556747, "grad_min_sv": 2.0562342122332212e-07, "grad_condition": 29136429.527644336, "lr": 0.0009990133642141358, "time_sec": 49.483285427093506 }, { "epoch": 3, "train_loss": 1.7475298168945312, "train_acc": 0.36588, "test_loss": 2.8285199867248534, "test_acc": 0.131, "lyapunov": null, "grad_norm": 5.1420950067433004, "grad_max_sv": 4.660892617702484, "grad_min_sv": 1.8032060928874215e-07, "grad_condition": 26358047.987367053, "lr": 0.00099778098230154, "time_sec": 49.57265663146973 }, { "epoch": 4, "train_loss": 1.648739521408081, "train_acc": 0.40166, "test_loss": 2.3356450172424315, "test_acc": 0.1751, "lyapunov": null, "grad_norm": 4.371713821921025, "grad_max_sv": 3.9185040295124054, "grad_min_sv": 1.6463919898512814e-07, "grad_condition": 23923294.770848013, "lr": 0.000996057350657239, "time_sec": 49.45625138282776 }, { "epoch": 5, "train_loss": 1.5810089331436157, "train_acc": 0.4251, "test_loss": 2.673109909439087, "test_acc": 0.1544, "lyapunov": null, "grad_norm": 3.4555186506953595, "grad_max_sv": 2.900471958518028, "grad_min_sv": 1.4436529607309013e-07, "grad_condition": 20173199.710391533, "lr": 0.0009938441702975688, "time_sec": 49.46467709541321 }, { "epoch": 6, "train_loss": 1.5207538050079346, "train_acc": 0.44858, "test_loss": 2.5345509658813477, "test_acc": 0.1699, "lyapunov": null, "grad_norm": 2.64949967993879, "grad_max_sv": 2.2037453174591066, "grad_min_sv": 1.0903019624919352e-07, "grad_condition": 20443245.381738927, "lr": 0.0009911436253643444, "time_sec": 49.46764326095581 }, { "epoch": 7, "train_loss": 1.4697360105133057, "train_acc": 0.46474, "test_loss": 2.8721789810180662, "test_acc": 0.1272, "lyapunov": null, "grad_norm": 2.07791741270765, "grad_max_sv": 1.6007355004549026, "grad_min_sv": 8.760053766820875e-08, "grad_condition": 18373378.661422264, "lr": 0.0009879583809693736, "time_sec": 49.47743082046509 }, { "epoch": 8, "train_loss": 1.4266535543823242, "train_acc": 0.48382, "test_loss": 3.240042792892456, "test_acc": 0.1388, "lyapunov": null, "grad_norm": 1.6671990756280735, "grad_max_sv": 1.2928156778216362, "grad_min_sv": 7.22438866951336e-08, "grad_condition": 18264606.350417227, "lr": 0.0009842915805643154, "time_sec": 49.462923526763916 }, { "epoch": 9, "train_loss": 1.394312504272461, "train_acc": 0.49708, "test_loss": 2.92084864654541, "test_acc": 0.1515, "lyapunov": null, "grad_norm": 1.4501900520177538, "grad_max_sv": 1.0461901366710662, "grad_min_sv": 6.580800739897086e-08, "grad_condition": 16086880.216684576, "lr": 0.0009801468428384714, "time_sec": 49.47783327102661 }, { "epoch": 10, "train_loss": 1.3646438373184204, "train_acc": 0.50782, "test_loss": 2.4641769153594972, "test_acc": 0.2432, "lyapunov": null, "grad_norm": 1.291271889799819, "grad_max_sv": 0.9352933883666992, "grad_min_sv": 6.025941292620019e-08, "grad_condition": 15737334.845315147, "lr": 0.0009755282581475767, "time_sec": 49.47376465797424 }, { "epoch": 11, "train_loss": 1.3376501561355592, "train_acc": 0.51558, "test_loss": 2.9219178497314453, "test_acc": 0.2438, "lyapunov": null, "grad_norm": 1.1555098680383777, "grad_max_sv": 0.7429820895195007, "grad_min_sv": 5.2901568192709195e-08, "grad_condition": 14266011.744750757, "lr": 0.0009704403844771127, "time_sec": 49.47013974189758 }, { "epoch": 12, "train_loss": 1.3112868671417237, "train_acc": 0.5284, "test_loss": 2.74031083946228, "test_acc": 0.2031, "lyapunov": null, "grad_norm": 1.0738955371821308, "grad_max_sv": 0.748549421876669, "grad_min_sv": 4.978303538294426e-08, "grad_condition": 15210211.076616298, "lr": 0.0009648882429441257, "time_sec": 49.46808075904846 }, { "epoch": 13, "train_loss": 1.287481568031311, "train_acc": 0.53728, "test_loss": 3.040859108734131, "test_acc": 0.1924, "lyapunov": null, "grad_norm": 0.9771624206683323, "grad_max_sv": 0.64529999345541, "grad_min_sv": 4.393245678357971e-08, "grad_condition": 14761475.748675447, "lr": 0.0009588773128419905, "time_sec": 49.47308921813965 }, { "epoch": 14, "train_loss": 1.2648405401992797, "train_acc": 0.54502, "test_loss": 2.792311123275757, "test_acc": 0.1915, "lyapunov": null, "grad_norm": 0.9467244901324925, "grad_max_sv": 0.6184789575636387, "grad_min_sv": 4.4816473465658643e-08, "grad_condition": 14165375.345471447, "lr": 0.0009524135262330098, "time_sec": 49.483009815216064 }, { "epoch": 15, "train_loss": 1.241471286087036, "train_acc": 0.55048, "test_loss": 2.3441864311218263, "test_acc": 0.2456, "lyapunov": null, "grad_norm": 0.8759338877958681, "grad_max_sv": 0.5726857863366603, "grad_min_sv": 3.894658555658736e-08, "grad_condition": 14972228.263231587, "lr": 0.0009455032620941839, "time_sec": 49.48427653312683 }, { "epoch": 16, "train_loss": 1.2250818849945069, "train_acc": 0.55916, "test_loss": 2.4376744468688964, "test_acc": 0.2811, "lyapunov": null, "grad_norm": 0.8280125995789305, "grad_max_sv": 0.5269983820617199, "grad_min_sv": 3.957679450827811e-08, "grad_condition": 13458638.5630938, "lr": 0.0009381533400219318, "time_sec": 49.491514921188354 }, { "epoch": 17, "train_loss": 1.2011407931518554, "train_acc": 0.5681, "test_loss": 3.077988208389282, "test_acc": 0.2372, "lyapunov": null, "grad_norm": 0.7903623783049802, "grad_max_sv": 0.5003585621714592, "grad_min_sv": 3.7936934749183135e-08, "grad_condition": 13344237.683557762, "lr": 0.0009303710135019719, "time_sec": 49.4895544052124 }, { "epoch": 18, "train_loss": 1.1899376231193541, "train_acc": 0.57472, "test_loss": 2.3918450389862063, "test_acc": 0.2518, "lyapunov": null, "grad_norm": 0.7718039520215193, "grad_max_sv": 0.47414265275001527, "grad_min_sv": 3.554989529419572e-08, "grad_condition": 13438942.364842063, "lr": 0.0009221639627510076, "time_sec": 49.456658124923706 }, { "epoch": 19, "train_loss": 1.168603648300171, "train_acc": 0.57972, "test_loss": 2.283582151031494, "test_acc": 0.2237, "lyapunov": null, "grad_norm": 0.7146309518059523, "grad_max_sv": 0.4340610824525356, "grad_min_sv": 3.228430212054434e-08, "grad_condition": 13543039.003440287, "lr": 0.000913540287137281, "time_sec": 49.45988321304321 }, { "epoch": 20, "train_loss": 1.151336190109253, "train_acc": 0.58574, "test_loss": 2.2708426193237305, "test_acc": 0.2755, "lyapunov": null, "grad_norm": 0.6983120785552407, "grad_max_sv": 0.4454373300075531, "grad_min_sv": 3.350230577403579e-08, "grad_condition": 13641891.236675229, "lr": 0.0009045084971874739, "time_sec": 49.4855215549469 }, { "epoch": 21, "train_loss": 1.1312933298873902, "train_acc": 0.5941, "test_loss": 2.002239217376709, "test_acc": 0.3398, "lyapunov": null, "grad_norm": 0.6668029786621408, "grad_max_sv": 0.4022377036511898, "grad_min_sv": 3.0301077691419207e-08, "grad_condition": 13290330.075167935, "lr": 0.0008950775061878452, "time_sec": 49.5133171081543 }, { "epoch": 22, "train_loss": 1.1186233515167237, "train_acc": 0.59978, "test_loss": 3.6749740661621093, "test_acc": 0.2938, "lyapunov": null, "grad_norm": 0.6355160393463501, "grad_max_sv": 0.3662328697741032, "grad_min_sv": 2.919807395862506e-08, "grad_condition": 12676455.229119861, "lr": 0.0008852566213878947, "time_sec": 49.47933578491211 }, { "epoch": 23, "train_loss": 1.0992162245941162, "train_acc": 0.60538, "test_loss": 2.2956289947509765, "test_acc": 0.3419, "lyapunov": null, "grad_norm": 0.6289434264719856, "grad_max_sv": 0.3852032497525215, "grad_min_sv": 2.838916279834791e-08, "grad_condition": 13726993.354284357, "lr": 0.0008750555348152298, "time_sec": 49.46930289268494 }, { "epoch": 24, "train_loss": 1.09261875541687, "train_acc": 0.6078, "test_loss": 2.194385333251953, "test_acc": 0.3862, "lyapunov": null, "grad_norm": 0.6127565268862699, "grad_max_sv": 0.3749225478619337, "grad_min_sv": 2.902605293897409e-08, "grad_condition": 12941629.392305708, "lr": 0.0008644843137107057, "time_sec": 49.45948123931885 }, { "epoch": 25, "train_loss": 1.0722477124023437, "train_acc": 0.61656, "test_loss": 2.4663957664489744, "test_acc": 0.3925, "lyapunov": null, "grad_norm": 0.5897825535844798, "grad_max_sv": 0.371936571970582, "grad_min_sv": 2.8421365216857452e-08, "grad_condition": 13252758.329758141, "lr": 0.0008535533905932737, "time_sec": 49.479785442352295 }, { "epoch": 26, "train_loss": 1.0658014038848878, "train_acc": 0.62154, "test_loss": 2.2172969047546385, "test_acc": 0.3602, "lyapunov": null, "grad_norm": 0.5970948959400837, "grad_max_sv": 0.3504005130380392, "grad_min_sv": 2.822866052021311e-08, "grad_condition": 12516728.270259932, "lr": 0.0008422735529643444, "time_sec": 49.46492099761963 }, { "epoch": 27, "train_loss": 1.04928136428833, "train_acc": 0.62394, "test_loss": 2.3098046798706053, "test_acc": 0.3753, "lyapunov": null, "grad_norm": 0.5799982623396496, "grad_max_sv": 0.3511035542935133, "grad_min_sv": 2.871881275012811e-08, "grad_condition": 12420577.990074852, "lr": 0.0008306559326618259, "time_sec": 49.463754177093506 }, { "epoch": 28, "train_loss": 1.033934779319763, "train_acc": 0.6312, "test_loss": 2.5853637130737304, "test_acc": 0.3827, "lyapunov": null, "grad_norm": 0.5626766992798455, "grad_max_sv": 0.3680811390280724, "grad_min_sv": 2.860611223454157e-08, "grad_condition": 13030738.458713688, "lr": 0.0008187119948743449, "time_sec": 49.46650528907776 }, { "epoch": 29, "train_loss": 1.0245469808578491, "train_acc": 0.63318, "test_loss": 2.421029793548584, "test_acc": 0.3777, "lyapunov": null, "grad_norm": 0.540434209171599, "grad_max_sv": 0.33249553516507147, "grad_min_sv": 2.5725369168227985e-08, "grad_condition": 13074923.559065297, "lr": 0.0008064535268264883, "time_sec": 49.46920871734619 }, { "epoch": 30, "train_loss": 1.0157002903938293, "train_acc": 0.63876, "test_loss": 2.5748968841552733, "test_acc": 0.353, "lyapunov": null, "grad_norm": 0.5335667641481916, "grad_max_sv": 0.31497838646173476, "grad_min_sv": 2.4617009453109516e-08, "grad_condition": 12878002.467485525, "lr": 0.0007938926261462367, "time_sec": 49.47658443450928 }, { "epoch": 31, "train_loss": 1.0092763556671143, "train_acc": 0.64072, "test_loss": 2.575096744155884, "test_acc": 0.3689, "lyapunov": null, "grad_norm": 0.5319602288309537, "grad_max_sv": 0.33714523129165175, "grad_min_sv": 2.6278444886784767e-08, "grad_condition": 12997099.648816537, "lr": 0.0007810416889260654, "time_sec": 49.48014044761658 }, { "epoch": 32, "train_loss": 0.9945861617660523, "train_acc": 0.64606, "test_loss": 2.18585274848938, "test_acc": 0.3591, "lyapunov": null, "grad_norm": 0.5207883539385971, "grad_max_sv": 0.30190461575984956, "grad_min_sv": 2.498473832268644e-08, "grad_condition": 12302495.137337226, "lr": 0.0007679133974894983, "time_sec": 49.48141527175903 }, { "epoch": 33, "train_loss": 0.9839789762878418, "train_acc": 0.65072, "test_loss": 2.067453681182861, "test_acc": 0.4015, "lyapunov": null, "grad_norm": 0.5202120303096632, "grad_max_sv": 0.3107115812599659, "grad_min_sv": 2.559975968985384e-08, "grad_condition": 12183076.283694824, "lr": 0.0007545207078751857, "time_sec": 49.50013208389282 }, { "epoch": 34, "train_loss": 0.9741807369995117, "train_acc": 0.6534, "test_loss": 2.3987243717193603, "test_acc": 0.3907, "lyapunov": null, "grad_norm": 0.5156705695841731, "grad_max_sv": 0.3042212676256895, "grad_min_sv": 2.4721938141070156e-08, "grad_condition": 12439098.422273466, "lr": 0.0007408768370508577, "time_sec": 49.4883246421814 }, { "epoch": 35, "train_loss": 0.960876017742157, "train_acc": 0.6604, "test_loss": 2.952223745727539, "test_acc": 0.3772, "lyapunov": null, "grad_norm": 0.49534065997567395, "grad_max_sv": 0.3189103938639164, "grad_min_sv": 2.6160001853625657e-08, "grad_condition": 12245579.759729771, "lr": 0.0007269952498697734, "time_sec": 49.49185800552368 }, { "epoch": 36, "train_loss": 0.9563328867340087, "train_acc": 0.66094, "test_loss": 2.5444390853881838, "test_acc": 0.3748, "lyapunov": null, "grad_norm": 0.5015211388674911, "grad_max_sv": 0.301097634062171, "grad_min_sv": 2.4840815004978368e-08, "grad_condition": 12193384.34751702, "lr": 0.0007128896457825364, "time_sec": 49.473448038101196 }, { "epoch": 37, "train_loss": 0.9456947842597961, "train_acc": 0.66318, "test_loss": 2.8305119338989257, "test_acc": 0.3608, "lyapunov": null, "grad_norm": 0.5027801927119517, "grad_max_sv": 0.3191258400678635, "grad_min_sv": 2.5498967737291876e-08, "grad_condition": 12721385.179239903, "lr": 0.0006985739453173903, "time_sec": 49.47532916069031 }, { "epoch": 38, "train_loss": 0.9344060453033447, "train_acc": 0.66828, "test_loss": 2.3942235221862793, "test_acc": 0.3846, "lyapunov": null, "grad_norm": 0.4893981754322751, "grad_max_sv": 0.27843328677117823, "grad_min_sv": 2.3813316207821345e-08, "grad_condition": 11809731.27063098, "lr": 0.0006840622763423391, "time_sec": 49.466092109680176 }, { "epoch": 39, "train_loss": 0.9299031619262695, "train_acc": 0.6701, "test_loss": 2.5896951622009277, "test_acc": 0.3377, "lyapunov": null, "grad_norm": 0.4877056898105668, "grad_max_sv": 0.2895252756774426, "grad_min_sv": 2.313919011953658e-08, "grad_condition": 12624897.370656734, "lr": 0.0006693689601226458, "time_sec": 49.47689652442932 }, { "epoch": 40, "train_loss": 0.9202397887802124, "train_acc": 0.67222, "test_loss": 2.3479004539489745, "test_acc": 0.3652, "lyapunov": null, "grad_norm": 0.48378803227864736, "grad_max_sv": 0.2827453903853893, "grad_min_sv": 2.3820017647224744e-08, "grad_condition": 11971929.846932925, "lr": 0.0006545084971874737, "time_sec": 49.48384690284729 }, { "epoch": 41, "train_loss": 0.9035198735237122, "train_acc": 0.67674, "test_loss": 2.4544072883605956, "test_acc": 0.4098, "lyapunov": null, "grad_norm": 0.48414477684461676, "grad_max_sv": 0.2927399341017008, "grad_min_sv": 2.5373001699691144e-08, "grad_condition": 11722800.874950778, "lr": 0.0006394955530196147, "time_sec": 49.49253749847412 }, { "epoch": 42, "train_loss": 0.8996260007095337, "train_acc": 0.67922, "test_loss": 2.7968482540130615, "test_acc": 0.3717, "lyapunov": null, "grad_norm": 0.47529519443329865, "grad_max_sv": 0.2862662900239229, "grad_min_sv": 2.4432264433826845e-08, "grad_condition": 11830651.602965241, "lr": 0.0006243449435824273, "time_sec": 49.472256898880005 }, { "epoch": 43, "train_loss": 0.8935702981376648, "train_acc": 0.68226, "test_loss": 2.7968372314453127, "test_acc": 0.3814, "lyapunov": null, "grad_norm": 0.47246322948696845, "grad_max_sv": 0.2997207723557949, "grad_min_sv": 2.4396437803275717e-08, "grad_condition": 12442839.021676019, "lr": 0.0006090716206982714, "time_sec": 49.47343039512634 }, { "epoch": 44, "train_loss": 0.8839340761566162, "train_acc": 0.68406, "test_loss": 2.1332605548858643, "test_acc": 0.4518, "lyapunov": null, "grad_norm": 0.4773353798688752, "grad_max_sv": 0.287653349712491, "grad_min_sv": 2.485683419095608e-08, "grad_condition": 11744954.507169517, "lr": 0.0005936906572928625, "time_sec": 49.483134508132935 }, { "epoch": 45, "train_loss": 0.8809750416755676, "train_acc": 0.6871, "test_loss": 2.3744767669677733, "test_acc": 0.4104, "lyapunov": null, "grad_norm": 0.47171575077424854, "grad_max_sv": 0.2800353281199932, "grad_min_sv": 2.4150169553038835e-08, "grad_condition": 11697732.41688976, "lr": 0.0005782172325201156, "time_sec": 49.47827482223511 }, { "epoch": 46, "train_loss": 0.8651049407958984, "train_acc": 0.69358, "test_loss": 2.6672937103271486, "test_acc": 0.4106, "lyapunov": null, "grad_norm": 0.46225804490680006, "grad_max_sv": 0.2764727082103491, "grad_min_sv": 2.4165243095453092e-08, "grad_condition": 11539194.901861329, "lr": 0.0005626666167821523, "time_sec": 49.482288122177124 }, { "epoch": 47, "train_loss": 0.855909815826416, "train_acc": 0.6953, "test_loss": 2.1082290111541746, "test_acc": 0.4302, "lyapunov": null, "grad_norm": 0.46665587567927413, "grad_max_sv": 0.2777487523853779, "grad_min_sv": 2.3157732442768975e-08, "grad_condition": 12021773.98709596, "lr": 0.0005470541566592572, "time_sec": 49.48243308067322 }, { "epoch": 48, "train_loss": 0.8559737893295288, "train_acc": 0.69554, "test_loss": 2.6735187637329103, "test_acc": 0.3758, "lyapunov": null, "grad_norm": 0.4613852081362787, "grad_max_sv": 0.2753657314926386, "grad_min_sv": 2.358262860546745e-08, "grad_condition": 11826265.97781797, "lr": 0.0005313952597646569, "time_sec": 49.471890687942505 }, { "epoch": 49, "train_loss": 0.8440363460159301, "train_acc": 0.69974, "test_loss": 2.318854873275757, "test_acc": 0.4239, "lyapunov": null, "grad_norm": 0.46468634824792515, "grad_max_sv": 0.2798832211643457, "grad_min_sv": 2.5059412145367333e-08, "grad_condition": 11328180.182026755, "lr": 0.0005157053795390643, "time_sec": 49.46786379814148 }, { "epoch": 50, "train_loss": 0.8407046744155884, "train_acc": 0.69938, "test_loss": 2.2581016651153565, "test_acc": 0.4586, "lyapunov": null, "grad_norm": 0.4552999687027473, "grad_max_sv": 0.27262482419610023, "grad_min_sv": 2.3505009449920066e-08, "grad_condition": 11655869.156098623, "lr": 0.0005000000000000002, "time_sec": 49.46631741523743 }, { "epoch": 51, "train_loss": 0.8328268578910828, "train_acc": 0.70616, "test_loss": 2.021052066421509, "test_acc": 0.4663, "lyapunov": null, "grad_norm": 0.45398371093616957, "grad_max_sv": 0.2551860522478819, "grad_min_sv": 2.261276339510232e-08, "grad_condition": 11423398.903523896, "lr": 0.00048429462046093607, "time_sec": 49.49492907524109 }, { "epoch": 52, "train_loss": 0.8242957615280151, "train_acc": 0.70608, "test_loss": 2.4299042922973633, "test_acc": 0.4339, "lyapunov": null, "grad_norm": 0.4518491350882313, "grad_max_sv": 0.2677639227360487, "grad_min_sv": 2.340493003849531e-08, "grad_condition": 11498272.982724927, "lr": 0.0004686047402353435, "time_sec": 49.47549295425415 }, { "epoch": 53, "train_loss": 0.8202688133239746, "train_acc": 0.70788, "test_loss": 2.0557694828033446, "test_acc": 0.4729, "lyapunov": null, "grad_norm": 0.45155452834894444, "grad_max_sv": 0.2765634849667549, "grad_min_sv": 2.294847063488703e-08, "grad_condition": 12152279.677541133, "lr": 0.000452945843340743, "time_sec": 49.47136735916138 }, { "epoch": 54, "train_loss": 0.8075869009590149, "train_acc": 0.71144, "test_loss": 2.2601095848083497, "test_acc": 0.469, "lyapunov": null, "grad_norm": 0.44703257607115265, "grad_max_sv": 0.28669003024697304, "grad_min_sv": 2.3961542838790707e-08, "grad_condition": 11972426.895574057, "lr": 0.00043733338321784806, "time_sec": 49.472840785980225 }, { "epoch": 55, "train_loss": 0.8038845987319946, "train_acc": 0.71234, "test_loss": 1.9625594703674316, "test_acc": 0.4966, "lyapunov": null, "grad_norm": 0.45158056349279113, "grad_max_sv": 0.2616859499365091, "grad_min_sv": 2.319859899735377e-08, "grad_condition": 11323136.132990547, "lr": 0.0004217827674798847, "time_sec": 49.475728034973145 }, { "epoch": 56, "train_loss": 0.7961191424942017, "train_acc": 0.71566, "test_loss": 2.24710135345459, "test_acc": 0.4678, "lyapunov": null, "grad_norm": 0.45114634744336685, "grad_max_sv": 0.27140378654003144, "grad_min_sv": 2.345107636969601e-08, "grad_condition": 11702309.047382332, "lr": 0.00040630934270713783, "time_sec": 49.46745586395264 }, { "epoch": 57, "train_loss": 0.7886269653129577, "train_acc": 0.71928, "test_loss": 2.332701706314087, "test_acc": 0.4392, "lyapunov": null, "grad_norm": 0.44691251964783024, "grad_max_sv": 0.2512993272393942, "grad_min_sv": 2.3577591501400263e-08, "grad_condition": 10797942.504272973, "lr": 0.000390928379301729, "time_sec": 49.487914085388184 }, { "epoch": 58, "train_loss": 0.7809809253120422, "train_acc": 0.72054, "test_loss": 2.163261636352539, "test_acc": 0.4825, "lyapunov": null, "grad_norm": 0.44707505885973187, "grad_max_sv": 0.27487311884760857, "grad_min_sv": 2.305816853009901e-08, "grad_condition": 11921937.091947556, "lr": 0.0003756550564175727, "time_sec": 49.477548360824585 }, { "epoch": 59, "train_loss": 0.7728579918098449, "train_acc": 0.72464, "test_loss": 2.4211140827178954, "test_acc": 0.4792, "lyapunov": null, "grad_norm": 0.442207932790873, "grad_max_sv": 0.2551064256578684, "grad_min_sv": 2.3925818348757842e-08, "grad_condition": 10733599.660670992, "lr": 0.00036050444698038553, "time_sec": 49.47178077697754 }, { "epoch": 60, "train_loss": 0.7646781494522095, "train_acc": 0.72672, "test_loss": 2.02176361579895, "test_acc": 0.4897, "lyapunov": null, "grad_norm": 0.4430698668925349, "grad_max_sv": 0.26053123250603677, "grad_min_sv": 2.3670396620545377e-08, "grad_condition": 11170288.922506649, "lr": 0.00034549150281252655, "time_sec": 49.46177387237549 }, { "epoch": 61, "train_loss": 0.7588282846641541, "train_acc": 0.7286, "test_loss": 2.670531511688232, "test_acc": 0.4198, "lyapunov": null, "grad_norm": 0.43898999083578233, "grad_max_sv": 0.26667738817632197, "grad_min_sv": 2.325178121154181e-08, "grad_condition": 11623927.174902633, "lr": 0.0003306310398773544, "time_sec": 49.49580407142639 }, { "epoch": 62, "train_loss": 0.7492313718986511, "train_acc": 0.73298, "test_loss": 2.4778705802917482, "test_acc": 0.449, "lyapunov": null, "grad_norm": 0.4417738790617677, "grad_max_sv": 0.2574993997812271, "grad_min_sv": 2.3859390374525445e-08, "grad_condition": 10899105.692467105, "lr": 0.00031593772365766127, "time_sec": 49.486817836761475 }, { "epoch": 63, "train_loss": 0.7480638890266419, "train_acc": 0.73324, "test_loss": 2.1940598976135255, "test_acc": 0.4734, "lyapunov": null, "grad_norm": 0.4366591281226868, "grad_max_sv": 0.2512634038925171, "grad_min_sv": 2.326989370082799e-08, "grad_condition": 10851343.919251464, "lr": 0.0003014260546826097, "time_sec": 49.494584798812866 }, { "epoch": 64, "train_loss": 0.7451907014846801, "train_acc": 0.73538, "test_loss": 2.3143032501220704, "test_acc": 0.4762, "lyapunov": null, "grad_norm": 0.4362314837898005, "grad_max_sv": 0.2649652697145939, "grad_min_sv": 2.3657484859995748e-08, "grad_condition": 11323682.220760768, "lr": 0.0002871103542174637, "time_sec": 49.46461892127991 }, { "epoch": 65, "train_loss": 0.7316487748908996, "train_acc": 0.73868, "test_loss": 2.132633139801025, "test_acc": 0.4893, "lyapunov": null, "grad_norm": 0.43117564557331234, "grad_max_sv": 0.2554838340729475, "grad_min_sv": 2.3040169683241628e-08, "grad_condition": 11170455.423079647, "lr": 0.0002730047501302267, "time_sec": 49.4881227016449 }, { "epoch": 66, "train_loss": 0.7290266520881653, "train_acc": 0.7408, "test_loss": 2.396712022781372, "test_acc": 0.4793, "lyapunov": null, "grad_norm": 0.43225303341958693, "grad_max_sv": 0.2486136831343174, "grad_min_sv": 2.2949348021938932e-08, "grad_condition": 10962824.963370848, "lr": 0.00025912316294914234, "time_sec": 49.47016882896423 }, { "epoch": 67, "train_loss": 0.7191537443733216, "train_acc": 0.74308, "test_loss": 2.1576420639038085, "test_acc": 0.4941, "lyapunov": null, "grad_norm": 0.42657147393758854, "grad_max_sv": 0.2438450776040554, "grad_min_sv": 2.3898531642529975e-08, "grad_condition": 10287595.631951943, "lr": 0.0002454792921248144, "time_sec": 49.49215388298035 }, { "epoch": 68, "train_loss": 0.7169496524429322, "train_acc": 0.74418, "test_loss": 2.4695981254577637, "test_acc": 0.4807, "lyapunov": null, "grad_norm": 0.4234097941028663, "grad_max_sv": 0.24577417597174644, "grad_min_sv": 2.2813544342525915e-08, "grad_condition": 10779009.57251847, "lr": 0.00023208660251050164, "time_sec": 49.531681299209595 }, { "epoch": 69, "train_loss": 0.7072784723091126, "train_acc": 0.74744, "test_loss": 2.27939485244751, "test_acc": 0.4853, "lyapunov": null, "grad_norm": 0.4251678846869415, "grad_max_sv": 0.241105442866683, "grad_min_sv": 2.3618906030975496e-08, "grad_condition": 10243169.91188918, "lr": 0.00021895831107393473, "time_sec": 49.46745848655701 }, { "epoch": 70, "train_loss": 0.7093459980392456, "train_acc": 0.74668, "test_loss": 2.2168941738128662, "test_acc": 0.4993, "lyapunov": null, "grad_norm": 0.4187232599688298, "grad_max_sv": 0.2437821462750435, "grad_min_sv": 2.330924906424059e-08, "grad_condition": 10529543.438680641, "lr": 0.00020610737385376356, "time_sec": 49.46611166000366 }, { "epoch": 71, "train_loss": 0.7046173419761658, "train_acc": 0.74866, "test_loss": 2.6486716678619384, "test_acc": 0.4604, "lyapunov": null, "grad_norm": 0.43152156311922873, "grad_max_sv": 0.26821285113692284, "grad_min_sv": 2.3308388552578663e-08, "grad_condition": 11585490.938807528, "lr": 0.00019354647317351177, "time_sec": 49.484049558639526 }, { "epoch": 72, "train_loss": 0.6916852585601807, "train_acc": 0.75164, "test_loss": 2.4044878028869627, "test_acc": 0.4868, "lyapunov": null, "grad_norm": 0.42974614402520106, "grad_max_sv": 0.2577272642403841, "grad_min_sv": 2.3734259935181968e-08, "grad_condition": 10929944.700492647, "lr": 0.0001812880051256552, "time_sec": 49.47321033477783 }, { "epoch": 73, "train_loss": 0.6914860160255432, "train_acc": 0.75462, "test_loss": 2.459467795562744, "test_acc": 0.4755, "lyapunov": null, "grad_norm": 0.4235499199054343, "grad_max_sv": 0.2499073389917612, "grad_min_sv": 2.312090292555524e-08, "grad_condition": 10928192.758700397, "lr": 0.00016934406733817422, "time_sec": 49.47536325454712 }, { "epoch": 74, "train_loss": 0.6900841831016541, "train_acc": 0.75346, "test_loss": 2.529036985015869, "test_acc": 0.4694, "lyapunov": null, "grad_norm": 0.4200493463432216, "grad_max_sv": 0.24829606115818023, "grad_min_sv": 2.3347005217999595e-08, "grad_condition": 10777473.575533265, "lr": 0.0001577264470356557, "time_sec": 49.47671389579773 }, { "epoch": 75, "train_loss": 0.6844219914627075, "train_acc": 0.75664, "test_loss": 2.7192491188049317, "test_acc": 0.4659, "lyapunov": null, "grad_norm": 0.41891725324120427, "grad_max_sv": 0.2549721471965313, "grad_min_sv": 2.308645701276646e-08, "grad_condition": 11178421.697050892, "lr": 0.00014644660940672634, "time_sec": 49.475868701934814 }, { "epoch": 76, "train_loss": 0.6757127567672729, "train_acc": 0.76002, "test_loss": 2.228153326416016, "test_acc": 0.4719, "lyapunov": null, "grad_norm": 0.41518783756559813, "grad_max_sv": 0.24106829576194286, "grad_min_sv": 2.3467413079458765e-08, "grad_condition": 10331945.898118276, "lr": 0.0001355156862892944, "time_sec": 49.47853899002075 }, { "epoch": 77, "train_loss": 0.6663033656692505, "train_acc": 0.7606, "test_loss": 2.5164624114990235, "test_acc": 0.4627, "lyapunov": null, "grad_norm": 0.41866630242016806, "grad_max_sv": 0.2701979674398899, "grad_min_sv": 2.4135091125643272e-08, "grad_condition": 11260755.273271866, "lr": 0.00012494446518477025, "time_sec": 49.47706151008606 }, { "epoch": 78, "train_loss": 0.6645314185142517, "train_acc": 0.76252, "test_loss": 2.8226414447784425, "test_acc": 0.4614, "lyapunov": null, "grad_norm": 0.4173542916715373, "grad_max_sv": 0.2490392465144396, "grad_min_sv": 2.3206901200722994e-08, "grad_condition": 10823280.058633823, "lr": 0.00011474337861210548, "time_sec": 49.483954191207886 }, { "epoch": 79, "train_loss": 0.6665540114593506, "train_acc": 0.76016, "test_loss": 2.2122913623809812, "test_acc": 0.4819, "lyapunov": null, "grad_norm": 0.4188547510844498, "grad_max_sv": 0.25715495869517324, "grad_min_sv": 2.4195212988686877e-08, "grad_condition": 10755821.867443344, "lr": 0.00010492249381215483, "time_sec": 49.46640372276306 }, { "epoch": 80, "train_loss": 0.6579594387054444, "train_acc": 0.76406, "test_loss": 2.328022619628906, "test_acc": 0.4922, "lyapunov": null, "grad_norm": 0.41446019268915407, "grad_max_sv": 0.2467421844601631, "grad_min_sv": 2.3609747978881047e-08, "grad_condition": 10542743.78062649, "lr": 9.549150281252637e-05, "time_sec": 49.47466158866882 }, { "epoch": 81, "train_loss": 0.6575078699111938, "train_acc": 0.76504, "test_loss": 2.435921426773071, "test_acc": 0.4706, "lyapunov": null, "grad_norm": 0.41722587257024396, "grad_max_sv": 0.2460654556751251, "grad_min_sv": 2.2818005085412097e-08, "grad_condition": 10871762.933690486, "lr": 8.645971286271918e-05, "time_sec": 49.48575758934021 }, { "epoch": 82, "train_loss": 0.6540266362380981, "train_acc": 0.7668, "test_loss": 2.420010438537598, "test_acc": 0.4873, "lyapunov": null, "grad_norm": 0.4134489054266664, "grad_max_sv": 0.24872095324099064, "grad_min_sv": 2.4063159953513492e-08, "grad_condition": 10418409.724400165, "lr": 7.78360372489926e-05, "time_sec": 49.4517502784729 }, { "epoch": 83, "train_loss": 0.6572029878616333, "train_acc": 0.76728, "test_loss": 2.509574550628662, "test_acc": 0.4741, "lyapunov": null, "grad_norm": 0.40888921626022273, "grad_max_sv": 0.24261515885591506, "grad_min_sv": 2.325806733871616e-08, "grad_condition": 10519103.211694924, "lr": 6.962898649802815e-05, "time_sec": 49.47699522972107 }, { "epoch": 84, "train_loss": 0.648239343738556, "train_acc": 0.76774, "test_loss": 2.2645148223876954, "test_acc": 0.485, "lyapunov": null, "grad_norm": 0.4120785615672335, "grad_max_sv": 0.24379208087921142, "grad_min_sv": 2.272370744904606e-08, "grad_condition": 10771039.526767144, "lr": 6.184665997806824e-05, "time_sec": 49.461183071136475 }, { "epoch": 85, "train_loss": 0.6412541982460022, "train_acc": 0.77106, "test_loss": 2.5437144912719725, "test_acc": 0.4865, "lyapunov": null, "grad_norm": 0.41805406865324773, "grad_max_sv": 0.2572408441454172, "grad_min_sv": 2.2814066324983172e-08, "grad_condition": 11337861.01159941, "lr": 5.449673790581613e-05, "time_sec": 49.47793769836426 }, { "epoch": 86, "train_loss": 0.6463544520187378, "train_acc": 0.76662, "test_loss": 2.9264222496032715, "test_acc": 0.4471, "lyapunov": null, "grad_norm": 0.4118969055764605, "grad_max_sv": 0.2387235414236784, "grad_min_sv": 2.2642364694291928e-08, "grad_condition": 10550361.803450387, "lr": 4.758647376699034e-05, "time_sec": 49.4726197719574 }, { "epoch": 87, "train_loss": 0.6428634425735473, "train_acc": 0.7704, "test_loss": 2.5568968086242676, "test_acc": 0.4759, "lyapunov": null, "grad_norm": 0.415046593792845, "grad_max_sv": 0.2535580638796091, "grad_min_sv": 2.363120126247509e-08, "grad_condition": 10837761.433894884, "lr": 4.112268715800956e-05, "time_sec": 49.48099684715271 }, { "epoch": 88, "train_loss": 0.6407405834579468, "train_acc": 0.77184, "test_loss": 2.4600058319091795, "test_acc": 0.475, "lyapunov": null, "grad_norm": 0.4135582126787873, "grad_max_sv": 0.25508003048598765, "grad_min_sv": 2.376858407870941e-08, "grad_condition": 10837781.081215866, "lr": 3.511175705587434e-05, "time_sec": 49.47017812728882 }, { "epoch": 89, "train_loss": 0.6344939192008973, "train_acc": 0.77288, "test_loss": 2.4250204902648926, "test_acc": 0.4787, "lyapunov": null, "grad_norm": 0.4160361292383021, "grad_max_sv": 0.25198650658130645, "grad_min_sv": 2.3671872506625392e-08, "grad_condition": 10764847.245073054, "lr": 2.9559615522887284e-05, "time_sec": 49.48287224769592 }, { "epoch": 90, "train_loss": 0.6344009274482727, "train_acc": 0.77354, "test_loss": 2.7001010314941407, "test_acc": 0.4623, "lyapunov": null, "grad_norm": 0.4089648902673904, "grad_max_sv": 0.24975020438432693, "grad_min_sv": 2.2971467306120984e-08, "grad_condition": 10990208.207150657, "lr": 2.447174185242324e-05, "time_sec": 49.50636339187622 }, { "epoch": 91, "train_loss": 0.6388888354110718, "train_acc": 0.77322, "test_loss": 2.4007692584991456, "test_acc": 0.482, "lyapunov": null, "grad_norm": 0.41394740295503574, "grad_max_sv": 0.24785541072487832, "grad_min_sv": 2.4093225903243366e-08, "grad_condition": 10380601.978368312, "lr": 1.9853157161528526e-05, "time_sec": 49.47446608543396 }, { "epoch": 92, "train_loss": 0.6364776765632629, "train_acc": 0.7745, "test_loss": 2.399016780090332, "test_acc": 0.4893, "lyapunov": null, "grad_norm": 0.4144776850028884, "grad_max_sv": 0.23398316986858844, "grad_min_sv": 2.3364770829203963e-08, "grad_condition": 10152213.637178902, "lr": 1.570841943568452e-05, "time_sec": 49.4903450012207 }, { "epoch": 93, "train_loss": 0.6323039393615723, "train_acc": 0.7761, "test_loss": 2.5661166526794434, "test_acc": 0.4799, "lyapunov": null, "grad_norm": 0.4148058440423859, "grad_max_sv": 0.25038140527904035, "grad_min_sv": 2.3675201843431638e-08, "grad_condition": 10621575.74650034, "lr": 1.204161903062634e-05, "time_sec": 49.47283339500427 }, { "epoch": 94, "train_loss": 0.6312036778831482, "train_acc": 0.77456, "test_loss": 2.4954245025634765, "test_acc": 0.4884, "lyapunov": null, "grad_norm": 0.41190158928123094, "grad_max_sv": 0.23922828286886216, "grad_min_sv": 2.3207600818864195e-08, "grad_condition": 10426944.434691576, "lr": 8.85637463565564e-06, "time_sec": 49.4705286026001 }, { "epoch": 95, "train_loss": 0.631898609752655, "train_acc": 0.77374, "test_loss": 2.496735878753662, "test_acc": 0.484, "lyapunov": null, "grad_norm": 0.4118919272482802, "grad_max_sv": 0.2545221421867609, "grad_min_sv": 2.265429692727139e-08, "grad_condition": 11229071.176658351, "lr": 6.155829702431171e-06, "time_sec": 49.45284724235535 }, { "epoch": 96, "train_loss": 0.6379076655197143, "train_acc": 0.77178, "test_loss": 2.6363272483825684, "test_acc": 0.476, "lyapunov": null, "grad_norm": 0.4109637736779776, "grad_max_sv": 0.23244931511580944, "grad_min_sv": 2.2822463163763017e-08, "grad_condition": 10301145.344649881, "lr": 3.942649342761118e-06, "time_sec": 49.47940802574158 }, { "epoch": 97, "train_loss": 0.6325872544288635, "train_acc": 0.77334, "test_loss": 2.7118479751586912, "test_acc": 0.4606, "lyapunov": null, "grad_norm": 0.4111072193471729, "grad_max_sv": 0.23797121047973632, "grad_min_sv": 2.2607291239040707e-08, "grad_condition": 10688228.14219837, "lr": 2.2190176984600023e-06, "time_sec": 49.482439041137695 }, { "epoch": 98, "train_loss": 0.6342727423286438, "train_acc": 0.77484, "test_loss": 2.50120391998291, "test_acc": 0.4868, "lyapunov": null, "grad_norm": 0.4137394255148928, "grad_max_sv": 0.24089130759239197, "grad_min_sv": 2.424639040654597e-08, "grad_condition": 10056603.153747398, "lr": 9.866357858642206e-07, "time_sec": 49.48271298408508 }, { "epoch": 99, "train_loss": 0.628259766407013, "train_acc": 0.77486, "test_loss": 2.447319179916382, "test_acc": 0.4885, "lyapunov": null, "grad_norm": 0.4076037809536703, "grad_max_sv": 0.25056461431086063, "grad_min_sv": 2.3701171647516616e-08, "grad_condition": 10626762.207877642, "lr": 2.467198171342e-07, "time_sec": 49.45984363555908 }, { "epoch": 100, "train_loss": 0.6313758395767212, "train_acc": 0.77534, "test_loss": 2.4442952224731447, "test_acc": 0.4905, "lyapunov": null, "grad_norm": 0.40858498927976306, "grad_max_sv": 0.23060753419995308, "grad_min_sv": 2.2785150743942496e-08, "grad_condition": 10116355.973472353, "lr": 0.0, "time_sec": 49.46379518508911 } ], "16": [ { "epoch": 1, "train_loss": 2.717775194091797, "train_acc": 0.12228, "test_loss": 3.3459623817443847, "test_acc": 0.1, "lyapunov": null, "grad_norm": 7.716699984005914, "grad_max_sv": 7.287460565567017, "grad_min_sv": 2.5165389772041635e-07, "grad_condition": 29456429.211788226, "lr": 0.0009997532801828658, "time_sec": 66.53277444839478 }, { "epoch": 2, "train_loss": 2.2721379792785643, "train_acc": 0.17654, "test_loss": 4.04989028930664, "test_acc": 0.1003, "lyapunov": null, "grad_norm": 6.63637414556116, "grad_max_sv": 6.237935948371887, "grad_min_sv": 2.2601446723058415e-07, "grad_condition": 28188789.96425259, "lr": 0.0009990133642141358, "time_sec": 66.55316853523254 }, { "epoch": 3, "train_loss": 2.137921618881226, "train_acc": 0.2105, "test_loss": 5.869428012084961, "test_acc": 0.1011, "lyapunov": null, "grad_norm": 5.7520031644476814, "grad_max_sv": 5.452845233678818, "grad_min_sv": 1.9201941405810886e-07, "grad_condition": 28919609.465649594, "lr": 0.00099778098230154, "time_sec": 66.56071186065674 }, { "epoch": 4, "train_loss": 2.0486733519744873, "train_acc": 0.23394, "test_loss": 5.161107911682129, "test_acc": 0.1097, "lyapunov": null, "grad_norm": 4.91519980042541, "grad_max_sv": 4.5814680576324465, "grad_min_sv": 1.6788343710771868e-07, "grad_condition": 27707547.33712595, "lr": 0.000996057350657239, "time_sec": 66.55148816108704 }, { "epoch": 5, "train_loss": 1.9897926804351806, "train_acc": 0.25822, "test_loss": 4.115356592559815, "test_acc": 0.1203, "lyapunov": null, "grad_norm": 4.476936137063571, "grad_max_sv": 4.264879077672958, "grad_min_sv": 1.6287330311115512e-07, "grad_condition": 27434565.90350554, "lr": 0.0009938441702975688, "time_sec": 66.53483939170837 }, { "epoch": 6, "train_loss": 1.950422788543701, "train_acc": 0.26598, "test_loss": 6.161662875366211, "test_acc": 0.1038, "lyapunov": null, "grad_norm": 4.078084494569751, "grad_max_sv": 3.8316186487674715, "grad_min_sv": 1.5860823996405315e-07, "grad_condition": 24946451.178036533, "lr": 0.0009911436253643444, "time_sec": 66.544926404953 }, { "epoch": 7, "train_loss": 1.9193549822998046, "train_acc": 0.28804, "test_loss": 6.333303915405273, "test_acc": 0.1006, "lyapunov": null, "grad_norm": 3.9544625089709906, "grad_max_sv": 3.660486602783203, "grad_min_sv": 1.3159545346752567e-07, "grad_condition": 27858533.203216422, "lr": 0.0009879583809693736, "time_sec": 66.54343152046204 }, { "epoch": 8, "train_loss": 1.8974505254364014, "train_acc": 0.29166, "test_loss": 6.595959260559082, "test_acc": 0.1052, "lyapunov": null, "grad_norm": 3.7716319720252063, "grad_max_sv": 3.4488155782222747, "grad_min_sv": 1.3156188991558792e-07, "grad_condition": 26979104.149509914, "lr": 0.0009842915805643154, "time_sec": 66.53689360618591 }, { "epoch": 9, "train_loss": 1.8757565868377686, "train_acc": 0.2988, "test_loss": 8.294800563049316, "test_acc": 0.1001, "lyapunov": null, "grad_norm": 3.606736816077247, "grad_max_sv": 3.276396805047989, "grad_min_sv": 1.2148574111137122e-07, "grad_condition": 27354129.68622259, "lr": 0.0009801468428384714, "time_sec": 66.53859829902649 }, { "epoch": 10, "train_loss": 1.853810763168335, "train_acc": 0.30818, "test_loss": 7.528170121765137, "test_acc": 0.1002, "lyapunov": null, "grad_norm": 3.590286745766664, "grad_max_sv": 3.3836376488208773, "grad_min_sv": 1.2300289498057282e-07, "grad_condition": 28478996.179412544, "lr": 0.0009755282581475767, "time_sec": 66.54752492904663 }, { "epoch": 11, "train_loss": 1.8360865605926513, "train_acc": 0.31554, "test_loss": 8.300324632263184, "test_acc": 0.1004, "lyapunov": null, "grad_norm": 3.4184867147228633, "grad_max_sv": 3.2137346804141997, "grad_min_sv": 1.2349632871888616e-07, "grad_condition": 27052165.93028751, "lr": 0.0009704403844771127, "time_sec": 66.54567265510559 }, { "epoch": 12, "train_loss": 1.822631957397461, "train_acc": 0.32436, "test_loss": 7.752643719482422, "test_acc": 0.1021, "lyapunov": null, "grad_norm": 3.4268104192911824, "grad_max_sv": 3.0984551936388014, "grad_min_sv": 1.1916837276970682e-07, "grad_condition": 26678795.929163624, "lr": 0.0009648882429441257, "time_sec": 66.54143714904785 }, { "epoch": 13, "train_loss": 1.8042937320327759, "train_acc": 0.33052, "test_loss": 6.320642838287354, "test_acc": 0.1016, "lyapunov": null, "grad_norm": 3.26500321242579, "grad_max_sv": 3.034997683763504, "grad_min_sv": 1.1198519924704443e-07, "grad_condition": 27516714.34616376, "lr": 0.0009588773128419905, "time_sec": 66.54663801193237 }, { "epoch": 14, "train_loss": 1.7935633684539796, "train_acc": 0.33378, "test_loss": 8.591533955383301, "test_acc": 0.1001, "lyapunov": null, "grad_norm": 3.205935962438017, "grad_max_sv": 2.9335897117853165, "grad_min_sv": 1.0952790088225584e-07, "grad_condition": 27285541.83012454, "lr": 0.0009524135262330098, "time_sec": 66.54473447799683 }, { "epoch": 15, "train_loss": 1.7773359481811524, "train_acc": 0.34102, "test_loss": 9.823327029418945, "test_acc": 0.1, "lyapunov": null, "grad_norm": 3.107803718888726, "grad_max_sv": 2.8818213611841204, "grad_min_sv": 1.1047076302617142e-07, "grad_condition": 26466849.950957365, "lr": 0.0009455032620941839, "time_sec": 66.54632878303528 }, { "epoch": 16, "train_loss": 1.7638415741348266, "train_acc": 0.3494, "test_loss": 10.98111782836914, "test_acc": 0.1, "lyapunov": null, "grad_norm": 2.991047436873543, "grad_max_sv": 2.6788798362016677, "grad_min_sv": 9.756340197952796e-08, "grad_condition": 27546377.57163794, "lr": 0.0009381533400219318, "time_sec": 66.5387659072876 }, { "epoch": 17, "train_loss": 1.7545028717422486, "train_acc": 0.3524, "test_loss": 8.496100090026856, "test_acc": 0.1005, "lyapunov": null, "grad_norm": 2.9405206102474817, "grad_max_sv": 2.7797821670770646, "grad_min_sv": 1.0545847413112597e-07, "grad_condition": 26402272.837948732, "lr": 0.0009303710135019719, "time_sec": 66.53228521347046 }, { "epoch": 18, "train_loss": 1.7399513541412353, "train_acc": 0.35946, "test_loss": 9.442770735168457, "test_acc": 0.1002, "lyapunov": null, "grad_norm": 2.876673477887061, "grad_max_sv": 2.652202320098877, "grad_min_sv": 1.0433013795108081e-07, "grad_condition": 26098642.755907767, "lr": 0.0009221639627510076, "time_sec": 66.52799201011658 }, { "epoch": 19, "train_loss": 1.7275141513061523, "train_acc": 0.36564, "test_loss": 8.60740804901123, "test_acc": 0.1, "lyapunov": null, "grad_norm": 2.820914668477109, "grad_max_sv": 2.8074967473745347, "grad_min_sv": 1.0515814725664541e-07, "grad_condition": 27554948.172257036, "lr": 0.000913540287137281, "time_sec": 66.53072094917297 }, { "epoch": 20, "train_loss": 1.7184981283187866, "train_acc": 0.36706, "test_loss": 5.74347527923584, "test_acc": 0.1074, "lyapunov": null, "grad_norm": 2.755999508826315, "grad_max_sv": 2.4683564633131025, "grad_min_sv": 9.147877104709323e-08, "grad_condition": 27108387.83832861, "lr": 0.0009045084971874739, "time_sec": 66.53930997848511 }, { "epoch": 21, "train_loss": 1.7127495180892944, "train_acc": 0.36988, "test_loss": 5.374083380126953, "test_acc": 0.1038, "lyapunov": null, "grad_norm": 2.7076782774581156, "grad_max_sv": 2.415825995802879, "grad_min_sv": 9.989069553739682e-08, "grad_condition": 24996642.26521779, "lr": 0.0008950775061878452, "time_sec": 66.5274007320404 }, { "epoch": 22, "train_loss": 1.7080568863677978, "train_acc": 0.37366, "test_loss": 5.8365667526245115, "test_acc": 0.1074, "lyapunov": null, "grad_norm": 2.777540200252398, "grad_max_sv": 2.682383918762207, "grad_min_sv": 1.0115953053002613e-07, "grad_condition": 27062321.26943115, "lr": 0.0008852566213878947, "time_sec": 66.52736306190491 }, { "epoch": 23, "train_loss": 1.6937433179473877, "train_acc": 0.378, "test_loss": 5.908844201660156, "test_acc": 0.102, "lyapunov": null, "grad_norm": 2.5943120813718052, "grad_max_sv": 2.4230685472488402, "grad_min_sv": 9.802377860523848e-08, "grad_condition": 25663315.966033876, "lr": 0.0008750555348152298, "time_sec": 66.55514574050903 }, { "epoch": 24, "train_loss": 1.685849613647461, "train_acc": 0.38486, "test_loss": 6.484691570281982, "test_acc": 0.1015, "lyapunov": null, "grad_norm": 2.470392685402757, "grad_max_sv": 2.3409340023994445, "grad_min_sv": 9.386610759776204e-08, "grad_condition": 25307930.60423732, "lr": 0.0008644843137107057, "time_sec": 66.55581784248352 }, { "epoch": 25, "train_loss": 1.6830421477890014, "train_acc": 0.38556, "test_loss": 7.468188558959961, "test_acc": 0.1022, "lyapunov": null, "grad_norm": 2.548563020510745, "grad_max_sv": 2.1459918454289437, "grad_min_sv": 8.803468158902205e-08, "grad_condition": 24944715.33907653, "lr": 0.0008535533905932737, "time_sec": 66.53887248039246 }, { "epoch": 26, "train_loss": 1.6700520505523682, "train_acc": 0.38856, "test_loss": 7.895222584533691, "test_acc": 0.1009, "lyapunov": null, "grad_norm": 2.5359070370837204, "grad_max_sv": 2.4539994060993195, "grad_min_sv": 9.640742533179037e-08, "grad_condition": 26335532.748314124, "lr": 0.0008422735529643444, "time_sec": 66.54404091835022 }, { "epoch": 27, "train_loss": 1.6605180406951905, "train_acc": 0.39334, "test_loss": 6.994429248046875, "test_acc": 0.101, "lyapunov": null, "grad_norm": 2.4258405770471474, "grad_max_sv": 2.320448189973831, "grad_min_sv": 9.107987271050888e-08, "grad_condition": 26102152.790860306, "lr": 0.0008306559326618259, "time_sec": 66.53805947303772 }, { "epoch": 28, "train_loss": 1.6567610062408447, "train_acc": 0.395, "test_loss": 6.368250694274902, "test_acc": 0.1099, "lyapunov": null, "grad_norm": 2.4482138479454654, "grad_max_sv": 2.1421856224536895, "grad_min_sv": 8.29846632299791e-08, "grad_condition": 25968573.760956615, "lr": 0.0008187119948743449, "time_sec": 66.56613659858704 }, { "epoch": 29, "train_loss": 1.643007601623535, "train_acc": 0.39978, "test_loss": 5.360125735473633, "test_acc": 0.1039, "lyapunov": null, "grad_norm": 2.4260201472737237, "grad_max_sv": 2.2909662395715715, "grad_min_sv": 9.427450295973471e-08, "grad_condition": 24999199.08130427, "lr": 0.0008064535268264883, "time_sec": 66.5019998550415 }, { "epoch": 30, "train_loss": 1.6426652933120727, "train_acc": 0.40242, "test_loss": 5.846046133422852, "test_acc": 0.1054, "lyapunov": null, "grad_norm": 2.4104230560175877, "grad_max_sv": 2.2003868728876115, "grad_min_sv": 8.557402386699664e-08, "grad_condition": 26105024.01238749, "lr": 0.0007938926261462367, "time_sec": 66.54244065284729 }, { "epoch": 31, "train_loss": 1.6377650901031495, "train_acc": 0.4032, "test_loss": 5.6720462432861325, "test_acc": 0.1037, "lyapunov": null, "grad_norm": 2.3941082742204367, "grad_max_sv": 2.1774697691202163, "grad_min_sv": 8.963231525882521e-08, "grad_condition": 24809583.231536172, "lr": 0.0007810416889260654, "time_sec": 66.54210758209229 }, { "epoch": 32, "train_loss": 1.6306892547607421, "train_acc": 0.40602, "test_loss": 6.530587504577637, "test_acc": 0.1021, "lyapunov": null, "grad_norm": 2.310788163521601, "grad_max_sv": 2.3168098986148835, "grad_min_sv": 8.591319300421674e-08, "grad_condition": 27429040.418645225, "lr": 0.0007679133974894983, "time_sec": 66.54988598823547 }, { "epoch": 33, "train_loss": 1.616210421142578, "train_acc": 0.41068, "test_loss": 6.481897874450683, "test_acc": 0.1047, "lyapunov": null, "grad_norm": 2.280822445658443, "grad_max_sv": 2.0465356022119523, "grad_min_sv": 8.811248948248363e-08, "grad_condition": 23945215.471904326, "lr": 0.0007545207078751857, "time_sec": 66.54384207725525 }, { "epoch": 34, "train_loss": 1.6103173712921142, "train_acc": 0.4129, "test_loss": 7.558738642883301, "test_acc": 0.1004, "lyapunov": null, "grad_norm": 2.268328370380239, "grad_max_sv": 1.9925297170877456, "grad_min_sv": 8.015654646698067e-08, "grad_condition": 25172747.9746131, "lr": 0.0007408768370508577, "time_sec": 66.53899669647217 }, { "epoch": 35, "train_loss": 1.6033166294860839, "train_acc": 0.41878, "test_loss": 7.87334995880127, "test_acc": 0.1014, "lyapunov": null, "grad_norm": 2.1857354046879727, "grad_max_sv": 1.9975714191794396, "grad_min_sv": 7.650004620884943e-08, "grad_condition": 26089987.057969414, "lr": 0.0007269952498697734, "time_sec": 66.5277693271637 }, { "epoch": 36, "train_loss": 1.6046894992446898, "train_acc": 0.41892, "test_loss": 8.474886727905274, "test_acc": 0.1054, "lyapunov": null, "grad_norm": 2.192178860403557, "grad_max_sv": 2.002661418914795, "grad_min_sv": 8.41961090181087e-08, "grad_condition": 24123592.75292515, "lr": 0.0007128896457825364, "time_sec": 66.54011392593384 }, { "epoch": 37, "train_loss": 1.5938314058685303, "train_acc": 0.42164, "test_loss": 7.729584867858887, "test_acc": 0.1023, "lyapunov": null, "grad_norm": 2.181177891654343, "grad_max_sv": 2.0365157604217528, "grad_min_sv": 8.0202053975853e-08, "grad_condition": 26197254.249608647, "lr": 0.0006985739453173903, "time_sec": 66.53632307052612 }, { "epoch": 38, "train_loss": 1.5886405113220214, "train_acc": 0.42264, "test_loss": 5.7885481513977055, "test_acc": 0.1062, "lyapunov": null, "grad_norm": 2.138587269147521, "grad_max_sv": 1.933423602581024, "grad_min_sv": 7.520017115680844e-08, "grad_condition": 25928003.19539905, "lr": 0.0006840622763423391, "time_sec": 66.54145908355713 }, { "epoch": 39, "train_loss": 1.5804911177825929, "train_acc": 0.42612, "test_loss": 6.7240009689331055, "test_acc": 0.106, "lyapunov": null, "grad_norm": 2.146582724428281, "grad_max_sv": 1.8961839854717255, "grad_min_sv": 7.674624242781647e-08, "grad_condition": 24938086.191727363, "lr": 0.0006693689601226458, "time_sec": 66.54460453987122 }, { "epoch": 40, "train_loss": 1.5785979819488525, "train_acc": 0.42734, "test_loss": 6.793812344360352, "test_acc": 0.1033, "lyapunov": null, "grad_norm": 2.0524354853565967, "grad_max_sv": 1.9275713503360747, "grad_min_sv": 7.654831097880788e-08, "grad_condition": 25599705.595900334, "lr": 0.0006545084971874737, "time_sec": 66.78280329704285 }, { "epoch": 41, "train_loss": 1.5828138892364503, "train_acc": 0.42612, "test_loss": 6.44511951751709, "test_acc": 0.1052, "lyapunov": null, "grad_norm": 2.1085813246105163, "grad_max_sv": 1.9095334649085998, "grad_min_sv": 7.941251247700621e-08, "grad_condition": 24686632.04929278, "lr": 0.0006394955530196147, "time_sec": 66.53900074958801 }, { "epoch": 42, "train_loss": 1.5717257321548461, "train_acc": 0.42996, "test_loss": 8.174863388061523, "test_acc": 0.1011, "lyapunov": null, "grad_norm": 2.0568855518830627, "grad_max_sv": 1.8603438019752503, "grad_min_sv": 8.168111662598676e-08, "grad_condition": 23782864.12280636, "lr": 0.0006243449435824273, "time_sec": 66.54205513000488 }, { "epoch": 43, "train_loss": 1.562401286239624, "train_acc": 0.43392, "test_loss": 7.7131751495361325, "test_acc": 0.1014, "lyapunov": null, "grad_norm": 2.0119184672620642, "grad_max_sv": 1.8657386392354964, "grad_min_sv": 7.582975278808135e-08, "grad_condition": 24942971.18450144, "lr": 0.0006090716206982714, "time_sec": 66.53042316436768 }, { "epoch": 44, "train_loss": 1.5541102393341064, "train_acc": 0.43712, "test_loss": 8.247987678527831, "test_acc": 0.1011, "lyapunov": null, "grad_norm": 1.9482695609274137, "grad_max_sv": 1.6971077546477318, "grad_min_sv": 7.249982623136474e-08, "grad_condition": 23783887.230844818, "lr": 0.0005936906572928625, "time_sec": 66.5365047454834 }, { "epoch": 45, "train_loss": 1.551253000793457, "train_acc": 0.43906, "test_loss": 7.164133547973633, "test_acc": 0.1021, "lyapunov": null, "grad_norm": 1.9478309625288126, "grad_max_sv": 1.7972041130065919, "grad_min_sv": 7.798710131012853e-08, "grad_condition": 23697966.26066207, "lr": 0.0005782172325201156, "time_sec": 66.54136061668396 }, { "epoch": 46, "train_loss": 1.541000611190796, "train_acc": 0.44134, "test_loss": 6.376314013671875, "test_acc": 0.1045, "lyapunov": null, "grad_norm": 1.8630241109997108, "grad_max_sv": 1.6913443714380265, "grad_min_sv": 7.214549819778427e-08, "grad_condition": 23808757.926116575, "lr": 0.0005626666167821523, "time_sec": 66.55902171134949 }, { "epoch": 47, "train_loss": 1.5372591391754151, "train_acc": 0.44398, "test_loss": 6.5030721710205075, "test_acc": 0.1069, "lyapunov": null, "grad_norm": 1.9024590490680153, "grad_max_sv": 1.814224436879158, "grad_min_sv": 7.368249033135044e-08, "grad_condition": 25117471.09981022, "lr": 0.0005470541566592572, "time_sec": 66.52199673652649 }, { "epoch": 48, "train_loss": 1.5375283456802369, "train_acc": 0.44544, "test_loss": 7.119714102935791, "test_acc": 0.1016, "lyapunov": null, "grad_norm": 1.8585907694205182, "grad_max_sv": 1.7394830703735351, "grad_min_sv": 7.501465217885084e-08, "grad_condition": 23906344.012628905, "lr": 0.0005313952597646569, "time_sec": 66.54580640792847 }, { "epoch": 49, "train_loss": 1.5338307555770874, "train_acc": 0.4442, "test_loss": 5.397337831115722, "test_acc": 0.1059, "lyapunov": null, "grad_norm": 1.7902731589528738, "grad_max_sv": 1.6494132414460183, "grad_min_sv": 6.831805556828386e-08, "grad_condition": 24615282.56582328, "lr": 0.0005157053795390643, "time_sec": 66.53534126281738 }, { "epoch": 50, "train_loss": 1.5284276412963866, "train_acc": 0.44778, "test_loss": 5.524033654785156, "test_acc": 0.1078, "lyapunov": null, "grad_norm": 1.7713612838130008, "grad_max_sv": 1.5726667106151582, "grad_min_sv": 6.907176626214096e-08, "grad_condition": 22960902.516891498, "lr": 0.0005000000000000002, "time_sec": 66.5325882434845 }, { "epoch": 51, "train_loss": 1.5330605014801026, "train_acc": 0.44666, "test_loss": 6.847183532714844, "test_acc": 0.1031, "lyapunov": null, "grad_norm": 1.7792073911302086, "grad_max_sv": 1.6382696747779846, "grad_min_sv": 6.6116589625409e-08, "grad_condition": 24861349.651776347, "lr": 0.00048429462046093607, "time_sec": 66.53938388824463 }, { "epoch": 52, "train_loss": 1.515211699180603, "train_acc": 0.45132, "test_loss": 6.849605633544922, "test_acc": 0.1046, "lyapunov": null, "grad_norm": 1.7110848232260776, "grad_max_sv": 1.4070507645606996, "grad_min_sv": 6.268320333902011e-08, "grad_condition": 22502851.341604523, "lr": 0.0004686047402353435, "time_sec": 66.54575228691101 }, { "epoch": 53, "train_loss": 1.511851570777893, "train_acc": 0.44984, "test_loss": 6.742161424255371, "test_acc": 0.1035, "lyapunov": null, "grad_norm": 1.6990701953393579, "grad_max_sv": 1.5247679650783539, "grad_min_sv": 6.360552236017725e-08, "grad_condition": 24187524.31056104, "lr": 0.000452945843340743, "time_sec": 66.55630564689636 }, { "epoch": 54, "train_loss": 1.5134658539581298, "train_acc": 0.45194, "test_loss": 6.076722029113769, "test_acc": 0.1055, "lyapunov": null, "grad_norm": 1.67595650149666, "grad_max_sv": 1.521102523803711, "grad_min_sv": 6.705203148271721e-08, "grad_condition": 23102185.373464666, "lr": 0.00043733338321784806, "time_sec": 66.54796624183655 }, { "epoch": 55, "train_loss": 1.5127635479736328, "train_acc": 0.45416, "test_loss": 6.099140180969238, "test_acc": 0.1054, "lyapunov": null, "grad_norm": 1.669713615396416, "grad_max_sv": 1.4162977203726768, "grad_min_sv": 5.9198181379116475e-08, "grad_condition": 24265418.333155036, "lr": 0.0004217827674798847, "time_sec": 66.56652212142944 }, { "epoch": 56, "train_loss": 1.5037149493789672, "train_acc": 0.45674, "test_loss": 5.881203063964843, "test_acc": 0.106, "lyapunov": null, "grad_norm": 1.6488336383475701, "grad_max_sv": 1.5071144998073578, "grad_min_sv": 6.376719170475554e-08, "grad_condition": 23818554.434521496, "lr": 0.00040630934270713783, "time_sec": 66.53574323654175 }, { "epoch": 57, "train_loss": 1.504850189590454, "train_acc": 0.459, "test_loss": 5.68402534790039, "test_acc": 0.1076, "lyapunov": null, "grad_norm": 1.6129911107480968, "grad_max_sv": 1.4527282550930978, "grad_min_sv": 6.286840470437483e-08, "grad_condition": 23483060.334747117, "lr": 0.000390928379301729, "time_sec": 66.54559707641602 }, { "epoch": 58, "train_loss": 1.4977053466033936, "train_acc": 0.45916, "test_loss": 5.9823997062683105, "test_acc": 0.1071, "lyapunov": null, "grad_norm": 1.6061924832487942, "grad_max_sv": 1.3888853162527084, "grad_min_sv": 6.253125484079192e-08, "grad_condition": 22608679.418678027, "lr": 0.0003756550564175727, "time_sec": 66.55387783050537 }, { "epoch": 59, "train_loss": 1.4972542272949219, "train_acc": 0.45872, "test_loss": 5.0882811370849605, "test_acc": 0.1151, "lyapunov": null, "grad_norm": 1.5591682163016796, "grad_max_sv": 1.3346713334321976, "grad_min_sv": 5.8280132453347735e-08, "grad_condition": 23069467.539254077, "lr": 0.00036050444698038553, "time_sec": 66.54211473464966 }, { "epoch": 60, "train_loss": 1.4907029873657227, "train_acc": 0.46126, "test_loss": 7.020564842224121, "test_acc": 0.1048, "lyapunov": null, "grad_norm": 1.5345406038505094, "grad_max_sv": 1.4284722179174423, "grad_min_sv": 6.001468877414595e-08, "grad_condition": 24162295.485593982, "lr": 0.00034549150281252655, "time_sec": 66.55491805076599 }, { "epoch": 61, "train_loss": 1.4877613472366333, "train_acc": 0.4653, "test_loss": 4.854167632293701, "test_acc": 0.1114, "lyapunov": null, "grad_norm": 1.5324361061772793, "grad_max_sv": 1.325933101773262, "grad_min_sv": 5.964644183009682e-08, "grad_condition": 22280923.908054985, "lr": 0.0003306310398773544, "time_sec": 66.54050326347351 }, { "epoch": 62, "train_loss": 1.4875999914550782, "train_acc": 0.4609, "test_loss": 6.024991397094727, "test_acc": 0.1045, "lyapunov": null, "grad_norm": 1.5157035873578593, "grad_max_sv": 1.2820105284452439, "grad_min_sv": 5.6854590901878056e-08, "grad_condition": 22744392.831777684, "lr": 0.00031593772365766127, "time_sec": 66.56322026252747 }, { "epoch": 63, "train_loss": 1.4804442275238037, "train_acc": 0.46586, "test_loss": 6.877338618469238, "test_acc": 0.1028, "lyapunov": null, "grad_norm": 1.5037529747226948, "grad_max_sv": 1.3301736950874328, "grad_min_sv": 6.064568385255597e-08, "grad_condition": 22458783.805724658, "lr": 0.0003014260546826097, "time_sec": 66.55420660972595 }, { "epoch": 64, "train_loss": 1.4785625118637085, "train_acc": 0.4676, "test_loss": 5.8289501716613765, "test_acc": 0.1058, "lyapunov": null, "grad_norm": 1.4955609555476688, "grad_max_sv": 1.2231090664863586, "grad_min_sv": 5.909942020210224e-08, "grad_condition": 21200746.17398096, "lr": 0.0002871103542174637, "time_sec": 66.55184054374695 }, { "epoch": 65, "train_loss": 1.474054185218811, "train_acc": 0.4692, "test_loss": 6.821263113403321, "test_acc": 0.1053, "lyapunov": null, "grad_norm": 1.4816881050330082, "grad_max_sv": 1.304422627389431, "grad_min_sv": 6.126439071607592e-08, "grad_condition": 22262717.79019341, "lr": 0.0002730047501302267, "time_sec": 66.54631876945496 }, { "epoch": 66, "train_loss": 1.468451905593872, "train_acc": 0.46872, "test_loss": 6.21660086593628, "test_acc": 0.1049, "lyapunov": null, "grad_norm": 1.4471343716270808, "grad_max_sv": 1.2118137910962106, "grad_min_sv": 5.677175121121536e-08, "grad_condition": 21833909.31574912, "lr": 0.00025912316294914234, "time_sec": 66.54650139808655 }, { "epoch": 67, "train_loss": 1.473218607635498, "train_acc": 0.46886, "test_loss": 5.585741909790039, "test_acc": 0.1093, "lyapunov": null, "grad_norm": 1.4454249735567377, "grad_max_sv": 1.344612455368042, "grad_min_sv": 5.805593232821593e-08, "grad_condition": 23703781.24599778, "lr": 0.0002454792921248144, "time_sec": 66.54963803291321 }, { "epoch": 68, "train_loss": 1.464357560043335, "train_acc": 0.47134, "test_loss": 6.43534487915039, "test_acc": 0.1036, "lyapunov": null, "grad_norm": 1.4158825945249984, "grad_max_sv": 1.216756673157215, "grad_min_sv": 5.594884520121468e-08, "grad_condition": 22117575.184218023, "lr": 0.00023208660251050164, "time_sec": 66.53380155563354 }, { "epoch": 69, "train_loss": 1.4605754261016846, "train_acc": 0.47354, "test_loss": 6.361464812469483, "test_acc": 0.1041, "lyapunov": null, "grad_norm": 1.4102858398212452, "grad_max_sv": 1.2650031745433807, "grad_min_sv": 5.616340708058942e-08, "grad_condition": 22755240.415779583, "lr": 0.00021895831107393473, "time_sec": 66.55379509925842 }, { "epoch": 70, "train_loss": 1.4566728033065797, "train_acc": 0.4732, "test_loss": 7.030058961486817, "test_acc": 0.1052, "lyapunov": null, "grad_norm": 1.4004542368068666, "grad_max_sv": 1.1733321487903594, "grad_min_sv": 5.324388059335661e-08, "grad_condition": 22428640.626706712, "lr": 0.00020610737385376356, "time_sec": 66.53196001052856 }, { "epoch": 71, "train_loss": 1.4595127109909058, "train_acc": 0.4747, "test_loss": 6.251192915344238, "test_acc": 0.1055, "lyapunov": null, "grad_norm": 1.4007518176750748, "grad_max_sv": 1.2036359310150146, "grad_min_sv": 5.3584219283919765e-08, "grad_condition": 22661079.860923886, "lr": 0.00019354647317351177, "time_sec": 66.53831934928894 }, { "epoch": 72, "train_loss": 1.4561804718780518, "train_acc": 0.47592, "test_loss": 6.078685757446289, "test_acc": 0.1053, "lyapunov": null, "grad_norm": 1.3882159701453969, "grad_max_sv": 1.1710434511303902, "grad_min_sv": 5.193670311598453e-08, "grad_condition": 22617697.621583022, "lr": 0.0001812880051256552, "time_sec": 66.53273725509644 }, { "epoch": 73, "train_loss": 1.456334539833069, "train_acc": 0.47646, "test_loss": 6.318551240539551, "test_acc": 0.1053, "lyapunov": null, "grad_norm": 1.3893052276682352, "grad_max_sv": 1.262186436355114, "grad_min_sv": 5.998066114898392e-08, "grad_condition": 21695066.67305842, "lr": 0.00016934406733817422, "time_sec": 66.53349781036377 }, { "epoch": 74, "train_loss": 1.450936794128418, "train_acc": 0.48046, "test_loss": 5.979817550659179, "test_acc": 0.105, "lyapunov": null, "grad_norm": 1.3659009379358413, "grad_max_sv": 1.2089540883898735, "grad_min_sv": 5.6734091380405974e-08, "grad_condition": 21453559.245642237, "lr": 0.0001577264470356557, "time_sec": 66.5519745349884 }, { "epoch": 75, "train_loss": 1.4469789163970947, "train_acc": 0.47906, "test_loss": 6.295627461242676, "test_acc": 0.1067, "lyapunov": null, "grad_norm": 1.3551347445295552, "grad_max_sv": 1.1976817324757576, "grad_min_sv": 5.458875831365617e-08, "grad_condition": 22252931.086762276, "lr": 0.00014644660940672634, "time_sec": 66.55559992790222 }, { "epoch": 76, "train_loss": 1.4463843099212645, "train_acc": 0.47934, "test_loss": 6.197264282226563, "test_acc": 0.1079, "lyapunov": null, "grad_norm": 1.3380208446863917, "grad_max_sv": 1.2127704448997974, "grad_min_sv": 5.3017609769057116e-08, "grad_condition": 23070185.252038278, "lr": 0.0001355156862892944, "time_sec": 66.54188418388367 }, { "epoch": 77, "train_loss": 1.4422340731430054, "train_acc": 0.47956, "test_loss": 6.095625473022461, "test_acc": 0.1068, "lyapunov": null, "grad_norm": 1.319834743092097, "grad_max_sv": 1.0997839123010635, "grad_min_sv": 5.253857917608684e-08, "grad_condition": 21034235.602306478, "lr": 0.00012494446518477025, "time_sec": 66.54432153701782 }, { "epoch": 78, "train_loss": 1.4469564128875732, "train_acc": 0.48036, "test_loss": 5.388970955657959, "test_acc": 0.11, "lyapunov": null, "grad_norm": 1.3475784983368762, "grad_max_sv": 1.2046680554747582, "grad_min_sv": 5.585839417676652e-08, "grad_condition": 21905924.79288598, "lr": 0.00011474337861210548, "time_sec": 66.53302836418152 }, { "epoch": 79, "train_loss": 1.4366684397125244, "train_acc": 0.4798, "test_loss": 6.206115145874024, "test_acc": 0.1069, "lyapunov": null, "grad_norm": 1.3130109628098805, "grad_max_sv": 1.1744658067822455, "grad_min_sv": 5.508810989596213e-08, "grad_condition": 21715398.426144313, "lr": 0.00010492249381215483, "time_sec": 66.53135848045349 }, { "epoch": 80, "train_loss": 1.4392537023544312, "train_acc": 0.48228, "test_loss": 6.179986186218262, "test_acc": 0.1064, "lyapunov": null, "grad_norm": 1.3256940413341314, "grad_max_sv": 1.1846244156360626, "grad_min_sv": 5.3839901603680576e-08, "grad_condition": 22125564.09370377, "lr": 9.549150281252637e-05, "time_sec": 66.5379912853241 }, { "epoch": 81, "train_loss": 1.4338660355377197, "train_acc": 0.48616, "test_loss": 6.177688023376465, "test_acc": 0.1068, "lyapunov": null, "grad_norm": 1.331304941867422, "grad_max_sv": 1.2059139341115952, "grad_min_sv": 5.419374078385886e-08, "grad_condition": 22342309.054380674, "lr": 8.645971286271918e-05, "time_sec": 66.5526373386383 }, { "epoch": 82, "train_loss": 1.4322706761550903, "train_acc": 0.48346, "test_loss": 6.39905592956543, "test_acc": 0.1049, "lyapunov": null, "grad_norm": 1.3160308800060254, "grad_max_sv": 1.1150345966219901, "grad_min_sv": 5.504024436220334e-08, "grad_condition": 20495998.096470684, "lr": 7.78360372489926e-05, "time_sec": 66.53385639190674 }, { "epoch": 83, "train_loss": 1.4299918703460692, "train_acc": 0.48306, "test_loss": 6.442905668640137, "test_acc": 0.1051, "lyapunov": null, "grad_norm": 1.3113912638515688, "grad_max_sv": 1.0838071212172509, "grad_min_sv": 5.43203230840561e-08, "grad_condition": 20241235.03989599, "lr": 6.962898649802815e-05, "time_sec": 66.52077317237854 }, { "epoch": 84, "train_loss": 1.4280065909194946, "train_acc": 0.4822, "test_loss": 6.0934767837524415, "test_acc": 0.1077, "lyapunov": null, "grad_norm": 1.3219999598887227, "grad_max_sv": 1.1636987075209617, "grad_min_sv": 5.4432569296380964e-08, "grad_condition": 21698960.666762732, "lr": 6.184665997806824e-05, "time_sec": 66.54324150085449 }, { "epoch": 85, "train_loss": 1.426846856918335, "train_acc": 0.4865, "test_loss": 5.9188161468505855, "test_acc": 0.107, "lyapunov": null, "grad_norm": 1.2965845421535789, "grad_max_sv": 1.1792906790971756, "grad_min_sv": 5.5100021434384416e-08, "grad_condition": 21690369.73733188, "lr": 5.449673790581613e-05, "time_sec": 66.53187370300293 }, { "epoch": 86, "train_loss": 1.4228094031524658, "train_acc": 0.48556, "test_loss": 6.137683601379394, "test_acc": 0.108, "lyapunov": null, "grad_norm": 1.292831856620217, "grad_max_sv": 1.0124387323856354, "grad_min_sv": 5.2233392278111523e-08, "grad_condition": 19602805.79996558, "lr": 4.758647376699034e-05, "time_sec": 66.53067183494568 }, { "epoch": 87, "train_loss": 1.429165520362854, "train_acc": 0.48332, "test_loss": 5.927753118133545, "test_acc": 0.1088, "lyapunov": null, "grad_norm": 1.3101745862822605, "grad_max_sv": 1.1612930461764335, "grad_min_sv": 5.276717347513227e-08, "grad_condition": 22472879.957919728, "lr": 4.112268715800956e-05, "time_sec": 66.53908562660217 }, { "epoch": 88, "train_loss": 1.4288117279052734, "train_acc": 0.48666, "test_loss": 6.013241593933105, "test_acc": 0.1075, "lyapunov": null, "grad_norm": 1.3007188330408852, "grad_max_sv": 1.139727284014225, "grad_min_sv": 5.308784185587001e-08, "grad_condition": 21649216.459450316, "lr": 3.511175705587434e-05, "time_sec": 66.52465963363647 }, { "epoch": 89, "train_loss": 1.4234879583358764, "train_acc": 0.48672, "test_loss": 5.440691387176513, "test_acc": 0.1132, "lyapunov": null, "grad_norm": 1.286797693166196, "grad_max_sv": 1.1378898680210114, "grad_min_sv": 5.206395803369901e-08, "grad_condition": 22299317.66856014, "lr": 2.9559615522887284e-05, "time_sec": 66.52217221260071 }, { "epoch": 90, "train_loss": 1.4255534106445313, "train_acc": 0.4873, "test_loss": 5.6889183303833, "test_acc": 0.1089, "lyapunov": null, "grad_norm": 1.2907871997501676, "grad_max_sv": 1.1832163825631141, "grad_min_sv": 5.3787662057658284e-08, "grad_condition": 22287194.786688134, "lr": 2.447174185242324e-05, "time_sec": 66.53036832809448 }, { "epoch": 91, "train_loss": 1.4252548498916626, "train_acc": 0.48792, "test_loss": 6.261311422729492, "test_acc": 0.1064, "lyapunov": null, "grad_norm": 1.3031797280361905, "grad_max_sv": 1.1937354177236557, "grad_min_sv": 5.396164546311866e-08, "grad_condition": 22285756.773222417, "lr": 1.9853157161528526e-05, "time_sec": 66.53405451774597 }, { "epoch": 92, "train_loss": 1.4257716689300537, "train_acc": 0.48484, "test_loss": 5.9496440505981445, "test_acc": 0.1083, "lyapunov": null, "grad_norm": 1.2963951565864091, "grad_max_sv": 1.1119507551193237, "grad_min_sv": 5.530857025703995e-08, "grad_condition": 20517700.461063318, "lr": 1.570841943568452e-05, "time_sec": 66.55413794517517 }, { "epoch": 93, "train_loss": 1.4217627249526978, "train_acc": 0.48994, "test_loss": 5.984926200866699, "test_acc": 0.1075, "lyapunov": null, "grad_norm": 1.264014206865248, "grad_max_sv": 1.0518594324588775, "grad_min_sv": 4.926823864437324e-08, "grad_condition": 21435816.94874554, "lr": 1.204161903062634e-05, "time_sec": 66.52945113182068 }, { "epoch": 94, "train_loss": 1.4220651029205322, "train_acc": 0.48712, "test_loss": 5.9274788650512695, "test_acc": 0.107, "lyapunov": null, "grad_norm": 1.2852744864782746, "grad_max_sv": 1.194958347082138, "grad_min_sv": 5.49836086882749e-08, "grad_condition": 21876849.948771022, "lr": 8.85637463565564e-06, "time_sec": 66.53060245513916 }, { "epoch": 95, "train_loss": 1.4127644922637939, "train_acc": 0.4891, "test_loss": 6.033211676025391, "test_acc": 0.1068, "lyapunov": null, "grad_norm": 1.2852733904252112, "grad_max_sv": 1.1103495568037034, "grad_min_sv": 5.0794950290367066e-08, "grad_condition": 21903481.59645809, "lr": 6.155829702431171e-06, "time_sec": 66.54151201248169 }, { "epoch": 96, "train_loss": 1.42291917427063, "train_acc": 0.48754, "test_loss": 5.946468173217774, "test_acc": 0.1078, "lyapunov": null, "grad_norm": 1.296502082808029, "grad_max_sv": 1.1921778261661529, "grad_min_sv": 5.59618015927299e-08, "grad_condition": 21704630.944007598, "lr": 3.942649342761118e-06, "time_sec": 66.53685402870178 }, { "epoch": 97, "train_loss": 1.4221784051132202, "train_acc": 0.48922, "test_loss": 5.77611974029541, "test_acc": 0.1107, "lyapunov": null, "grad_norm": 1.283101201721102, "grad_max_sv": 1.1582708179950714, "grad_min_sv": 5.3498822172315384e-08, "grad_condition": 21893400.606446274, "lr": 2.2190176984600023e-06, "time_sec": 66.51551508903503 }, { "epoch": 98, "train_loss": 1.4199727509307862, "train_acc": 0.48888, "test_loss": 5.947603340148926, "test_acc": 0.1072, "lyapunov": null, "grad_norm": 1.2852084329880165, "grad_max_sv": 1.12471182346344, "grad_min_sv": 5.5720254987789984e-08, "grad_condition": 20744598.237500653, "lr": 9.866357858642206e-07, "time_sec": 66.54128313064575 }, { "epoch": 99, "train_loss": 1.4189085994720458, "train_acc": 0.49036, "test_loss": 6.019410075378418, "test_acc": 0.1088, "lyapunov": null, "grad_norm": 1.2671570273045278, "grad_max_sv": 1.044458197057247, "grad_min_sv": 5.2453829901821794e-08, "grad_condition": 20122144.845569003, "lr": 2.467198171342e-07, "time_sec": 66.5876886844635 }, { "epoch": 100, "train_loss": 1.4237549599456787, "train_acc": 0.48696, "test_loss": 6.123869666290283, "test_acc": 0.1056, "lyapunov": null, "grad_norm": 1.2842958901976373, "grad_max_sv": 1.0893320694565773, "grad_min_sv": 5.240736280498481e-08, "grad_condition": 20983923.24178537, "lr": 0.0, "time_sec": 66.52526140213013 } ] }, "lyapunov": { "4": [ { "epoch": 1, "train_loss": 5.9559499659729, "train_acc": 0.1816, "test_loss": 2.127836145401001, "test_acc": 0.2458, "lyapunov": 3.1805403927707916, "grad_norm": 7.669457973262479, "grad_max_sv": 5.918661725521088, "grad_min_sv": 2.931642846704108e-07, "grad_condition": 20422744.62807854, "lr": 0.0009997532801828658, "time_sec": 38.74378061294556 }, { "epoch": 2, "train_loss": 4.402947195281983, "train_acc": 0.19622, "test_loss": 2.0710217851638792, "test_acc": 0.2599, "lyapunov": 2.5604425824206807, "grad_norm": 5.322089969338386, "grad_max_sv": 4.252373713254928, "grad_min_sv": 1.9552239614029076e-07, "grad_condition": 22174922.12126705, "lr": 0.0009990133642141358, "time_sec": 38.64048624038696 }, { "epoch": 3, "train_loss": 4.045168105316162, "train_acc": 0.22284, "test_loss": 2.047537351036072, "test_acc": 0.275, "lyapunov": 2.4094676093372236, "grad_norm": 3.329135536451279, "grad_max_sv": 2.700692330300808, "grad_min_sv": 1.3114565362570828e-07, "grad_condition": 21120674.055912692, "lr": 0.00099778098230154, "time_sec": 38.632225036621094 }, { "epoch": 4, "train_loss": 3.8760036846923827, "train_acc": 0.23552, "test_loss": 2.0494147090911867, "test_acc": 0.2624, "lyapunov": 2.323524356803016, "grad_norm": 1.6169046791962502, "grad_max_sv": 1.2880224913358689, "grad_min_sv": 5.374016822656813e-08, "grad_condition": 24107383.024291664, "lr": 0.000996057350657239, "time_sec": 38.643821477890015 }, { "epoch": 5, "train_loss": 3.7066750312805175, "train_acc": 0.23364, "test_loss": 2.073809361457825, "test_acc": 0.2559, "lyapunov": 2.2068090539454195, "grad_norm": 0.6888041501699484, "grad_max_sv": 0.4505885936319828, "grad_min_sv": 2.5095627176341396e-08, "grad_condition": 18224356.70160868, "lr": 0.0009938441702975688, "time_sec": 38.63996958732605 }, { "epoch": 6, "train_loss": 3.5870462338256837, "train_acc": 0.22278, "test_loss": 2.0948594261169435, "test_acc": 0.2419, "lyapunov": 2.1068829035819947, "grad_norm": 0.4525297557038159, "grad_max_sv": 0.2912705983966589, "grad_min_sv": 1.4355599531334918e-08, "grad_condition": 20443883.38963156, "lr": 0.0009911436253643444, "time_sec": 38.64875626564026 }, { "epoch": 7, "train_loss": 3.516497625274658, "train_acc": 0.20518, "test_loss": 2.122341016769409, "test_acc": 0.2149, "lyapunov": 2.031583094535886, "grad_norm": 0.4192338818357315, "grad_max_sv": 0.2666142761707306, "grad_min_sv": 1.244383397436266e-08, "grad_condition": 21524577.239365414, "lr": 0.0009879583809693736, "time_sec": 38.65327429771423 }, { "epoch": 8, "train_loss": 3.500787953567505, "train_acc": 0.15934, "test_loss": 2.30495919342041, "test_acc": 0.1, "lyapunov": 1.9705595735393826, "grad_norm": 0.364806685633591, "grad_max_sv": 0.19433156847953797, "grad_min_sv": 7.78323775238877e-09, "grad_condition": 1400511997.1550007, "lr": 0.0009842915805643154, "time_sec": 38.633607625961304 }, { "epoch": 9, "train_loss": 3.5612770445251463, "train_acc": 0.0995, "test_loss": 2.309052435684204, "test_acc": 0.1, "lyapunov": 1.9462372851188836, "grad_norm": 0.1961322565486487, "grad_max_sv": 0.08832639907486736, "grad_min_sv": 7.733921171735724e-10, "grad_condition": 10141008570.944132, "lr": 0.0009801468428384714, "time_sec": 38.646180152893066 }, { "epoch": 10, "train_loss": 3.538458889770508, "train_acc": 0.09824, "test_loss": 2.3040579429626464, "test_acc": 0.1, "lyapunov": 1.9283022353106447, "grad_norm": 0.21318046705690488, "grad_max_sv": 0.0782687779981643, "grad_min_sv": 8.435315090236436e-10, "grad_condition": 12098584585.465805, "lr": 0.0009755282581475767, "time_sec": 38.63904404640198 }, { "epoch": 11, "train_loss": 3.529650466461182, "train_acc": 0.10062, "test_loss": 2.302797904205322, "test_acc": 0.1, "lyapunov": 1.9214661554302401, "grad_norm": 0.14436104663435, "grad_max_sv": 0.07406298876740039, "grad_min_sv": 1.8938792208460978e-10, "grad_condition": 16582547419.599035, "lr": 0.0009704403844771127, "time_sec": 38.65141201019287 }, { "epoch": 12, "train_loss": 3.527643050994873, "train_acc": 0.09804, "test_loss": 2.3026904548645017, "test_acc": 0.1, "lyapunov": 1.9200294935489859, "grad_norm": 0.13153432020985192, "grad_max_sv": 0.05873946417123079, "grad_min_sv": 2.2213949011783955e-10, "grad_condition": 29679782911.168915, "lr": 0.0009648882429441257, "time_sec": 38.637062311172485 }, { "epoch": 13, "train_loss": 3.525748397216797, "train_acc": 0.09986, "test_loss": 2.3026839447021485, "test_acc": 0.1, "lyapunov": 1.9183377143367173, "grad_norm": 0.1253530383790545, "grad_max_sv": 0.054947068355977534, "grad_min_sv": 2.484597018350735e-10, "grad_condition": 32728296691.529114, "lr": 0.0009588773128419905, "time_sec": 38.639862060546875 }, { "epoch": 14, "train_loss": 3.5267535670471193, "train_acc": 0.09928, "test_loss": 2.303218070602417, "test_acc": 0.1, "lyapunov": 1.9196420743337372, "grad_norm": 0.1092532269273596, "grad_max_sv": 0.04395028324797749, "grad_min_sv": 9.613613581557888e-11, "grad_condition": 21168413985.92494, "lr": 0.0009524135262330098, "time_sec": 38.639400243759155 }, { "epoch": 15, "train_loss": 3.5285498448181154, "train_acc": 0.0982, "test_loss": 2.3035209484100343, "test_acc": 0.1, "lyapunov": 1.920996154055876, "grad_norm": 0.10604045531455125, "grad_max_sv": 0.030423881998285652, "grad_min_sv": 8.947113291620313e-11, "grad_condition": 14692894250.958597, "lr": 0.0009455032620941839, "time_sec": 38.645652770996094 }, { "epoch": 16, "train_loss": 3.5281584407806394, "train_acc": 0.09964, "test_loss": 2.3028687210083008, "test_acc": 0.1, "lyapunov": 1.9207957717768676, "grad_norm": 0.09543807455983376, "grad_max_sv": 0.006560872681438923, "grad_min_sv": 4.056405124991419e-12, "grad_condition": 3706750979.9989243, "lr": 0.0009381533400219318, "time_sec": 38.63558006286621 }, { "epoch": 17, "train_loss": 3.5265050379943848, "train_acc": 0.09798, "test_loss": 2.302896424102783, "test_acc": 0.1, "lyapunov": 1.9195188765635576, "grad_norm": 0.09404328433417611, "grad_max_sv": 0.005626836745068431, "grad_min_sv": 8.896868440940896e-13, "grad_condition": 3600570896.7918577, "lr": 0.0009303710135019719, "time_sec": 38.63581418991089 }, { "epoch": 18, "train_loss": 3.5274914381408693, "train_acc": 0.09708, "test_loss": 2.3026503776550293, "test_acc": 0.1, "lyapunov": 1.9202668194270804, "grad_norm": 0.09620880376142034, "grad_max_sv": 0.003721812926232815, "grad_min_sv": 3.080583531323011e-13, "grad_condition": 2605476049.955305, "lr": 0.0009221639627510076, "time_sec": 38.637654304504395 }, { "epoch": 19, "train_loss": 3.5240187657165527, "train_acc": 0.09788, "test_loss": 2.3026472286224364, "test_acc": 0.1, "lyapunov": 1.917564369833378, "grad_norm": 0.08696272623748423, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000913540287137281, "time_sec": 38.64585041999817 }, { "epoch": 20, "train_loss": 3.526093559265137, "train_acc": 0.09698, "test_loss": 2.302675205993652, "test_acc": 0.1, "lyapunov": 1.9192343212454521, "grad_norm": 0.08759130668154863, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009045084971874739, "time_sec": 38.63778305053711 }, { "epoch": 21, "train_loss": 3.5268382842254637, "train_acc": 0.0963, "test_loss": 2.302619518661499, "test_acc": 0.1, "lyapunov": 1.9198827185594212, "grad_norm": 0.09131899089817433, "grad_max_sv": 0.0007137967739254236, "grad_min_sv": 1.2143662959650498e-34, "grad_condition": 713796773.9254236, "lr": 0.0008950775061878452, "time_sec": 38.63694953918457 }, { "epoch": 22, "train_loss": 3.5266487127685546, "train_acc": 0.09736, "test_loss": 2.302595558166504, "test_acc": 0.1, "lyapunov": 1.919754564914557, "grad_norm": 0.08451797479839518, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008852566213878947, "time_sec": 38.62629771232605 }, { "epoch": 23, "train_loss": 3.526773832244873, "train_acc": 0.09764, "test_loss": 2.3026504470825193, "test_acc": 0.1, "lyapunov": 1.919811970132696, "grad_norm": 0.0880141883169143, "grad_max_sv": 0.003215626534074545, "grad_min_sv": 6.757893669575438e-13, "grad_condition": 421691349.6171393, "lr": 0.0008750555348152298, "time_sec": 38.627503395080566 }, { "epoch": 24, "train_loss": 3.5253559977722166, "train_acc": 0.09686, "test_loss": 2.302592763519287, "test_acc": 0.1, "lyapunov": 1.9186803285423142, "grad_norm": 0.08625519727104183, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107057, "time_sec": 38.62110924720764 }, { "epoch": 25, "train_loss": 3.5271505029296875, "train_acc": 0.09882, "test_loss": 2.3026457008361816, "test_acc": 0.1, "lyapunov": 1.9201455759575299, "grad_norm": 0.08664315655618471, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008535533905932737, "time_sec": 38.663304567337036 }, { "epoch": 26, "train_loss": 3.52567841835022, "train_acc": 0.09848, "test_loss": 2.302622730255127, "test_acc": 0.1, "lyapunov": 1.918919243775975, "grad_norm": 0.08931714213407926, "grad_max_sv": 0.0026560820173472167, "grad_min_sv": 7.80326428931121e-27, "grad_condition": 2656082017.346831, "lr": 0.0008422735529643444, "time_sec": 38.642497539520264 }, { "epoch": 27, "train_loss": 3.5247526208496094, "train_acc": 0.09662, "test_loss": 2.3026296226501466, "test_acc": 0.1, "lyapunov": 1.9182322189935943, "grad_norm": 0.08339910325165188, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008306559326618259, "time_sec": 38.63079476356506 }, { "epoch": 28, "train_loss": 3.5269400009155274, "train_acc": 0.09728, "test_loss": 2.3025920150756836, "test_acc": 0.1, "lyapunov": 1.9199587207316133, "grad_norm": 0.08394537087665149, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743449, "time_sec": 38.61244583129883 }, { "epoch": 29, "train_loss": 3.5242063328552247, "train_acc": 0.09546, "test_loss": 2.3025877166748048, "test_acc": 0.1, "lyapunov": 1.9176992738948149, "grad_norm": 0.08393484553605075, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008064535268264883, "time_sec": 38.62086057662964 }, { "epoch": 30, "train_loss": 3.524652021865845, "train_acc": 0.09846, "test_loss": 2.3025890396118163, "test_acc": 0.1, "lyapunov": 1.9180299269268886, "grad_norm": 0.08604739858068552, "grad_max_sv": 0.0037235306110233067, "grad_min_sv": 2.2816656604449788e-14, "grad_condition": 2522915018.0120707, "lr": 0.0007938926261462367, "time_sec": 38.63639521598816 }, { "epoch": 31, "train_loss": 3.5269307495117186, "train_acc": 0.09852, "test_loss": 2.302594734954834, "test_acc": 0.1, "lyapunov": 1.9199556487295635, "grad_norm": 0.08308332919661195, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007810416889260654, "time_sec": 38.632620334625244 }, { "epoch": 32, "train_loss": 3.526603982696533, "train_acc": 0.0987, "test_loss": 2.3026425048828125, "test_acc": 0.1, "lyapunov": 1.9197655053394835, "grad_norm": 0.08373608851321027, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894983, "time_sec": 38.6338005065918 }, { "epoch": 33, "train_loss": 3.5402134245300294, "train_acc": 0.09648, "test_loss": 2.3025889293670656, "test_acc": 0.1, "lyapunov": 1.926927990010937, "grad_norm": 0.09981834537565924, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007545207078751857, "time_sec": 38.6455602645874 }, { "epoch": 34, "train_loss": 3.5265413635253906, "train_acc": 0.09788, "test_loss": 2.302589825439453, "test_acc": 0.1, "lyapunov": 1.9196307095115448, "grad_norm": 0.08459800727870437, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508577, "time_sec": 38.652732133865356 }, { "epoch": 35, "train_loss": 3.526457656402588, "train_acc": 0.09848, "test_loss": 2.3025897277832033, "test_acc": 0.1, "lyapunov": 1.91963635930015, "grad_norm": 0.08392830107993868, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007269952498697734, "time_sec": 38.618977308273315 }, { "epoch": 36, "train_loss": 3.5264506495666503, "train_acc": 0.09836, "test_loss": 2.302591544342041, "test_acc": 0.1, "lyapunov": 1.919547389840226, "grad_norm": 0.0844841992615646, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825364, "time_sec": 38.635788917541504 }, { "epoch": 37, "train_loss": 3.525513755493164, "train_acc": 0.09824, "test_loss": 2.302587795257568, "test_acc": 0.1, "lyapunov": 1.9188998626626057, "grad_norm": 0.08511865281250128, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006985739453173903, "time_sec": 38.63599181175232 }, { "epoch": 38, "train_loss": 3.5258794207763673, "train_acc": 0.09634, "test_loss": 2.302587114715576, "test_acc": 0.1, "lyapunov": 1.9190363072983139, "grad_norm": 0.08976844520779069, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423391, "time_sec": 38.631999015808105 }, { "epoch": 39, "train_loss": 3.526812607116699, "train_acc": 0.09782, "test_loss": 2.3025868911743164, "test_acc": 0.1, "lyapunov": 1.9198928242144377, "grad_norm": 0.08338895706252505, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006693689601226458, "time_sec": 38.62815856933594 }, { "epoch": 40, "train_loss": 3.5299447924041747, "train_acc": 0.09834, "test_loss": 2.302587143325806, "test_acc": 0.1, "lyapunov": 1.9223552085554507, "grad_norm": 0.09522270183573409, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874737, "time_sec": 38.62764048576355 }, { "epoch": 41, "train_loss": 3.529573831253052, "train_acc": 0.0978, "test_loss": 2.3025870990753172, "test_acc": 0.1, "lyapunov": 1.922197810829143, "grad_norm": 0.08338290015497958, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006394955530196147, "time_sec": 38.63026428222656 }, { "epoch": 42, "train_loss": 3.5254642880249025, "train_acc": 0.09878, "test_loss": 2.302588144683838, "test_acc": 0.1, "lyapunov": 1.9188408784549256, "grad_norm": 0.08333708848875665, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824273, "time_sec": 38.63510298728943 }, { "epoch": 43, "train_loss": 3.527522850036621, "train_acc": 0.09724, "test_loss": 2.302586852264404, "test_acc": 0.1, "lyapunov": 1.920439124717127, "grad_norm": 0.08392990999765709, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006090716206982714, "time_sec": 38.61439347267151 }, { "epoch": 44, "train_loss": 3.5268155879211425, "train_acc": 0.09854, "test_loss": 2.302588026046753, "test_acc": 0.1, "lyapunov": 1.919859874583876, "grad_norm": 0.08808142140863674, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005936906572928625, "time_sec": 38.63164472579956 }, { "epoch": 45, "train_loss": 3.528644903793335, "train_acc": 0.09726, "test_loss": 2.302586632156372, "test_acc": 0.1, "lyapunov": 1.9213885017063306, "grad_norm": 0.08163685266757659, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005782172325201156, "time_sec": 38.63089060783386 }, { "epoch": 46, "train_loss": 3.5269173733520507, "train_acc": 0.09548, "test_loss": 2.302586455535889, "test_acc": 0.1, "lyapunov": 1.9199798500446408, "grad_norm": 0.08000528496736534, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821523, "time_sec": 38.636719703674316 }, { "epoch": 47, "train_loss": 3.525616721343994, "train_acc": 0.0969, "test_loss": 2.3025855419158936, "test_acc": 0.1, "lyapunov": 1.918914921753242, "grad_norm": 0.0847797082901155, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005470541566592572, "time_sec": 38.63527321815491 }, { "epoch": 48, "train_loss": 3.527122305908203, "train_acc": 0.09908, "test_loss": 2.302587979507446, "test_acc": 0.1, "lyapunov": 1.9201535523090216, "grad_norm": 0.08334551671941194, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646569, "time_sec": 38.6254460811615 }, { "epoch": 49, "train_loss": 3.529289007568359, "train_acc": 0.09836, "test_loss": 2.3025873039245606, "test_acc": 0.1, "lyapunov": 1.9219778029205243, "grad_norm": 0.08239563380139257, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005157053795390643, "time_sec": 38.63705110549927 }, { "epoch": 50, "train_loss": 3.5303411560821534, "train_acc": 0.0977, "test_loss": 2.3025870582580565, "test_acc": 0.1, "lyapunov": 1.9227478766380368, "grad_norm": 0.08162963599167514, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005000000000000002, "time_sec": 38.626914262771606 }, { "epoch": 51, "train_loss": 3.5286489057922363, "train_acc": 0.09604, "test_loss": 2.302586822128296, "test_acc": 0.1, "lyapunov": 1.9214349052180415, "grad_norm": 0.08139452605749796, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00048429462046093607, "time_sec": 38.64423418045044 }, { "epoch": 52, "train_loss": 3.525787140045166, "train_acc": 0.09778, "test_loss": 2.3025859855651856, "test_acc": 0.1, "lyapunov": 1.9190660763884444, "grad_norm": 0.08146521230474718, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004686047402353435, "time_sec": 38.6294162273407 }, { "epoch": 53, "train_loss": 3.5288507063293455, "train_acc": 0.09546, "test_loss": 2.3025855419158936, "test_acc": 0.1, "lyapunov": 1.9215699824530754, "grad_norm": 0.08218605919682316, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000452945843340743, "time_sec": 38.62653970718384 }, { "epoch": 54, "train_loss": 3.5271841695404054, "train_acc": 0.09872, "test_loss": 2.3025858070373535, "test_acc": 0.1, "lyapunov": 1.9201822860161666, "grad_norm": 0.08216715344839949, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784806, "time_sec": 38.638410806655884 }, { "epoch": 55, "train_loss": 3.526853522644043, "train_acc": 0.09744, "test_loss": 2.3025860900878907, "test_acc": 0.1, "lyapunov": 1.919959136897036, "grad_norm": 0.0817176354250303, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004217827674798847, "time_sec": 38.630091190338135 }, { "epoch": 56, "train_loss": 3.5288575717926025, "train_acc": 0.09954, "test_loss": 2.302586184310913, "test_acc": 0.1, "lyapunov": 1.921623296444983, "grad_norm": 0.08257148205256129, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00040630934270713783, "time_sec": 38.64346218109131 }, { "epoch": 57, "train_loss": 3.5272767601776125, "train_acc": 0.09642, "test_loss": 2.302586555480957, "test_acc": 0.1, "lyapunov": 1.9202661358791848, "grad_norm": 0.08293348649238423, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000390928379301729, "time_sec": 38.64233660697937 }, { "epoch": 58, "train_loss": 3.526464948577881, "train_acc": 0.09672, "test_loss": 2.3025856628417967, "test_acc": 0.1, "lyapunov": 1.9196561523105786, "grad_norm": 0.08164186959675705, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003756550564175727, "time_sec": 38.63249588012695 }, { "epoch": 59, "train_loss": 3.5295531370544433, "train_acc": 0.09774, "test_loss": 2.302585400390625, "test_acc": 0.1, "lyapunov": 1.9221740268990206, "grad_norm": 0.08246273738852085, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036050444698038553, "time_sec": 38.646018266677856 }, { "epoch": 60, "train_loss": 3.5271629650115965, "train_acc": 0.0971, "test_loss": 2.3025858444213867, "test_acc": 0.1, "lyapunov": 1.9201987954356787, "grad_norm": 0.08208001883222767, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00034549150281252655, "time_sec": 38.6309814453125 }, { "epoch": 61, "train_loss": 3.5265548262023927, "train_acc": 0.0977, "test_loss": 2.302585780715942, "test_acc": 0.1, "lyapunov": 1.9197500297785415, "grad_norm": 0.08189736323511718, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003306310398773544, "time_sec": 38.638221740722656 }, { "epoch": 62, "train_loss": 3.52600441986084, "train_acc": 0.09678, "test_loss": 2.302585761642456, "test_acc": 0.1, "lyapunov": 1.9192463177854142, "grad_norm": 0.08137598978711448, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766127, "time_sec": 38.63043713569641 }, { "epoch": 63, "train_loss": 3.5271013943481444, "train_acc": 0.09814, "test_loss": 2.302585670852661, "test_acc": 0.1, "lyapunov": 1.920157666096602, "grad_norm": 0.0823619758981674, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003014260546826097, "time_sec": 38.63147497177124 }, { "epoch": 64, "train_loss": 3.526780191192627, "train_acc": 0.09852, "test_loss": 2.302585818862915, "test_acc": 0.1, "lyapunov": 1.919904801546765, "grad_norm": 0.08022492391600272, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002871103542174637, "time_sec": 38.62516927719116 }, { "epoch": 65, "train_loss": 3.5343781797790528, "train_acc": 0.09912, "test_loss": 2.3025853904724123, "test_acc": 0.1, "lyapunov": 1.9257748550771143, "grad_norm": 0.10073329729823817, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002730047501302267, "time_sec": 38.634148836135864 }, { "epoch": 66, "train_loss": 3.5349793888092043, "train_acc": 0.09842, "test_loss": 2.3025853446960447, "test_acc": 0.1, "lyapunov": 1.9264679845336758, "grad_norm": 0.11920770311136344, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00025912316294914234, "time_sec": 38.61845135688782 }, { "epoch": 67, "train_loss": 3.526273007965088, "train_acc": 0.09544, "test_loss": 2.3025852378845215, "test_acc": 0.1, "lyapunov": 1.9194827823687697, "grad_norm": 0.08304121043671493, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002454792921248144, "time_sec": 38.626497983932495 }, { "epoch": 68, "train_loss": 3.5271414315795897, "train_acc": 0.0966, "test_loss": 2.3025850952148437, "test_acc": 0.1, "lyapunov": 1.9202514917344389, "grad_norm": 0.08574615477087318, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00023208660251050164, "time_sec": 38.627126693725586 }, { "epoch": 69, "train_loss": 3.529951874008179, "train_acc": 0.0986, "test_loss": 2.30258518447876, "test_acc": 0.1, "lyapunov": 1.9225430412365652, "grad_norm": 0.08082947961897828, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00021895831107393473, "time_sec": 38.630186319351196 }, { "epoch": 70, "train_loss": 3.526535584869385, "train_acc": 0.09668, "test_loss": 2.3025852592468263, "test_acc": 0.1, "lyapunov": 1.919725867183617, "grad_norm": 0.08274796493939703, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376356, "time_sec": 38.6431679725647 }, { "epoch": 71, "train_loss": 3.5277945655822753, "train_acc": 0.09836, "test_loss": 2.3025853775024414, "test_acc": 0.1, "lyapunov": 1.920768865843868, "grad_norm": 0.08235441909099428, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019354647317351177, "time_sec": 38.63748812675476 }, { "epoch": 72, "train_loss": 3.5274662791442872, "train_acc": 0.0948, "test_loss": 2.3025851234436034, "test_acc": 0.1, "lyapunov": 1.9204377185963, "grad_norm": 0.08364637794680509, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001812880051256552, "time_sec": 38.6381402015686 }, { "epoch": 73, "train_loss": 3.526118115386963, "train_acc": 0.09886, "test_loss": 2.302585259628296, "test_acc": 0.1, "lyapunov": 1.9193554836160995, "grad_norm": 0.0826562338509352, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016934406733817422, "time_sec": 38.65567326545715 }, { "epoch": 74, "train_loss": 3.527300643615723, "train_acc": 0.09764, "test_loss": 2.302585151672363, "test_acc": 0.1, "lyapunov": 1.9203089323190168, "grad_norm": 0.08128595818241462, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001577264470356557, "time_sec": 38.65558409690857 }, { "epoch": 75, "train_loss": 3.52685251663208, "train_acc": 0.09664, "test_loss": 2.3025852661132813, "test_acc": 0.1, "lyapunov": 1.9200191327068201, "grad_norm": 0.08404244166329763, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014644660940672634, "time_sec": 38.63766312599182 }, { "epoch": 76, "train_loss": 3.5262623787689207, "train_acc": 0.09722, "test_loss": 2.3025850158691408, "test_acc": 0.1, "lyapunov": 1.919482776271108, "grad_norm": 0.08232879952859255, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001355156862892944, "time_sec": 38.633180379867554 }, { "epoch": 77, "train_loss": 3.528319863128662, "train_acc": 0.09596, "test_loss": 2.3025850936889647, "test_acc": 0.1, "lyapunov": 1.9211895322555776, "grad_norm": 0.08358594679641423, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012494446518477025, "time_sec": 38.6444034576416 }, { "epoch": 78, "train_loss": 3.526455977935791, "train_acc": 0.09646, "test_loss": 2.3025851753234865, "test_acc": 0.1, "lyapunov": 1.919646045740913, "grad_norm": 0.0800944099425941, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210548, "time_sec": 38.63438820838928 }, { "epoch": 79, "train_loss": 3.528594108276367, "train_acc": 0.09844, "test_loss": 2.302585315704346, "test_acc": 0.1, "lyapunov": 1.9213674385529345, "grad_norm": 0.0823521435571041, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010492249381215483, "time_sec": 38.63344979286194 }, { "epoch": 80, "train_loss": 3.5273741276550292, "train_acc": 0.09784, "test_loss": 2.3025850051879884, "test_acc": 0.1, "lyapunov": 1.9203915013681592, "grad_norm": 0.0830759912493753, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252637e-05, "time_sec": 38.62626814842224 }, { "epoch": 81, "train_loss": 3.5291355400848388, "train_acc": 0.09736, "test_loss": 2.3025851634979246, "test_acc": 0.1, "lyapunov": 1.921823484818344, "grad_norm": 0.08275874029214267, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.645971286271918e-05, "time_sec": 38.62844204902649 }, { "epoch": 82, "train_loss": 3.525912507019043, "train_acc": 0.09748, "test_loss": 2.3025852321624756, "test_acc": 0.1, "lyapunov": 1.91920463874212, "grad_norm": 0.08153852660653182, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.78360372489926e-05, "time_sec": 38.653265714645386 }, { "epoch": 83, "train_loss": 3.5292207734680177, "train_acc": 0.0958, "test_loss": 2.3025851135253905, "test_acc": 0.1, "lyapunov": 1.9219502158786939, "grad_norm": 0.08350888633092267, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.962898649802815e-05, "time_sec": 38.634111642837524 }, { "epoch": 84, "train_loss": 3.5284012381744385, "train_acc": 0.09624, "test_loss": 2.30258512878418, "test_acc": 0.1, "lyapunov": 1.9212511674217556, "grad_norm": 0.08116909186786311, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806824e-05, "time_sec": 38.64353036880493 }, { "epoch": 85, "train_loss": 3.5251765769195558, "train_acc": 0.09792, "test_loss": 2.30258514251709, "test_acc": 0.1, "lyapunov": 1.918617296401802, "grad_norm": 0.07954191314548852, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.449673790581613e-05, "time_sec": 38.62560677528381 }, { "epoch": 86, "train_loss": 3.5287663554382322, "train_acc": 0.09838, "test_loss": 2.302585173034668, "test_acc": 0.1, "lyapunov": 1.9215295982482794, "grad_norm": 0.08355699198177892, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.758647376699034e-05, "time_sec": 38.65434241294861 }, { "epoch": 87, "train_loss": 3.5260034490966796, "train_acc": 0.09604, "test_loss": 2.3025851554870607, "test_acc": 0.1, "lyapunov": 1.9192945807791122, "grad_norm": 0.08149215014053633, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.112268715800956e-05, "time_sec": 38.63465094566345 }, { "epoch": 88, "train_loss": 3.5243265664672854, "train_acc": 0.09828, "test_loss": 2.302585033416748, "test_acc": 0.1, "lyapunov": 1.9179029281791824, "grad_norm": 0.08154521467921626, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.511175705587434e-05, "time_sec": 38.6289963722229 }, { "epoch": 89, "train_loss": 3.5287904942321777, "train_acc": 0.09666, "test_loss": 2.302585191345215, "test_acc": 0.1, "lyapunov": 1.9215726117648737, "grad_norm": 0.084132595254172, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.9559615522887284e-05, "time_sec": 38.642388105392456 }, { "epoch": 90, "train_loss": 3.526969603881836, "train_acc": 0.09754, "test_loss": 2.302585014343262, "test_acc": 0.1, "lyapunov": 1.920039845549542, "grad_norm": 0.0821271686806539, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.447174185242324e-05, "time_sec": 38.63814377784729 }, { "epoch": 91, "train_loss": 3.527617153930664, "train_acc": 0.09638, "test_loss": 2.302585041809082, "test_acc": 0.1, "lyapunov": 1.9205815706716474, "grad_norm": 0.08312510555513332, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.9853157161528526e-05, "time_sec": 38.61940360069275 }, { "epoch": 92, "train_loss": 3.5268433947753905, "train_acc": 0.09684, "test_loss": 2.3025852138519287, "test_acc": 0.1, "lyapunov": 1.9199492108181615, "grad_norm": 0.0823876986166593, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568452e-05, "time_sec": 38.627458810806274 }, { "epoch": 93, "train_loss": 3.53038783744812, "train_acc": 0.0982, "test_loss": 2.3025850196838378, "test_acc": 0.1, "lyapunov": 1.9228984605320885, "grad_norm": 0.08263085862758328, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.204161903062634e-05, "time_sec": 38.63483691215515 }, { "epoch": 94, "train_loss": 3.5289703980255127, "train_acc": 0.09816, "test_loss": 2.3025850566864015, "test_acc": 0.1, "lyapunov": 1.9216854218631754, "grad_norm": 0.08327210271669083, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.85637463565564e-06, "time_sec": 38.63469362258911 }, { "epoch": 95, "train_loss": 3.5277647956848144, "train_acc": 0.0995, "test_loss": 2.3025852081298828, "test_acc": 0.1, "lyapunov": 1.9207559202028357, "grad_norm": 0.08352486265414892, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.155829702431171e-06, "time_sec": 38.64616012573242 }, { "epoch": 96, "train_loss": 3.526619141845703, "train_acc": 0.09938, "test_loss": 2.3025851345062254, "test_acc": 0.1, "lyapunov": 1.9198539360709812, "grad_norm": 0.08098182122024891, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761118e-06, "time_sec": 38.62220072746277 }, { "epoch": 97, "train_loss": 3.5280892516326903, "train_acc": 0.1, "test_loss": 2.3025852352142335, "test_acc": 0.1, "lyapunov": 1.921060741100165, "grad_norm": 0.08211810367594433, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.2190176984600023e-06, "time_sec": 38.645119190216064 }, { "epoch": 98, "train_loss": 3.5287079336547853, "train_acc": 0.1, "test_loss": 2.3025850273132322, "test_acc": 0.1, "lyapunov": 1.9215380800959398, "grad_norm": 0.08325515946558669, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642206e-07, "time_sec": 38.63027763366699 }, { "epoch": 99, "train_loss": 3.5253015606689453, "train_acc": 0.1, "test_loss": 2.30258511428833, "test_acc": 0.1, "lyapunov": 1.9187132022569857, "grad_norm": 0.08193671483030009, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.467198171342e-07, "time_sec": 38.63921046257019 }, { "epoch": 100, "train_loss": 3.5272140621948243, "train_acc": 0.1, "test_loss": 2.302585135269165, "test_acc": 0.1, "lyapunov": 1.9202767503840843, "grad_norm": 0.08222655054617872, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 38.6323139667511 } ], "8": [ { "epoch": 1, "train_loss": 8.479881681365967, "train_acc": 0.15672, "test_loss": 2.162619204711914, "test_acc": 0.2125, "lyapunov": 4.108346384199684, "grad_norm": 7.697098833505723, "grad_max_sv": 6.178906440734863, "grad_min_sv": 2.761631513692464e-07, "grad_condition": 23140136.221944965, "lr": 0.0009997532801828658, "time_sec": 81.47396469116211 }, { "epoch": 2, "train_loss": 5.665244631958008, "train_acc": 0.18, "test_loss": 2.1842808677673338, "test_acc": 0.1923, "lyapunov": 3.230283256686862, "grad_norm": 5.392009012742897, "grad_max_sv": 4.110089653730393, "grad_min_sv": 1.9321651976156317e-07, "grad_condition": 21420475.323837068, "lr": 0.0009990133642141358, "time_sec": 81.45991396903992 }, { "epoch": 3, "train_loss": 5.333162035522461, "train_acc": 0.1952, "test_loss": 2.225303956604004, "test_acc": 0.167, "lyapunov": 3.1082111679379594, "grad_norm": 3.851771920219555, "grad_max_sv": 3.176962560415268, "grad_min_sv": 1.3438213457561688e-07, "grad_condition": 23879291.498504233, "lr": 0.00099778098230154, "time_sec": 81.46788787841797 }, { "epoch": 4, "train_loss": 5.171234805908203, "train_acc": 0.20002, "test_loss": 2.235258939361572, "test_acc": 0.159, "lyapunov": 3.0473744570446746, "grad_norm": 2.481126294013876, "grad_max_sv": 2.0792742133140565, "grad_min_sv": 8.9392968050106e-08, "grad_condition": 24637829.84704242, "lr": 0.000996057350657239, "time_sec": 81.47967004776001 }, { "epoch": 5, "train_loss": 5.166805406799316, "train_acc": 0.19452, "test_loss": 2.237046794128418, "test_acc": 0.1327, "lyapunov": 3.0511742223559133, "grad_norm": 1.3615579983642885, "grad_max_sv": 1.0548206314444541, "grad_min_sv": 4.5490313116403056e-08, "grad_condition": 23987300.59429905, "lr": 0.0009938441702975688, "time_sec": 81.459157705307 }, { "epoch": 6, "train_loss": 4.8697237976074215, "train_acc": 0.1737, "test_loss": 2.2830872146606445, "test_acc": 0.1253, "lyapunov": 2.8754516471072535, "grad_norm": 0.6903867745940513, "grad_max_sv": 0.41943032629787924, "grad_min_sv": 1.919375629544362e-08, "grad_condition": 22192013.87340497, "lr": 0.0009911436253643444, "time_sec": 81.48192954063416 }, { "epoch": 7, "train_loss": 4.493588522949219, "train_acc": 0.15938, "test_loss": 2.3302653469085692, "test_acc": 0.1, "lyapunov": 2.653091859939458, "grad_norm": 0.7557218960403191, "grad_max_sv": 0.26077940948307515, "grad_min_sv": 1.0986899512399616e-08, "grad_condition": 25117189.859535195, "lr": 0.0009879583809693736, "time_sec": 81.4841628074646 }, { "epoch": 8, "train_loss": 4.350341845397949, "train_acc": 0.15252, "test_loss": 2.3086660652160647, "test_acc": 0.1, "lyapunov": 2.5555299291830234, "grad_norm": 0.6250628446482196, "grad_max_sv": 0.20942260958254338, "grad_min_sv": 7.251302003297155e-09, "grad_condition": 30522570.970140863, "lr": 0.0009842915805643154, "time_sec": 81.46237683296204 }, { "epoch": 9, "train_loss": 4.145118522186279, "train_acc": 0.13274, "test_loss": 2.315164138031006, "test_acc": 0.1, "lyapunov": 2.40533269762688, "grad_norm": 0.6205908073118289, "grad_max_sv": 0.14447018823120744, "grad_min_sv": 4.4057232563565755e-09, "grad_condition": 34238562.93985257, "lr": 0.0009801468428384714, "time_sec": 81.4730293750763 }, { "epoch": 10, "train_loss": 4.078840268859863, "train_acc": 0.1284, "test_loss": 2.3138900623321534, "test_acc": 0.1, "lyapunov": 2.363016066343888, "grad_norm": 0.7930843872612708, "grad_max_sv": 0.10398251404985785, "grad_min_sv": 3.7019540950061767e-09, "grad_condition": 60913515.913623154, "lr": 0.0009755282581475767, "time_sec": 81.45200657844543 }, { "epoch": 11, "train_loss": 4.092224692230225, "train_acc": 0.1466, "test_loss": 2.312975662994385, "test_acc": 0.1, "lyapunov": 2.3754844513085795, "grad_norm": 1.1984655112922225, "grad_max_sv": 0.17450910471379757, "grad_min_sv": 5.5799074860640734e-09, "grad_condition": 13168082812.37189, "lr": 0.0009704403844771127, "time_sec": 81.45421433448792 }, { "epoch": 12, "train_loss": 4.142614550323486, "train_acc": 0.10048, "test_loss": 2.3073625778198243, "test_acc": 0.1, "lyapunov": 2.36521298623146, "grad_norm": 0.8201455961321854, "grad_max_sv": 0.06452706009149552, "grad_min_sv": 1.4042129118228878e-12, "grad_condition": 50885083514.90724, "lr": 0.0009648882429441257, "time_sec": 81.46072387695312 }, { "epoch": 13, "train_loss": 3.979385091934204, "train_acc": 0.10066, "test_loss": 2.3081630187988282, "test_acc": 0.1, "lyapunov": 2.26381984696059, "grad_norm": 0.16210184952823345, "grad_max_sv": 0.04905642978847027, "grad_min_sv": 2.7241308859756593e-12, "grad_condition": 39268609789.13625, "lr": 0.0009588773128419905, "time_sec": 81.4600670337677 }, { "epoch": 14, "train_loss": 4.013840252990723, "train_acc": 0.09774, "test_loss": 2.3071225547790526, "test_acc": 0.1, "lyapunov": 2.2779995590219717, "grad_norm": 0.2350799590612887, "grad_max_sv": 0.03584399004466832, "grad_min_sv": 2.4371194341884142e-11, "grad_condition": 24256890299.017464, "lr": 0.0009524135262330098, "time_sec": 81.45963406562805 }, { "epoch": 15, "train_loss": 3.9913157040405274, "train_acc": 0.09784, "test_loss": 2.319146055984497, "test_acc": 0.1, "lyapunov": 2.268958825894329, "grad_norm": 0.15763925383129676, "grad_max_sv": 0.009183965646661818, "grad_min_sv": 1.97946225383161e-12, "grad_condition": 8163098832.376617, "lr": 0.0009455032620941839, "time_sec": 81.44594478607178 }, { "epoch": 16, "train_loss": 3.9718331854248046, "train_acc": 0.0996, "test_loss": 2.3092525833129884, "test_acc": 0.1, "lyapunov": 2.2586230457286396, "grad_norm": 0.11766352456542575, "grad_max_sv": 0.006989215174689889, "grad_min_sv": 2.4024430389645366e-14, "grad_condition": 6504081924.260536, "lr": 0.0009381533400219318, "time_sec": 81.44390797615051 }, { "epoch": 17, "train_loss": 3.9787883277130125, "train_acc": 0.09702, "test_loss": 2.3043574817657473, "test_acc": 0.1, "lyapunov": 2.2631307922665727, "grad_norm": 0.1527010207412437, "grad_max_sv": 0.009803948854096235, "grad_min_sv": 1.4435005241224427e-33, "grad_condition": 9803948854.096233, "lr": 0.0009303710135019719, "time_sec": 81.43403100967407 }, { "epoch": 18, "train_loss": 3.9913615090942383, "train_acc": 0.09744, "test_loss": 2.3033508323669434, "test_acc": 0.1, "lyapunov": 2.269262256524752, "grad_norm": 0.11184179273021279, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009221639627510076, "time_sec": 81.42399740219116 }, { "epoch": 19, "train_loss": 3.9763801429748535, "train_acc": 0.0977, "test_loss": 2.3026752422332764, "test_acc": 0.1, "lyapunov": 2.2619051079615913, "grad_norm": 0.11713248666386221, "grad_max_sv": 0.000484072370454669, "grad_min_sv": 0.0, "grad_condition": 484072370.454669, "lr": 0.000913540287137281, "time_sec": 81.4525249004364 }, { "epoch": 20, "train_loss": 3.976750040283203, "train_acc": 0.09734, "test_loss": 2.302591667175293, "test_acc": 0.1, "lyapunov": 2.262148560770332, "grad_norm": 0.11345857984491753, "grad_max_sv": 0.004815328773111105, "grad_min_sv": 7.298523316195025e-36, "grad_condition": 4815328773.111105, "lr": 0.0009045084971874739, "time_sec": 81.51628756523132 }, { "epoch": 21, "train_loss": 3.980269993438721, "train_acc": 0.09802, "test_loss": 2.302587752532959, "test_acc": 0.1, "lyapunov": 2.264334798164075, "grad_norm": 0.13684662833237576, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008950775061878452, "time_sec": 81.45560097694397 }, { "epoch": 22, "train_loss": 3.9804648877716065, "train_acc": 0.0979, "test_loss": 2.302587752532959, "test_acc": 0.1, "lyapunov": 2.2635294013011182, "grad_norm": 0.13344079799844585, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008852566213878947, "time_sec": 81.44366526603699 }, { "epoch": 23, "train_loss": 3.9813251597595216, "train_acc": 0.09872, "test_loss": 2.302596923828125, "test_acc": 0.1, "lyapunov": 2.264318755825462, "grad_norm": 0.11240815342914404, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008750555348152298, "time_sec": 81.4700722694397 }, { "epoch": 24, "train_loss": 3.9829969465637207, "train_acc": 0.09762, "test_loss": 2.302590003967285, "test_acc": 0.1, "lyapunov": 2.2655306484388267, "grad_norm": 0.13657445352154945, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107057, "time_sec": 81.44092345237732 }, { "epoch": 25, "train_loss": 3.9867445934295653, "train_acc": 0.09768, "test_loss": 2.3025884731292723, "test_acc": 0.1, "lyapunov": 2.2683042187215117, "grad_norm": 0.13504220620651136, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008535533905932737, "time_sec": 81.44885325431824 }, { "epoch": 26, "train_loss": 4.011947896575927, "train_acc": 0.09772, "test_loss": 2.302588147735596, "test_acc": 0.1, "lyapunov": 2.2796514083052535, "grad_norm": 0.16320303411181733, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008422735529643444, "time_sec": 81.45354628562927 }, { "epoch": 27, "train_loss": 3.9786824931335447, "train_acc": 0.09896, "test_loss": 2.302594832611084, "test_acc": 0.1, "lyapunov": 2.26323458300832, "grad_norm": 0.10988564477689002, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008306559326618259, "time_sec": 81.44628882408142 }, { "epoch": 28, "train_loss": 3.977536257247925, "train_acc": 0.098, "test_loss": 2.302598391723633, "test_acc": 0.1, "lyapunov": 2.262441022926584, "grad_norm": 0.12595116922261335, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743449, "time_sec": 81.4543764591217 }, { "epoch": 29, "train_loss": 3.976567816162109, "train_acc": 0.09876, "test_loss": 2.302590633010864, "test_acc": 0.1, "lyapunov": 2.2617232262935785, "grad_norm": 0.11663224483129596, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008064535268264883, "time_sec": 81.45405316352844 }, { "epoch": 30, "train_loss": 3.98611599609375, "train_acc": 0.09902, "test_loss": 2.302588882827759, "test_acc": 0.1, "lyapunov": 2.268034580723404, "grad_norm": 0.12156603788402341, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462367, "time_sec": 81.43305087089539 }, { "epoch": 31, "train_loss": 3.973400810546875, "train_acc": 0.09778, "test_loss": 2.3025912315368653, "test_acc": 0.1, "lyapunov": 2.259550383633665, "grad_norm": 0.11416147448139306, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007810416889260654, "time_sec": 81.45837593078613 }, { "epoch": 32, "train_loss": 3.988133301086426, "train_acc": 0.0974, "test_loss": 2.3025894966125486, "test_acc": 0.1, "lyapunov": 2.2669999562870817, "grad_norm": 0.11056723038790034, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894983, "time_sec": 81.44456076622009 }, { "epoch": 33, "train_loss": 4.005648225860596, "train_acc": 0.09582, "test_loss": 2.302590217590332, "test_acc": 0.1, "lyapunov": 2.2759649180390342, "grad_norm": 0.15627582965327647, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007545207078751857, "time_sec": 81.45507860183716 }, { "epoch": 34, "train_loss": 3.979487621154785, "train_acc": 0.09842, "test_loss": 2.3025886589050293, "test_acc": 0.1, "lyapunov": 2.2636950528225324, "grad_norm": 0.11766964677730013, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508577, "time_sec": 81.40873432159424 }, { "epoch": 35, "train_loss": 3.9761420146942137, "train_acc": 0.09734, "test_loss": 2.3025886192321776, "test_acc": 0.1, "lyapunov": 2.2615554509565348, "grad_norm": 0.13516175590778773, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007269952498697734, "time_sec": 81.41994976997375 }, { "epoch": 36, "train_loss": 3.982365760269165, "train_acc": 0.09772, "test_loss": 2.302588511276245, "test_acc": 0.1, "lyapunov": 2.2654811189607584, "grad_norm": 0.11681074828605718, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825364, "time_sec": 81.44073605537415 }, { "epoch": 37, "train_loss": 4.0145159342956545, "train_acc": 0.09844, "test_loss": 2.3025877605438234, "test_acc": 0.1, "lyapunov": 2.279959214617834, "grad_norm": 0.16927419652036743, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006985739453173903, "time_sec": 81.44942951202393 }, { "epoch": 38, "train_loss": 3.9834751657104492, "train_acc": 0.0988, "test_loss": 2.3025879089355468, "test_acc": 0.1, "lyapunov": 2.26584634939423, "grad_norm": 0.14984272020285577, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423391, "time_sec": 81.45499515533447 }, { "epoch": 39, "train_loss": 4.02413849609375, "train_acc": 0.09734, "test_loss": 2.30258787689209, "test_acc": 0.1, "lyapunov": 2.286009701316619, "grad_norm": 0.22145868959770007, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006693689601226458, "time_sec": 81.45317363739014 }, { "epoch": 40, "train_loss": 3.9736411520385744, "train_acc": 0.09894, "test_loss": 2.3025887702941894, "test_acc": 0.1, "lyapunov": 2.259992800710146, "grad_norm": 0.08893647577966153, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874737, "time_sec": 81.45592546463013 }, { "epoch": 41, "train_loss": 3.976674521484375, "train_acc": 0.09844, "test_loss": 2.302586205673218, "test_acc": 0.1, "lyapunov": 2.262093958647355, "grad_norm": 0.09526075366227103, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006394955530196147, "time_sec": 81.4629635810852 }, { "epoch": 42, "train_loss": 3.9767224240112307, "train_acc": 0.09934, "test_loss": 2.3025863662719726, "test_acc": 0.1, "lyapunov": 2.2621575853098994, "grad_norm": 0.0889728077319319, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824273, "time_sec": 81.4452486038208 }, { "epoch": 43, "train_loss": 3.9843084770202637, "train_acc": 0.0983, "test_loss": 2.302587857055664, "test_acc": 0.1, "lyapunov": 2.266823678980093, "grad_norm": 0.14286833201945623, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006090716206982714, "time_sec": 81.46053290367126 }, { "epoch": 44, "train_loss": 3.978666923828125, "train_acc": 0.09862, "test_loss": 2.302588472366333, "test_acc": 0.1, "lyapunov": 2.262758489764865, "grad_norm": 0.10285858309556797, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005936906572928625, "time_sec": 81.4441590309143 }, { "epoch": 45, "train_loss": 3.984368924102783, "train_acc": 0.09714, "test_loss": 2.3025872661590574, "test_acc": 0.1, "lyapunov": 2.2663481009890662, "grad_norm": 0.11152947980914625, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005782172325201156, "time_sec": 81.43797850608826 }, { "epoch": 46, "train_loss": 3.9835290453338623, "train_acc": 0.09794, "test_loss": 2.302588889694214, "test_acc": 0.1, "lyapunov": 2.2661942069792684, "grad_norm": 0.12155880302110986, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821523, "time_sec": 81.4439845085144 }, { "epoch": 47, "train_loss": 3.976571675872803, "train_acc": 0.09746, "test_loss": 2.302587047958374, "test_acc": 0.1, "lyapunov": 2.262034943646482, "grad_norm": 0.09434388559512244, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005470541566592572, "time_sec": 81.44648504257202 }, { "epoch": 48, "train_loss": 3.978961787414551, "train_acc": 0.09674, "test_loss": 2.302586452484131, "test_acc": 0.1, "lyapunov": 2.2636160929794507, "grad_norm": 0.09388300184277713, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646569, "time_sec": 81.50625872612 }, { "epoch": 49, "train_loss": 3.9766515798950195, "train_acc": 0.09856, "test_loss": 2.302586361694336, "test_acc": 0.1, "lyapunov": 2.2621047679725512, "grad_norm": 0.08611192583269686, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005157053795390643, "time_sec": 81.42919588088989 }, { "epoch": 50, "train_loss": 3.9754750718688965, "train_acc": 0.09614, "test_loss": 2.302587022018433, "test_acc": 0.1, "lyapunov": 2.261166003049182, "grad_norm": 0.09585057441328976, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005000000000000002, "time_sec": 81.43738746643066 }, { "epoch": 51, "train_loss": 3.9752406224823, "train_acc": 0.09726, "test_loss": 2.302586801147461, "test_acc": 0.1, "lyapunov": 2.2611102423704494, "grad_norm": 0.09095072097377155, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00048429462046093607, "time_sec": 81.45784163475037 }, { "epoch": 52, "train_loss": 3.98188600982666, "train_acc": 0.0951, "test_loss": 2.302586806488037, "test_acc": 0.1, "lyapunov": 2.265076126893768, "grad_norm": 0.1123738428492386, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004686047402353435, "time_sec": 81.47153091430664 }, { "epoch": 53, "train_loss": 3.980596968536377, "train_acc": 0.0976, "test_loss": 2.3025859146118166, "test_acc": 0.1, "lyapunov": 2.2645553932775315, "grad_norm": 0.1076773200596488, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000452945843340743, "time_sec": 81.44375872612 }, { "epoch": 54, "train_loss": 3.9776349996948244, "train_acc": 0.09706, "test_loss": 2.3025868438720702, "test_acc": 0.1, "lyapunov": 2.2628720568878875, "grad_norm": 0.08828239082049001, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784806, "time_sec": 81.42411518096924 }, { "epoch": 55, "train_loss": 3.9808822979736327, "train_acc": 0.09588, "test_loss": 2.302585488128662, "test_acc": 0.1, "lyapunov": 2.2643827629821076, "grad_norm": 0.11262628002715089, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004217827674798847, "time_sec": 81.4528546333313 }, { "epoch": 56, "train_loss": 3.974801806488037, "train_acc": 0.09592, "test_loss": 2.3025861625671387, "test_acc": 0.1, "lyapunov": 2.2608287944208327, "grad_norm": 0.09195483599034024, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00040630934270713783, "time_sec": 81.44676446914673 }, { "epoch": 57, "train_loss": 3.976495365371704, "train_acc": 0.09736, "test_loss": 2.3025858879089354, "test_acc": 0.1, "lyapunov": 2.262001718096721, "grad_norm": 0.08361845913085657, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000390928379301729, "time_sec": 81.45348882675171 }, { "epoch": 58, "train_loss": 3.980894155731201, "train_acc": 0.09842, "test_loss": 2.3025855281829832, "test_acc": 0.1, "lyapunov": 2.2647068646862683, "grad_norm": 0.11991605921354555, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003756550564175727, "time_sec": 81.47408199310303 }, { "epoch": 59, "train_loss": 3.994586195449829, "train_acc": 0.0973, "test_loss": 2.3025854663848877, "test_acc": 0.1, "lyapunov": 2.27294464672313, "grad_norm": 0.18222829815312913, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036050444698038553, "time_sec": 81.44711089134216 }, { "epoch": 60, "train_loss": 3.9781198291015625, "train_acc": 0.09658, "test_loss": 2.3025856033325196, "test_acc": 0.1, "lyapunov": 2.263154449365328, "grad_norm": 0.08448254246697348, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00034549150281252655, "time_sec": 81.44161295890808 }, { "epoch": 61, "train_loss": 4.02450031616211, "train_acc": 0.0976, "test_loss": 2.302585502624512, "test_acc": 0.1, "lyapunov": 2.286170544831649, "grad_norm": 0.23432897685131301, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003306310398773544, "time_sec": 81.45745611190796 }, { "epoch": 62, "train_loss": 3.988269701385498, "train_acc": 0.09688, "test_loss": 2.3025854175567626, "test_acc": 0.1, "lyapunov": 2.267505117084669, "grad_norm": 0.10764931064603923, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766127, "time_sec": 81.45787954330444 }, { "epoch": 63, "train_loss": 3.9736854934692385, "train_acc": 0.09646, "test_loss": 2.3025857013702393, "test_acc": 0.1, "lyapunov": 2.2600014398774833, "grad_norm": 0.08382317206831051, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003014260546826097, "time_sec": 81.44196057319641 }, { "epoch": 64, "train_loss": 3.9797292990875244, "train_acc": 0.0969, "test_loss": 2.3025853332519532, "test_acc": 0.1, "lyapunov": 2.264177340680681, "grad_norm": 0.11933485737211565, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002871103542174637, "time_sec": 81.45828652381897 }, { "epoch": 65, "train_loss": 3.9763733405303956, "train_acc": 0.097, "test_loss": 2.3025854026794432, "test_acc": 0.1, "lyapunov": 2.2618614468733065, "grad_norm": 0.08601466707594763, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002730047501302267, "time_sec": 81.44515085220337 }, { "epoch": 66, "train_loss": 4.001672252197266, "train_acc": 0.09836, "test_loss": 2.302585359954834, "test_acc": 0.1, "lyapunov": 2.276178054492492, "grad_norm": 0.19097066416551475, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00025912316294914234, "time_sec": 81.44997453689575 }, { "epoch": 67, "train_loss": 3.983064818649292, "train_acc": 0.09848, "test_loss": 2.302585221862793, "test_acc": 0.1, "lyapunov": 2.2660030678410052, "grad_norm": 0.11726894505680324, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002454792921248144, "time_sec": 81.45755219459534 }, { "epoch": 68, "train_loss": 3.9874353774261473, "train_acc": 0.09726, "test_loss": 2.302585542297363, "test_acc": 0.1, "lyapunov": 2.26753244497587, "grad_norm": 0.1096052061821724, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00023208660251050164, "time_sec": 81.45092463493347 }, { "epoch": 69, "train_loss": 3.984990802612305, "train_acc": 0.09842, "test_loss": 2.3025853466033936, "test_acc": 0.1, "lyapunov": 2.2674437922894803, "grad_norm": 0.08538883278176537, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00021895831107393473, "time_sec": 81.44036960601807 }, { "epoch": 70, "train_loss": 3.9768560768127443, "train_acc": 0.09864, "test_loss": 2.3025853176116944, "test_acc": 0.1, "lyapunov": 2.262266612113894, "grad_norm": 0.0826759570118499, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376356, "time_sec": 81.44237995147705 }, { "epoch": 71, "train_loss": 3.97729412109375, "train_acc": 0.09838, "test_loss": 2.3025852783203127, "test_acc": 0.1, "lyapunov": 2.262566337195199, "grad_norm": 0.08149339121565821, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019354647317351177, "time_sec": 81.46553111076355 }, { "epoch": 72, "train_loss": 3.999013508300781, "train_acc": 0.09792, "test_loss": 2.3025853332519532, "test_acc": 0.1, "lyapunov": 2.2738718602358534, "grad_norm": 0.15690481475260892, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001812880051256552, "time_sec": 81.440505027771 }, { "epoch": 73, "train_loss": 3.9769914697265625, "train_acc": 0.09758, "test_loss": 2.302585132598877, "test_acc": 0.1, "lyapunov": 2.262345004264656, "grad_norm": 0.08468511131490652, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016934406733817422, "time_sec": 81.45508050918579 }, { "epoch": 74, "train_loss": 3.9735559133148195, "train_acc": 0.09684, "test_loss": 2.302585078430176, "test_acc": 0.1, "lyapunov": 2.2599204360981426, "grad_norm": 0.08407853053475459, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001577264470356557, "time_sec": 81.43686723709106 }, { "epoch": 75, "train_loss": 3.975616183166504, "train_acc": 0.09758, "test_loss": 2.302585101699829, "test_acc": 0.1, "lyapunov": 2.2613788644980897, "grad_norm": 0.08410718060667108, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014644660940672634, "time_sec": 81.46202492713928 }, { "epoch": 76, "train_loss": 3.9777969396972654, "train_acc": 0.09642, "test_loss": 2.302585230255127, "test_acc": 0.1, "lyapunov": 2.262849387000589, "grad_norm": 0.08412741392957411, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001355156862892944, "time_sec": 81.69426202774048 }, { "epoch": 77, "train_loss": 3.997583436126709, "train_acc": 0.09804, "test_loss": 2.3025851612091066, "test_acc": 0.1, "lyapunov": 2.272977476534636, "grad_norm": 0.19693507091470583, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012494446518477025, "time_sec": 81.47962164878845 }, { "epoch": 78, "train_loss": 3.981567749633789, "train_acc": 0.0972, "test_loss": 2.302585176086426, "test_acc": 0.1, "lyapunov": 2.2653762513719253, "grad_norm": 0.08819478927352292, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210548, "time_sec": 81.44144415855408 }, { "epoch": 79, "train_loss": 3.979712967529297, "train_acc": 0.09928, "test_loss": 2.3025852310180666, "test_acc": 0.1, "lyapunov": 2.2640710157506607, "grad_norm": 0.10900387268878003, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010492249381215483, "time_sec": 81.44691228866577 }, { "epoch": 80, "train_loss": 3.9752784634399414, "train_acc": 0.09612, "test_loss": 2.3025851806640625, "test_acc": 0.1, "lyapunov": 2.2611999310495907, "grad_norm": 0.08485114515050625, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252637e-05, "time_sec": 81.44573497772217 }, { "epoch": 81, "train_loss": 3.973998136444092, "train_acc": 0.09674, "test_loss": 2.302585205078125, "test_acc": 0.1, "lyapunov": 2.2602438634009006, "grad_norm": 0.08193297107495977, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.645971286271918e-05, "time_sec": 81.44051194190979 }, { "epoch": 82, "train_loss": 3.9795581608581543, "train_acc": 0.0974, "test_loss": 2.3025851707458496, "test_acc": 0.1, "lyapunov": 2.2642151602088947, "grad_norm": 0.08382214616673372, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.78360372489926e-05, "time_sec": 81.44579362869263 }, { "epoch": 83, "train_loss": 3.97544639793396, "train_acc": 0.0975, "test_loss": 2.3025851676940916, "test_acc": 0.1, "lyapunov": 2.261258240550985, "grad_norm": 0.0830598190151241, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.962898649802815e-05, "time_sec": 81.46574568748474 }, { "epoch": 84, "train_loss": 3.9764262825775147, "train_acc": 0.09818, "test_loss": 2.302585060119629, "test_acc": 0.1, "lyapunov": 2.2619712322264376, "grad_norm": 0.08369246247456191, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806824e-05, "time_sec": 81.45664143562317 }, { "epoch": 85, "train_loss": 3.9776910205078124, "train_acc": 0.0955, "test_loss": 2.3025851593017577, "test_acc": 0.1, "lyapunov": 2.2629058550080985, "grad_norm": 0.08247891269837844, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.449673790581613e-05, "time_sec": 81.461270570755 }, { "epoch": 86, "train_loss": 3.9771215029907228, "train_acc": 0.09536, "test_loss": 2.3025850746154783, "test_acc": 0.1, "lyapunov": 2.2625219870711226, "grad_norm": 0.08304329059000737, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.758647376699034e-05, "time_sec": 81.45261931419373 }, { "epoch": 87, "train_loss": 3.9780111279296877, "train_acc": 0.09718, "test_loss": 2.3025850124359133, "test_acc": 0.1, "lyapunov": 2.263096221572603, "grad_norm": 0.08168556680409891, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.112268715800956e-05, "time_sec": 81.47083902359009 }, { "epoch": 88, "train_loss": 3.975586996154785, "train_acc": 0.09506, "test_loss": 2.3025851093292236, "test_acc": 0.1, "lyapunov": 2.261420638360026, "grad_norm": 0.08585199329222436, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.511175705587434e-05, "time_sec": 81.46594524383545 }, { "epoch": 89, "train_loss": 3.9770257449340822, "train_acc": 0.0982, "test_loss": 2.3025851146698, "test_acc": 0.1, "lyapunov": 2.262422331153889, "grad_norm": 0.08469063518506169, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.9559615522887284e-05, "time_sec": 81.46577405929565 }, { "epoch": 90, "train_loss": 3.973931856689453, "train_acc": 0.09746, "test_loss": 2.3025850677490234, "test_acc": 0.1, "lyapunov": 2.2602365346210997, "grad_norm": 0.08267580569635262, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.447174185242324e-05, "time_sec": 81.45771622657776 }, { "epoch": 91, "train_loss": 3.9777387670898436, "train_acc": 0.09732, "test_loss": 2.3025851654052736, "test_acc": 0.1, "lyapunov": 2.262757078765908, "grad_norm": 0.10473963211370652, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.9853157161528526e-05, "time_sec": 81.46830105781555 }, { "epoch": 92, "train_loss": 3.973895709075928, "train_acc": 0.09754, "test_loss": 2.302585176086426, "test_acc": 0.1, "lyapunov": 2.2601819568887698, "grad_norm": 0.08524438116449506, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568452e-05, "time_sec": 81.45872473716736 }, { "epoch": 93, "train_loss": 3.975780742340088, "train_acc": 0.09832, "test_loss": 2.302585258483887, "test_acc": 0.1, "lyapunov": 2.261494060916364, "grad_norm": 0.08296746372602809, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.204161903062634e-05, "time_sec": 81.44344329833984 }, { "epoch": 94, "train_loss": 3.9749393853759765, "train_acc": 0.099, "test_loss": 2.3025851181030275, "test_acc": 0.1, "lyapunov": 2.2609141049787516, "grad_norm": 0.081703214219651, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.85637463565564e-06, "time_sec": 81.47197723388672 }, { "epoch": 95, "train_loss": 3.977360173110962, "train_acc": 0.09844, "test_loss": 2.3025852035522463, "test_acc": 0.1, "lyapunov": 2.2626446403200973, "grad_norm": 0.08370580659845218, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.155829702431171e-06, "time_sec": 81.4649875164032 }, { "epoch": 96, "train_loss": 3.9748195641326904, "train_acc": 0.09918, "test_loss": 2.3025851348876953, "test_acc": 0.1, "lyapunov": 2.2608655974688125, "grad_norm": 0.08506351899121649, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761118e-06, "time_sec": 81.45548796653748 }, { "epoch": 97, "train_loss": 3.977184408874512, "train_acc": 0.09888, "test_loss": 2.3025851238250734, "test_acc": 0.1, "lyapunov": 2.262512852163876, "grad_norm": 0.08383579924614167, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.2190176984600023e-06, "time_sec": 81.4503653049469 }, { "epoch": 98, "train_loss": 3.979651080627441, "train_acc": 0.1, "test_loss": 2.3025852249145506, "test_acc": 0.1, "lyapunov": 2.264271725778994, "grad_norm": 0.08181479722385572, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642206e-07, "time_sec": 81.46501636505127 }, { "epoch": 99, "train_loss": 3.9744724880981446, "train_acc": 0.1, "test_loss": 2.302585131072998, "test_acc": 0.1, "lyapunov": 2.260578519547992, "grad_norm": 0.08286890329554125, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.467198171342e-07, "time_sec": 81.44538688659668 }, { "epoch": 100, "train_loss": 3.9755064764404295, "train_acc": 0.1, "test_loss": 2.302585161590576, "test_acc": 0.1, "lyapunov": 2.2613274374276475, "grad_norm": 0.08253103448725845, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 81.44115138053894 } ], "12": [ { "epoch": 1, "train_loss": 11.514268187866211, "train_acc": 0.12322, "test_loss": 2.335220721435547, "test_acc": 0.1082, "lyapunov": 5.094494405609872, "grad_norm": 6.68472372840091, "grad_max_sv": 5.768041110038757, "grad_min_sv": 2.425695402763495e-07, "grad_condition": 23767971.115653183, "lr": 0.0009997532801828658, "time_sec": 124.28109288215637 }, { "epoch": 2, "train_loss": 6.767582432556153, "train_acc": 0.13338, "test_loss": 2.3135711360931395, "test_acc": 0.1058, "lyapunov": 3.703414491375389, "grad_norm": 4.437490608687784, "grad_max_sv": 3.688317948579788, "grad_min_sv": 1.6068337682639822e-07, "grad_condition": 23679624.47851156, "lr": 0.0009990133642141358, "time_sec": 124.28083038330078 }, { "epoch": 3, "train_loss": 6.359151521911621, "train_acc": 0.1371, "test_loss": 2.3046204761505127, "test_acc": 0.1017, "lyapunov": 3.53740519087028, "grad_norm": 3.3992685611612004, "grad_max_sv": 3.1906665176153184, "grad_min_sv": 1.0806052515022202e-07, "grad_condition": 30020073.39935509, "lr": 0.00099778098230154, "time_sec": 124.26130867004395 }, { "epoch": 4, "train_loss": 5.680015151367187, "train_acc": 0.12346, "test_loss": 2.4307143615722655, "test_acc": 0.0946, "lyapunov": 3.2194143725783015, "grad_norm": 3.6284679983008856, "grad_max_sv": 2.3083297662011844, "grad_min_sv": 7.267783242878633e-08, "grad_condition": 28802302.157710887, "lr": 0.000996057350657239, "time_sec": 124.2893226146698 }, { "epoch": 5, "train_loss": 5.515282614440918, "train_acc": 0.11878, "test_loss": 2.3333636627197265, "test_acc": 0.0806, "lyapunov": 3.1298821100493526, "grad_norm": 2.1440857096164527, "grad_max_sv": 1.8293321043252946, "grad_min_sv": 6.11613814704981e-08, "grad_condition": 30298382.919277746, "lr": 0.0009938441702975688, "time_sec": 124.24556708335876 }, { "epoch": 6, "train_loss": 4.830215334472657, "train_acc": 0.10662, "test_loss": 2.3030837219238283, "test_acc": 0.1, "lyapunov": 2.7727705700623106, "grad_norm": 2.350059460657985, "grad_max_sv": 1.5110829517245292, "grad_min_sv": 2.7742502849842366e-08, "grad_condition": 415971679.7996719, "lr": 0.0009911436253643444, "time_sec": 124.2670316696167 }, { "epoch": 7, "train_loss": 5.0002188845825195, "train_acc": 0.1014, "test_loss": 2.306517247772217, "test_acc": 0.1, "lyapunov": 2.8697540314910968, "grad_norm": 4.791639177202153, "grad_max_sv": 0.7900435705131315, "grad_min_sv": 1.012708673176853e-08, "grad_condition": 1185811132.9619708, "lr": 0.0009879583809693736, "time_sec": 124.2431480884552 }, { "epoch": 8, "train_loss": 5.872336234741211, "train_acc": 0.10816, "test_loss": 2.3033512046813964, "test_acc": 0.1, "lyapunov": 3.2996887185079666, "grad_norm": 4.562165296743471, "grad_max_sv": 0.4824362076822354, "grad_min_sv": 1.352856967967285e-08, "grad_condition": 33563973.110157445, "lr": 0.0009842915805643154, "time_sec": 124.24206638336182 }, { "epoch": 9, "train_loss": 5.207491922912598, "train_acc": 0.1015, "test_loss": 2.302657497024536, "test_acc": 0.1, "lyapunov": 2.982921624732444, "grad_norm": 1.2857988530859297, "grad_max_sv": 0.4782970450818539, "grad_min_sv": 6.14909029240993e-09, "grad_condition": 17001336844.82257, "lr": 0.0009801468428384714, "time_sec": 124.2599868774414 }, { "epoch": 10, "train_loss": 5.278977078552246, "train_acc": 0.11042, "test_loss": 2.303682248687744, "test_acc": 0.1, "lyapunov": 3.0210835842220374, "grad_norm": 2.219210747930246, "grad_max_sv": 0.26804067082703115, "grad_min_sv": 5.793725242549423e-09, "grad_condition": 7080161076.764597, "lr": 0.0009755282581475767, "time_sec": 124.2449324131012 }, { "epoch": 11, "train_loss": 4.803467753601074, "train_acc": 0.1012, "test_loss": 4.169252464294433, "test_acc": 0.1, "lyapunov": 2.77325821654571, "grad_norm": 2.127622649938152, "grad_max_sv": 0.1682983461767435, "grad_min_sv": 5.603680153853458e-10, "grad_condition": 68373983123.414894, "lr": 0.0009704403844771127, "time_sec": 124.30126142501831 }, { "epoch": 12, "train_loss": 4.544517149658203, "train_acc": 0.09926, "test_loss": 4.290980886840821, "test_acc": 0.1, "lyapunov": 2.62944141068422, "grad_norm": 1.638854096476257, "grad_max_sv": 0.07512564162607305, "grad_min_sv": 2.6490731026315825e-12, "grad_condition": 54196459261.33328, "lr": 0.0009648882429441257, "time_sec": 124.24927043914795 }, { "epoch": 13, "train_loss": 4.369602390441894, "train_acc": 0.09752, "test_loss": 4.109600519561767, "test_acc": 0.1, "lyapunov": 2.5177556279370243, "grad_norm": 2.133122078616872, "grad_max_sv": 0.09587469333782792, "grad_min_sv": 2.093604774056981e-12, "grad_condition": 86094204980.57991, "lr": 0.0009588773128419905, "time_sec": 124.26178216934204 }, { "epoch": 14, "train_loss": 4.34119681640625, "train_acc": 0.09926, "test_loss": 4.199708403778076, "test_acc": 0.1, "lyapunov": 2.495693293373908, "grad_norm": 2.708849611541162, "grad_max_sv": 0.09101940747350454, "grad_min_sv": 8.368649587364072e-14, "grad_condition": 87173383288.77208, "lr": 0.0009524135262330098, "time_sec": 124.24493861198425 }, { "epoch": 15, "train_loss": 5.13457500289917, "train_acc": 0.10424, "test_loss": 2.308458815765381, "test_acc": 0.1, "lyapunov": 2.9219820334783297, "grad_norm": 3.354402938679459, "grad_max_sv": 0.09543408825993538, "grad_min_sv": 1.3719995468877692e-10, "grad_condition": 59504120268.59434, "lr": 0.0009455032620941839, "time_sec": 124.29389190673828 }, { "epoch": 16, "train_loss": 5.3248897048950194, "train_acc": 0.10296, "test_loss": 2.302912854766846, "test_acc": 0.1, "lyapunov": 2.9764596306149613, "grad_norm": 0.6322085012676749, "grad_max_sv": 0.053145987424068154, "grad_min_sv": 3.2089368939156336e-11, "grad_condition": 21592510035.150898, "lr": 0.0009381533400219318, "time_sec": 124.22647547721863 }, { "epoch": 17, "train_loss": 4.330915478057861, "train_acc": 0.09936, "test_loss": 2.3026626167297364, "test_acc": 0.1, "lyapunov": 2.493599863613353, "grad_norm": 0.20813626461361764, "grad_max_sv": 0.0220638582482934, "grad_min_sv": 5.079951297939575e-13, "grad_condition": 7528215997.404785, "lr": 0.0009303710135019719, "time_sec": 124.25075626373291 }, { "epoch": 18, "train_loss": 4.329695655975342, "train_acc": 0.09802, "test_loss": 2.3026026527404784, "test_acc": 0.1, "lyapunov": 2.4943465003577034, "grad_norm": 0.28764831256555634, "grad_max_sv": 0.00430559329688549, "grad_min_sv": 1.0630859058082507e-17, "grad_condition": 4303763188.890272, "lr": 0.0009221639627510076, "time_sec": 124.26908159255981 }, { "epoch": 19, "train_loss": 4.449291636352539, "train_acc": 0.09546, "test_loss": 2.3025916465759275, "test_acc": 0.1, "lyapunov": 2.5493475122524956, "grad_norm": 0.286977076303005, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000913540287137281, "time_sec": 124.22392654418945 }, { "epoch": 20, "train_loss": 4.275282980957031, "train_acc": 0.09758, "test_loss": 2.3025943778991698, "test_acc": 0.1, "lyapunov": 2.4641005602639043, "grad_norm": 0.11226214403634883, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0009045084971874739, "time_sec": 124.30651044845581 }, { "epoch": 21, "train_loss": 4.299091949005127, "train_acc": 0.09792, "test_loss": 2.30259245262146, "test_acc": 0.1, "lyapunov": 2.477661563917194, "grad_norm": 0.12888554972749486, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008950775061878452, "time_sec": 124.23446798324585 }, { "epoch": 22, "train_loss": 4.315002240905762, "train_acc": 0.0975, "test_loss": 2.3025940551757813, "test_acc": 0.1, "lyapunov": 2.4848342008907776, "grad_norm": 0.13926908971905202, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008852566213878947, "time_sec": 124.30266809463501 }, { "epoch": 23, "train_loss": 4.362473590087891, "train_acc": 0.09968, "test_loss": 2.3025879684448243, "test_acc": 0.1, "lyapunov": 2.508172784619929, "grad_norm": 0.25147158848993745, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008750555348152298, "time_sec": 124.24051856994629 }, { "epoch": 24, "train_loss": 4.361022654266358, "train_acc": 0.09674, "test_loss": 2.3025897010803225, "test_acc": 0.1, "lyapunov": 2.5060998808087596, "grad_norm": 0.25289701667178555, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008644843137107057, "time_sec": 124.22614932060242 }, { "epoch": 25, "train_loss": 4.292231715545654, "train_acc": 0.098, "test_loss": 2.3025892387390137, "test_acc": 0.1, "lyapunov": 2.4726591543163483, "grad_norm": 0.15846202884892668, "grad_max_sv": 0.007139207795262337, "grad_min_sv": 1.1884213096035809e-14, "grad_condition": 5768863374.104107, "lr": 0.0008535533905932737, "time_sec": 124.29175138473511 }, { "epoch": 26, "train_loss": 4.278334856414795, "train_acc": 0.09952, "test_loss": 2.302597050857544, "test_acc": 0.1, "lyapunov": 2.46608062229498, "grad_norm": 0.09871518957397614, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008422735529643444, "time_sec": 124.22811436653137 }, { "epoch": 27, "train_loss": 4.279530144348144, "train_acc": 0.09882, "test_loss": 2.3025887565612795, "test_acc": 0.1, "lyapunov": 2.466456468757766, "grad_norm": 0.09728576577451334, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008306559326618259, "time_sec": 124.25813937187195 }, { "epoch": 28, "train_loss": 4.276873157348633, "train_acc": 0.0965, "test_loss": 2.302586852264404, "test_acc": 0.1, "lyapunov": 2.4651820092554897, "grad_norm": 0.09336828927700111, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743449, "time_sec": 124.22499465942383 }, { "epoch": 29, "train_loss": 4.274294167022705, "train_acc": 0.09674, "test_loss": 2.302587184906006, "test_acc": 0.1, "lyapunov": 2.4635079608244053, "grad_norm": 0.08132883703681491, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008064535268264883, "time_sec": 124.26223015785217 }, { "epoch": 30, "train_loss": 4.3161706869506835, "train_acc": 0.09742, "test_loss": 2.302589612197876, "test_acc": 0.1, "lyapunov": 2.4838878163291365, "grad_norm": 0.1244076499240839, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007938926261462367, "time_sec": 124.22068643569946 }, { "epoch": 31, "train_loss": 4.2865172996520995, "train_acc": 0.09864, "test_loss": 2.3025933723449707, "test_acc": 0.1, "lyapunov": 2.4704265179841416, "grad_norm": 0.11325710428703713, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007810416889260654, "time_sec": 124.27307343482971 }, { "epoch": 32, "train_loss": 4.276113499755859, "train_acc": 0.09876, "test_loss": 2.302595587158203, "test_acc": 0.1, "lyapunov": 2.464605447276474, "grad_norm": 0.11188150655123451, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894983, "time_sec": 124.21617436408997 }, { "epoch": 33, "train_loss": 4.390245020904541, "train_acc": 0.09734, "test_loss": 2.302589817047119, "test_acc": 0.1, "lyapunov": 2.5185477038478608, "grad_norm": 0.2703519117597579, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007545207078751857, "time_sec": 124.22293186187744 }, { "epoch": 34, "train_loss": 4.350401836242676, "train_acc": 0.09758, "test_loss": 2.302588123321533, "test_acc": 0.1, "lyapunov": 2.4999206596628176, "grad_norm": 0.21853702579717843, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508577, "time_sec": 124.26609373092651 }, { "epoch": 35, "train_loss": 4.305715147399902, "train_acc": 0.09856, "test_loss": 2.302589534378052, "test_acc": 0.1, "lyapunov": 2.4810556158080432, "grad_norm": 0.17605927419881373, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007269952498697734, "time_sec": 124.22794723510742 }, { "epoch": 36, "train_loss": 4.305906265258789, "train_acc": 0.09718, "test_loss": 2.302591007232666, "test_acc": 0.1, "lyapunov": 2.477643119709571, "grad_norm": 0.1236420897514881, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825364, "time_sec": 124.26314496994019 }, { "epoch": 37, "train_loss": 4.27584158996582, "train_acc": 0.0968, "test_loss": 2.302587622451782, "test_acc": 0.1, "lyapunov": 2.464479011038075, "grad_norm": 0.09532844351778941, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006985739453173903, "time_sec": 124.25255799293518 }, { "epoch": 38, "train_loss": 4.283268468475342, "train_acc": 0.097, "test_loss": 2.302587129211426, "test_acc": 0.1, "lyapunov": 2.4685643030249556, "grad_norm": 0.12053745808537034, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423391, "time_sec": 124.26603984832764 }, { "epoch": 39, "train_loss": 4.340071802978516, "train_acc": 0.09756, "test_loss": 2.302587187576294, "test_acc": 0.1, "lyapunov": 2.496372491807279, "grad_norm": 0.2265015040889252, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006693689601226458, "time_sec": 124.26093554496765 }, { "epoch": 40, "train_loss": 4.285524172973632, "train_acc": 0.0976, "test_loss": 2.302589253234863, "test_acc": 0.1, "lyapunov": 2.4703913722806576, "grad_norm": 0.12837922155849044, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874737, "time_sec": 124.23279547691345 }, { "epoch": 41, "train_loss": 4.353975823822021, "train_acc": 0.0984, "test_loss": 2.3025891468048094, "test_acc": 0.1, "lyapunov": 2.502122705854723, "grad_norm": 0.31834434179235455, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006394955530196147, "time_sec": 124.27406620979309 }, { "epoch": 42, "train_loss": 4.285235863494873, "train_acc": 0.0975, "test_loss": 2.3025873653411866, "test_acc": 0.1, "lyapunov": 2.4699011251444705, "grad_norm": 0.16460675806479913, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824273, "time_sec": 124.23745155334473 }, { "epoch": 43, "train_loss": 4.273813045043945, "train_acc": 0.09694, "test_loss": 2.3025889190673827, "test_acc": 0.1, "lyapunov": 2.463189967148139, "grad_norm": 0.09609475828794435, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006090716206982714, "time_sec": 124.27437806129456 }, { "epoch": 44, "train_loss": 4.297922962646484, "train_acc": 0.09686, "test_loss": 2.3025868633270266, "test_acc": 0.1, "lyapunov": 2.474009756541923, "grad_norm": 0.14502465560049782, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005936906572928625, "time_sec": 124.22268414497375 }, { "epoch": 45, "train_loss": 4.279574555053711, "train_acc": 0.09652, "test_loss": 2.3025878047943116, "test_acc": 0.1, "lyapunov": 2.4667322599064665, "grad_norm": 0.12003136414158579, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005782172325201156, "time_sec": 124.28323554992676 }, { "epoch": 46, "train_loss": 4.273971158905029, "train_acc": 0.0966, "test_loss": 2.302587424468994, "test_acc": 0.1, "lyapunov": 2.463305209908644, "grad_norm": 0.09172584937965118, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821523, "time_sec": 124.20362710952759 }, { "epoch": 47, "train_loss": 4.313593041381836, "train_acc": 0.09574, "test_loss": 2.302586856460571, "test_acc": 0.1, "lyapunov": 2.4801262095761114, "grad_norm": 0.15167690922053198, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005470541566592572, "time_sec": 124.29144883155823 }, { "epoch": 48, "train_loss": 4.295382699737549, "train_acc": 0.09748, "test_loss": 2.302586772155762, "test_acc": 0.1, "lyapunov": 2.4740971671345897, "grad_norm": 0.10879569327624422, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646569, "time_sec": 124.23017454147339 }, { "epoch": 49, "train_loss": 4.2751529647827144, "train_acc": 0.09936, "test_loss": 2.3025859580993653, "test_acc": 0.1, "lyapunov": 2.4640432062661253, "grad_norm": 0.10568439425734225, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005157053795390643, "time_sec": 124.25622701644897 }, { "epoch": 50, "train_loss": 4.273743729553223, "train_acc": 0.0957, "test_loss": 2.3025863090515135, "test_acc": 0.1, "lyapunov": 2.4630955387564266, "grad_norm": 0.11615112587060138, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005000000000000002, "time_sec": 124.27268052101135 }, { "epoch": 51, "train_loss": 4.280425806427002, "train_acc": 0.09628, "test_loss": 2.302586248397827, "test_acc": 0.1, "lyapunov": 2.466461474938161, "grad_norm": 0.10654878565362114, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00048429462046093607, "time_sec": 124.24109268188477 }, { "epoch": 52, "train_loss": 4.279801727294922, "train_acc": 0.09702, "test_loss": 2.3025866828918455, "test_acc": 0.1, "lyapunov": 2.4669952484043054, "grad_norm": 0.130514829251149, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004686047402353435, "time_sec": 124.26980781555176 }, { "epoch": 53, "train_loss": 4.315970222320557, "train_acc": 0.09704, "test_loss": 2.3025870681762695, "test_acc": 0.1, "lyapunov": 2.484521316445392, "grad_norm": 0.1939414239261272, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000452945843340743, "time_sec": 124.22718167304993 }, { "epoch": 54, "train_loss": 4.311761430969239, "train_acc": 0.09862, "test_loss": 2.3025857872009277, "test_acc": 0.1, "lyapunov": 2.482763496506245, "grad_norm": 0.18263667447361673, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784806, "time_sec": 124.2686333656311 }, { "epoch": 55, "train_loss": 4.277025068054199, "train_acc": 0.09778, "test_loss": 2.3025857639312743, "test_acc": 0.1, "lyapunov": 2.465040735576464, "grad_norm": 0.09424723224869033, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004217827674798847, "time_sec": 124.23272252082825 }, { "epoch": 56, "train_loss": 4.308205063934326, "train_acc": 0.0989, "test_loss": 2.3025861671447756, "test_acc": 0.1, "lyapunov": 2.4804823679082535, "grad_norm": 0.20788469844558666, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00040630934270713783, "time_sec": 124.45265817642212 }, { "epoch": 57, "train_loss": 4.282971714477539, "train_acc": 0.09876, "test_loss": 2.3025856742858886, "test_acc": 0.1, "lyapunov": 2.4687917086169544, "grad_norm": 0.1374470775631024, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000390928379301729, "time_sec": 124.2466242313385 }, { "epoch": 58, "train_loss": 4.311033409729004, "train_acc": 0.09662, "test_loss": 2.302585438156128, "test_acc": 0.1, "lyapunov": 2.4805221582007837, "grad_norm": 0.15017627742331574, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003756550564175727, "time_sec": 124.22827982902527 }, { "epoch": 59, "train_loss": 4.29637522354126, "train_acc": 0.09756, "test_loss": 2.302585637664795, "test_acc": 0.1, "lyapunov": 2.4749210880845403, "grad_norm": 0.1570135955415664, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036050444698038553, "time_sec": 124.30038142204285 }, { "epoch": 60, "train_loss": 4.307900915527344, "train_acc": 0.09804, "test_loss": 2.302586008834839, "test_acc": 0.1, "lyapunov": 2.4804043434465024, "grad_norm": 0.21537262268091628, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00034549150281252655, "time_sec": 124.21648406982422 }, { "epoch": 61, "train_loss": 4.294828899230957, "train_acc": 0.09696, "test_loss": 2.302585659408569, "test_acc": 0.1, "lyapunov": 2.474180576441538, "grad_norm": 0.15175328138376964, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003306310398773544, "time_sec": 124.26800394058228 }, { "epoch": 62, "train_loss": 4.27745719039917, "train_acc": 0.09794, "test_loss": 2.302585639190674, "test_acc": 0.1, "lyapunov": 2.465500669406198, "grad_norm": 0.10570315629890674, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766127, "time_sec": 124.23925018310547 }, { "epoch": 63, "train_loss": 4.2727640603637695, "train_acc": 0.09586, "test_loss": 2.3025855934143067, "test_acc": 0.1, "lyapunov": 2.4626387360760624, "grad_norm": 0.0890330369346984, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003014260546826097, "time_sec": 124.27016854286194 }, { "epoch": 64, "train_loss": 4.272457419738769, "train_acc": 0.09604, "test_loss": 2.3025855697631834, "test_acc": 0.1, "lyapunov": 2.4623735072972526, "grad_norm": 0.0847950891199477, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002871103542174637, "time_sec": 124.20920252799988 }, { "epoch": 65, "train_loss": 4.273480668334961, "train_acc": 0.09808, "test_loss": 2.302585276031494, "test_acc": 0.1, "lyapunov": 2.4630366255865073, "grad_norm": 0.08372012214032937, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002730047501302267, "time_sec": 124.22656655311584 }, { "epoch": 66, "train_loss": 4.307428127746582, "train_acc": 0.09712, "test_loss": 2.302585486602783, "test_acc": 0.1, "lyapunov": 2.4764473944368874, "grad_norm": 0.12238051774317063, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00025912316294914234, "time_sec": 124.28961944580078 }, { "epoch": 67, "train_loss": 4.310281341094971, "train_acc": 0.09792, "test_loss": 2.3025853305816653, "test_acc": 0.1, "lyapunov": 2.480989251295319, "grad_norm": 0.27019424894200594, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002454792921248144, "time_sec": 124.25288558006287 }, { "epoch": 68, "train_loss": 4.282535659484863, "train_acc": 0.09756, "test_loss": 2.3025853900909423, "test_acc": 0.1, "lyapunov": 2.4676397261412246, "grad_norm": 0.1281762106524609, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00023208660251050164, "time_sec": 124.26717019081116 }, { "epoch": 69, "train_loss": 4.276787458190918, "train_acc": 0.09688, "test_loss": 2.3025852905273436, "test_acc": 0.1, "lyapunov": 2.4651669858361753, "grad_norm": 0.08124252440804115, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00021895831107393473, "time_sec": 124.23096060752869 }, { "epoch": 70, "train_loss": 4.28195741897583, "train_acc": 0.09668, "test_loss": 2.302585355377197, "test_acc": 0.1, "lyapunov": 2.468135183729479, "grad_norm": 0.11112746909721634, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376356, "time_sec": 124.27119207382202 }, { "epoch": 71, "train_loss": 4.284729679412842, "train_acc": 0.09706, "test_loss": 2.302585294342041, "test_acc": 0.1, "lyapunov": 2.469655635716665, "grad_norm": 0.12307199730963861, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019354647317351177, "time_sec": 124.23093914985657 }, { "epoch": 72, "train_loss": 4.276600415039063, "train_acc": 0.09806, "test_loss": 2.3025852252960206, "test_acc": 0.1, "lyapunov": 2.464849721440269, "grad_norm": 0.12908363321506647, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001812880051256552, "time_sec": 124.25842094421387 }, { "epoch": 73, "train_loss": 4.3069706353759765, "train_acc": 0.09654, "test_loss": 2.3025852447509765, "test_acc": 0.1, "lyapunov": 2.479751230810609, "grad_norm": 0.183601868909449, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016934406733817422, "time_sec": 124.21842932701111 }, { "epoch": 74, "train_loss": 4.287112475280762, "train_acc": 0.09722, "test_loss": 2.302585179901123, "test_acc": 0.1, "lyapunov": 2.4702408582048343, "grad_norm": 0.1331148526919891, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001577264470356557, "time_sec": 124.22039604187012 }, { "epoch": 75, "train_loss": 4.271034491882324, "train_acc": 0.09664, "test_loss": 2.3025851165771485, "test_acc": 0.1, "lyapunov": 2.461448823704439, "grad_norm": 0.08255701875769623, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014644660940672634, "time_sec": 124.30420184135437 }, { "epoch": 76, "train_loss": 4.272865072021484, "train_acc": 0.09542, "test_loss": 2.302585235977173, "test_acc": 0.1, "lyapunov": 2.462638800101512, "grad_norm": 0.08790859271963604, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001355156862892944, "time_sec": 124.23553800582886 }, { "epoch": 77, "train_loss": 4.271533363189698, "train_acc": 0.09712, "test_loss": 2.3025852149963377, "test_acc": 0.1, "lyapunov": 2.4617462914313197, "grad_norm": 0.08471091537010327, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012494446518477025, "time_sec": 124.25954508781433 }, { "epoch": 78, "train_loss": 4.290692696685791, "train_acc": 0.09754, "test_loss": 2.302585163116455, "test_acc": 0.1, "lyapunov": 2.470475591357102, "grad_norm": 0.10652401748252295, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210548, "time_sec": 124.22494149208069 }, { "epoch": 79, "train_loss": 4.274790961608887, "train_acc": 0.09758, "test_loss": 2.302585228347778, "test_acc": 0.1, "lyapunov": 2.4638520756645885, "grad_norm": 0.08078835262733591, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010492249381215483, "time_sec": 124.29019331932068 }, { "epoch": 80, "train_loss": 4.272836723175049, "train_acc": 0.09616, "test_loss": 2.3025851444244383, "test_acc": 0.1, "lyapunov": 2.462624883407827, "grad_norm": 0.08161990901444113, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252637e-05, "time_sec": 124.22851657867432 }, { "epoch": 81, "train_loss": 4.39987655090332, "train_acc": 0.0985, "test_loss": 2.302585282897949, "test_acc": 0.1, "lyapunov": 2.5367127757548067, "grad_norm": 0.6635822194594717, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.645971286271918e-05, "time_sec": 124.23617506027222 }, { "epoch": 82, "train_loss": 4.297471022949218, "train_acc": 0.0953, "test_loss": 2.3025852149963377, "test_acc": 0.1, "lyapunov": 2.475090144540343, "grad_norm": 0.729945935366233, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.78360372489926e-05, "time_sec": 124.25805640220642 }, { "epoch": 83, "train_loss": 4.269278663024902, "train_acc": 0.09916, "test_loss": 2.3025850776672363, "test_acc": 0.1, "lyapunov": 2.4603407303695484, "grad_norm": 0.09631779246548546, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.962898649802815e-05, "time_sec": 124.23541116714478 }, { "epoch": 84, "train_loss": 4.2767918655395505, "train_acc": 0.09902, "test_loss": 2.3025851837158204, "test_acc": 0.1, "lyapunov": 2.464642455815659, "grad_norm": 0.15914456443799777, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806824e-05, "time_sec": 124.2600998878479 }, { "epoch": 85, "train_loss": 4.275007407989502, "train_acc": 0.09774, "test_loss": 2.302585231781006, "test_acc": 0.1, "lyapunov": 2.4639958829221213, "grad_norm": 0.08948000358835351, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.449673790581613e-05, "time_sec": 124.19096970558167 }, { "epoch": 86, "train_loss": 4.282883452606201, "train_acc": 0.0984, "test_loss": 2.3025849563598633, "test_acc": 0.1, "lyapunov": 2.46685717294893, "grad_norm": 0.20955582940776452, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.758647376699034e-05, "time_sec": 124.28308463096619 }, { "epoch": 87, "train_loss": 4.273255398712158, "train_acc": 0.09732, "test_loss": 2.3025850818634033, "test_acc": 0.1, "lyapunov": 2.4628877334887416, "grad_norm": 0.08251896757547691, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.112268715800956e-05, "time_sec": 124.24707794189453 }, { "epoch": 88, "train_loss": 4.27318275390625, "train_acc": 0.09818, "test_loss": 2.3025852210998536, "test_acc": 0.1, "lyapunov": 2.462852593273153, "grad_norm": 0.08488796189115587, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.511175705587434e-05, "time_sec": 124.27159857749939 }, { "epoch": 89, "train_loss": 4.274446720886231, "train_acc": 0.0964, "test_loss": 2.3025852279663086, "test_acc": 0.1, "lyapunov": 2.463662301792818, "grad_norm": 0.08254333748035417, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.9559615522887284e-05, "time_sec": 124.20991706848145 }, { "epoch": 90, "train_loss": 4.282081894989013, "train_acc": 0.09898, "test_loss": 2.302585124206543, "test_acc": 0.1, "lyapunov": 2.4669584868204257, "grad_norm": 0.11057422059552115, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.447174185242324e-05, "time_sec": 124.23175573348999 }, { "epoch": 91, "train_loss": 4.270762037200928, "train_acc": 0.09742, "test_loss": 2.302585070037842, "test_acc": 0.1, "lyapunov": 2.4613021468872303, "grad_norm": 0.08094752788352252, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.9853157161528526e-05, "time_sec": 124.28751397132874 }, { "epoch": 92, "train_loss": 4.2731778295898435, "train_acc": 0.0967, "test_loss": 2.3025849838256836, "test_acc": 0.1, "lyapunov": 2.4628693057448054, "grad_norm": 0.08218150011851272, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568452e-05, "time_sec": 124.20022916793823 }, { "epoch": 93, "train_loss": 4.271317660827637, "train_acc": 0.09598, "test_loss": 2.302585059738159, "test_acc": 0.1, "lyapunov": 2.461685863602192, "grad_norm": 0.09351987385512874, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.204161903062634e-05, "time_sec": 124.32517552375793 }, { "epoch": 94, "train_loss": 4.271005298614502, "train_acc": 0.09678, "test_loss": 2.3025850238800047, "test_acc": 0.1, "lyapunov": 2.461446201100069, "grad_norm": 0.08051510852574385, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.85637463565564e-06, "time_sec": 124.25493431091309 }, { "epoch": 95, "train_loss": 4.272550579528809, "train_acc": 0.0975, "test_loss": 2.302585118865967, "test_acc": 0.1, "lyapunov": 2.462437502258574, "grad_norm": 0.08133134154526532, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.155829702431171e-06, "time_sec": 124.2907202243805 }, { "epoch": 96, "train_loss": 4.27599407836914, "train_acc": 0.09808, "test_loss": 2.302585164642334, "test_acc": 0.1, "lyapunov": 2.464714573472357, "grad_norm": 0.08129994421530186, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761118e-06, "time_sec": 124.2441520690918 }, { "epoch": 97, "train_loss": 4.27250137512207, "train_acc": 0.1, "test_loss": 2.3025850723266603, "test_acc": 0.1, "lyapunov": 2.462406137105449, "grad_norm": 0.08085760651650271, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.2190176984600023e-06, "time_sec": 124.25383496284485 }, { "epoch": 98, "train_loss": 4.272909243469238, "train_acc": 0.1, "test_loss": 2.30258510017395, "test_acc": 0.1, "lyapunov": 2.462700468195064, "grad_norm": 0.08430371763203995, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642206e-07, "time_sec": 124.2897834777832 }, { "epoch": 99, "train_loss": 4.27265819152832, "train_acc": 0.1, "test_loss": 2.302585132598877, "test_acc": 0.1, "lyapunov": 2.462563226290066, "grad_norm": 0.08009730488173318, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.467198171342e-07, "time_sec": 124.25932240486145 }, { "epoch": 100, "train_loss": 4.272679078521729, "train_acc": 0.1, "test_loss": 2.302585071182251, "test_acc": 0.1, "lyapunov": 2.462542835708774, "grad_norm": 0.08019670403901732, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 124.30135154724121 } ], "16": [ { "epoch": 1, "train_loss": 11.842812671203614, "train_acc": 0.14506, "test_loss": 2.34111376953125, "test_acc": 0.1088, "lyapunov": 5.111980842507404, "grad_norm": 6.803328171635302, "grad_max_sv": 5.664273583889008, "grad_min_sv": 2.45656453401466e-07, "grad_condition": 23556170.622745253, "lr": 0.0009997532801828658, "time_sec": 167.03577542304993 }, { "epoch": 2, "train_loss": 6.864391835327148, "train_acc": 0.1532, "test_loss": 2.3584522315979, "test_acc": 0.1126, "lyapunov": 3.7626322760911246, "grad_norm": 5.449127371208671, "grad_max_sv": 4.509619396924973, "grad_min_sv": 1.816841066926145e-07, "grad_condition": 25473679.781934455, "lr": 0.0009990133642141358, "time_sec": 167.0620617866516 }, { "epoch": 3, "train_loss": 6.632632642822266, "train_acc": 0.16122, "test_loss": 2.358525146102905, "test_acc": 0.1, "lyapunov": 3.702555048496217, "grad_norm": 3.996691628576675, "grad_max_sv": 3.4047091096639632, "grad_min_sv": 1.1248512699069124e-07, "grad_condition": 30963953.097301744, "lr": 0.00099778098230154, "time_sec": 167.01362991333008 }, { "epoch": 4, "train_loss": 6.508619455108643, "train_acc": 0.15906, "test_loss": 2.3301877449035646, "test_acc": 0.1, "lyapunov": 3.647035371312095, "grad_norm": 3.2655343849407332, "grad_max_sv": 3.0296140223741532, "grad_min_sv": 9.594998209294659e-08, "grad_condition": 32002571.000903092, "lr": 0.000996057350657239, "time_sec": 166.97752714157104 }, { "epoch": 5, "train_loss": 5.912459800109863, "train_acc": 0.13794, "test_loss": 2.3143163734436034, "test_acc": 0.1, "lyapunov": 3.364570482917454, "grad_norm": 2.882730301769821, "grad_max_sv": 2.836460363864899, "grad_min_sv": 8.620691849259288e-08, "grad_condition": 34084982.42197102, "lr": 0.0009938441702975688, "time_sec": 167.01780152320862 }, { "epoch": 6, "train_loss": 5.365990347290039, "train_acc": 0.12352, "test_loss": 2.307030549240112, "test_acc": 0.1, "lyapunov": 3.0800778951181473, "grad_norm": 2.6661229845796357, "grad_max_sv": 1.9664998756031884, "grad_min_sv": 4.7012965353151585e-08, "grad_condition": 714227055.0495954, "lr": 0.0009911436253643444, "time_sec": 166.95626974105835 }, { "epoch": 7, "train_loss": 5.098499784545899, "train_acc": 0.11974, "test_loss": 2.306401748275757, "test_acc": 0.1, "lyapunov": 2.9394846096672973, "grad_norm": 2.0425554711132987, "grad_max_sv": 1.3562358289975485, "grad_min_sv": 3.416944161021407e-08, "grad_condition": 430074872.43269414, "lr": 0.0009879583809693736, "time_sec": 167.02987694740295 }, { "epoch": 8, "train_loss": 4.836283032226563, "train_acc": 0.1193, "test_loss": 2.3056865058898928, "test_acc": 0.1, "lyapunov": 2.8134650903589584, "grad_norm": 1.9015682902174655, "grad_max_sv": 1.3965314358472825, "grad_min_sv": 2.998794566512128e-08, "grad_condition": 984527791.9432541, "lr": 0.0009842915805643154, "time_sec": 166.99379587173462 }, { "epoch": 9, "train_loss": 4.799866871795654, "train_acc": 0.11898, "test_loss": 2.3078849700927733, "test_acc": 0.1, "lyapunov": 2.7906805755537185, "grad_norm": 1.830247256824178, "grad_max_sv": 1.0446476072072983, "grad_min_sv": 2.2101311034875437e-08, "grad_condition": 6442199712.909399, "lr": 0.0009801468428384714, "time_sec": 167.04091095924377 }, { "epoch": 10, "train_loss": 4.8418486264038085, "train_acc": 0.1198, "test_loss": 2.306636996841431, "test_acc": 0.1, "lyapunov": 2.8099952402627073, "grad_norm": 2.137959073318514, "grad_max_sv": 0.7742668629978022, "grad_min_sv": 1.0732185378244782e-08, "grad_condition": 12825727231.027037, "lr": 0.0009755282581475767, "time_sec": 167.01724100112915 }, { "epoch": 11, "train_loss": 4.899544752502441, "train_acc": 0.11034, "test_loss": 2.303115463256836, "test_acc": 0.1, "lyapunov": 2.8371418083415314, "grad_norm": 1.6003418244695304, "grad_max_sv": 0.6158522295280715, "grad_min_sv": 3.796369944507449e-09, "grad_condition": 6480545635.210354, "lr": 0.0009704403844771127, "time_sec": 167.04382944107056 }, { "epoch": 12, "train_loss": 4.951635014648438, "train_acc": 0.10792, "test_loss": 2.3031677284240724, "test_acc": 0.1, "lyapunov": 2.866735147393268, "grad_norm": 2.666838044816494, "grad_max_sv": 0.5319730836898089, "grad_min_sv": 3.372458990007535e-10, "grad_condition": 39511669967.92405, "lr": 0.0009648882429441257, "time_sec": 166.9957308769226 }, { "epoch": 13, "train_loss": 6.152256243286133, "train_acc": 0.10692, "test_loss": 2.303246379852295, "test_acc": 0.1, "lyapunov": 3.4366153896312275, "grad_norm": 6.342546880123247, "grad_max_sv": 0.2403870326364995, "grad_min_sv": 2.6050612198124816e-10, "grad_condition": 34925794452.094666, "lr": 0.0009588773128419905, "time_sec": 167.01189947128296 }, { "epoch": 14, "train_loss": 6.052201841888428, "train_acc": 0.10886, "test_loss": 2.3029991958618163, "test_acc": 0.1, "lyapunov": 3.407372230154169, "grad_norm": 3.751884478526656, "grad_max_sv": 0.3085380573000293, "grad_min_sv": 1.7481779514657177e-10, "grad_condition": 69456467004.02864, "lr": 0.0009524135262330098, "time_sec": 166.99195837974548 }, { "epoch": 15, "train_loss": 6.174399379577637, "train_acc": 0.10784, "test_loss": 2.3030965816497804, "test_acc": 0.1, "lyapunov": 3.468341021891445, "grad_norm": 2.2149403643105514, "grad_max_sv": 0.2665206765946223, "grad_min_sv": 7.174466620587407e-11, "grad_condition": 25279718153.525455, "lr": 0.0009455032620941839, "time_sec": 167.02302026748657 }, { "epoch": 16, "train_loss": 5.8687522245788575, "train_acc": 0.10852, "test_loss": 2.302928673553467, "test_acc": 0.1, "lyapunov": 3.3205134075925784, "grad_norm": 2.1727798236859517, "grad_max_sv": 0.1694878804436172, "grad_min_sv": 5.284483110394732e-11, "grad_condition": 29825093550.928566, "lr": 0.0009381533400219318, "time_sec": 166.98851919174194 }, { "epoch": 17, "train_loss": 5.00506268585205, "train_acc": 0.10292, "test_loss": 2.3029050621032714, "test_acc": 0.1, "lyapunov": 2.8923883834458373, "grad_norm": 1.1450970364565718, "grad_max_sv": 0.12666865187754867, "grad_min_sv": 2.4102328364569327e-11, "grad_condition": 25147403549.501667, "lr": 0.0009303710135019719, "time_sec": 167.02036666870117 }, { "epoch": 18, "train_loss": 4.855449399719238, "train_acc": 0.104, "test_loss": 2.3028139762878417, "test_acc": 0.1, "lyapunov": 2.8120573298705507, "grad_norm": 0.7305556308720836, "grad_max_sv": 0.09714378891512751, "grad_min_sv": 8.150729035001414e-12, "grad_condition": 58264297783.12268, "lr": 0.0009221639627510076, "time_sec": 167.08689284324646 }, { "epoch": 19, "train_loss": 4.96336449584961, "train_acc": 0.1041, "test_loss": 2.3027950325012205, "test_acc": 0.1, "lyapunov": 2.8725837020922804, "grad_norm": 1.182474133176391, "grad_max_sv": 0.07083241189830006, "grad_min_sv": 7.22405413796021e-12, "grad_condition": 38280733847.458176, "lr": 0.000913540287137281, "time_sec": 167.00970244407654 }, { "epoch": 20, "train_loss": 4.743826732025147, "train_acc": 0.10382, "test_loss": 2.3027557773590086, "test_acc": 0.1, "lyapunov": 2.7483980515423942, "grad_norm": 0.6554501104680703, "grad_max_sv": 0.05732933725230396, "grad_min_sv": 5.653544739145854e-12, "grad_condition": 35503198727.48572, "lr": 0.0009045084971874739, "time_sec": 167.09380722045898 }, { "epoch": 21, "train_loss": 4.678205784606933, "train_acc": 0.10294, "test_loss": 3.7050921539306643, "test_acc": 0.1, "lyapunov": 2.712228787219738, "grad_norm": 0.9024618566776086, "grad_max_sv": 0.03976228955434635, "grad_min_sv": 5.291108131013551e-11, "grad_condition": 16349739158.901342, "lr": 0.0008950775061878452, "time_sec": 167.0224826335907 }, { "epoch": 22, "train_loss": 4.63441824432373, "train_acc": 0.09868, "test_loss": 2.678515822601318, "test_acc": 0.1, "lyapunov": 2.6848394797586113, "grad_norm": 0.9464113383195869, "grad_max_sv": 0.03219134085811674, "grad_min_sv": 3.575371656772674e-11, "grad_condition": 22552839587.69338, "lr": 0.0008852566213878947, "time_sec": 167.0608777999878 }, { "epoch": 23, "train_loss": 4.728675323486328, "train_acc": 0.09932, "test_loss": 3.68248123626709, "test_acc": 0.1, "lyapunov": 2.732565569450788, "grad_norm": 1.1845032429393016, "grad_max_sv": 0.009998515527695418, "grad_min_sv": 1.095997224005267e-20, "grad_condition": 9998514820.705112, "lr": 0.0008750555348152298, "time_sec": 167.0682075023651 }, { "epoch": 24, "train_loss": 4.65850959197998, "train_acc": 0.09912, "test_loss": 3.6423350326538086, "test_acc": 0.1, "lyapunov": 2.6980338791752105, "grad_norm": 1.5417542431510867, "grad_max_sv": 0.008353105513378978, "grad_min_sv": 1.9907194983962853e-18, "grad_condition": 8352993676.098096, "lr": 0.0008644843137107057, "time_sec": 167.08017802238464 }, { "epoch": 25, "train_loss": 4.584089448547363, "train_acc": 0.09784, "test_loss": 2.3033696189880373, "test_acc": 0.1, "lyapunov": 2.653346909891309, "grad_norm": 0.9625814425500707, "grad_max_sv": 0.0027962074615061282, "grad_min_sv": 1.8178542286825737e-15, "grad_condition": 2726213455.6624613, "lr": 0.0008535533905932737, "time_sec": 167.05963444709778 }, { "epoch": 26, "train_loss": 4.562473741149902, "train_acc": 0.0972, "test_loss": 2.5531665412902833, "test_acc": 0.1, "lyapunov": 2.6440261763989774, "grad_norm": 1.0966601277478685, "grad_max_sv": 0.0009299686178565025, "grad_min_sv": 7.864982908802376e-35, "grad_condition": 929968617.8565025, "lr": 0.0008422735529643444, "time_sec": 167.0820574760437 }, { "epoch": 27, "train_loss": 4.557928927612305, "train_acc": 0.10072, "test_loss": 2.3032149608612063, "test_acc": 0.1, "lyapunov": 2.640467453490743, "grad_norm": 1.5990578945087282, "grad_max_sv": 0.001147926412522793, "grad_min_sv": 2.0663573730241894e-15, "grad_condition": 1060288974.8907245, "lr": 0.0008306559326618259, "time_sec": 167.0413818359375 }, { "epoch": 28, "train_loss": 4.533458753051757, "train_acc": 0.09686, "test_loss": 2.303218946838379, "test_acc": 0.1, "lyapunov": 2.6252909279845253, "grad_norm": 0.6753306901464893, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0008187119948743449, "time_sec": 167.0830535888672 }, { "epoch": 29, "train_loss": 4.496531313171387, "train_acc": 0.09852, "test_loss": 2.3032687267303467, "test_acc": 0.1, "lyapunov": 2.6040675938891633, "grad_norm": 0.18386399798172356, "grad_max_sv": 0.00110331317409873, "grad_min_sv": 7.969612926285099e-35, "grad_condition": 1103313174.09873, "lr": 0.0008064535268264883, "time_sec": 167.04623770713806 }, { "epoch": 30, "train_loss": 4.504303005065918, "train_acc": 0.0976, "test_loss": 2.303500841522217, "test_acc": 0.1, "lyapunov": 2.6081804003556974, "grad_norm": 0.15236154258308318, "grad_max_sv": 0.0028056097216904163, "grad_min_sv": 0.0, "grad_condition": 2805609721.6904163, "lr": 0.0007938926261462367, "time_sec": 167.02854776382446 }, { "epoch": 31, "train_loss": 4.50321345703125, "train_acc": 0.09666, "test_loss": 2.3035490158081053, "test_acc": 0.1, "lyapunov": 2.607592426602493, "grad_norm": 0.10039091720588617, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007810416889260654, "time_sec": 167.07999300956726 }, { "epoch": 32, "train_loss": 4.501663753662109, "train_acc": 0.09806, "test_loss": 2.3034838943481444, "test_acc": 0.1, "lyapunov": 2.607143198437703, "grad_norm": 0.1048906506411198, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007679133974894983, "time_sec": 167.00407528877258 }, { "epoch": 33, "train_loss": 4.5019655114746095, "train_acc": 0.09498, "test_loss": 2.30348473739624, "test_acc": 0.1, "lyapunov": 2.607365154549289, "grad_norm": 0.09466991605122166, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007545207078751857, "time_sec": 167.04430413246155 }, { "epoch": 34, "train_loss": 4.4972885162353515, "train_acc": 0.09806, "test_loss": 2.3035587966918945, "test_acc": 0.1, "lyapunov": 2.6045894854513887, "grad_norm": 0.094802640603578, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007408768370508577, "time_sec": 167.01064467430115 }, { "epoch": 35, "train_loss": 4.496900313110352, "train_acc": 0.09916, "test_loss": 2.3035878532409666, "test_acc": 0.1, "lyapunov": 2.6043496991667294, "grad_norm": 0.08505627865784493, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007269952498697734, "time_sec": 167.04931592941284 }, { "epoch": 36, "train_loss": 4.498045174407959, "train_acc": 0.09896, "test_loss": 2.303556993865967, "test_acc": 0.1, "lyapunov": 2.6051284626621722, "grad_norm": 0.08865673943824036, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0007128896457825364, "time_sec": 166.99707579612732 }, { "epoch": 37, "train_loss": 4.494941578521728, "train_acc": 0.09764, "test_loss": 2.3035079292297365, "test_acc": 0.1, "lyapunov": 2.6031092463247, "grad_norm": 0.09732931123675816, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006985739453173903, "time_sec": 167.02038192749023 }, { "epoch": 38, "train_loss": 4.496269936523437, "train_acc": 0.09764, "test_loss": 2.3035408573150633, "test_acc": 0.1, "lyapunov": 2.604000445217123, "grad_norm": 0.08852073271727623, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006840622763423391, "time_sec": 167.02108144760132 }, { "epoch": 39, "train_loss": 4.493522086791992, "train_acc": 0.09734, "test_loss": 2.303493659210205, "test_acc": 0.1, "lyapunov": 2.6023181265272446, "grad_norm": 0.08748337786673831, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006693689601226458, "time_sec": 167.05211973190308 }, { "epoch": 40, "train_loss": 4.498229814758301, "train_acc": 0.09844, "test_loss": 2.3034747520446777, "test_acc": 0.1, "lyapunov": 2.6050954608966017, "grad_norm": 0.10483613599174303, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006545084971874737, "time_sec": 167.01571893692017 }, { "epoch": 41, "train_loss": 4.498432325286865, "train_acc": 0.09692, "test_loss": 2.3034770004272462, "test_acc": 0.1, "lyapunov": 2.6052994520767876, "grad_norm": 0.09650951998583779, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006394955530196147, "time_sec": 167.06526255607605 }, { "epoch": 42, "train_loss": 4.496120017395019, "train_acc": 0.09806, "test_loss": 2.303461635971069, "test_acc": 0.1, "lyapunov": 2.6038818706941727, "grad_norm": 0.08793824539769711, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006243449435824273, "time_sec": 167.0240659713745 }, { "epoch": 43, "train_loss": 4.50342136932373, "train_acc": 0.0968, "test_loss": 3.123962462234497, "test_acc": 0.1, "lyapunov": 2.6082677432643178, "grad_norm": 0.10763460634241757, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0006090716206982714, "time_sec": 167.04283785820007 }, { "epoch": 44, "train_loss": 4.497545390930176, "train_acc": 0.0993, "test_loss": 2.30349365196228, "test_acc": 0.1, "lyapunov": 2.6048193215714086, "grad_norm": 0.0914051250208073, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005936906572928625, "time_sec": 167.00522899627686 }, { "epoch": 45, "train_loss": 4.497059263458252, "train_acc": 0.0983, "test_loss": 2.303560007476807, "test_acc": 0.1, "lyapunov": 2.604434971919145, "grad_norm": 0.09665268401606698, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005782172325201156, "time_sec": 166.98798084259033 }, { "epoch": 46, "train_loss": 4.496945586547851, "train_acc": 0.09766, "test_loss": 2.303540351486206, "test_acc": 0.1, "lyapunov": 2.6044252626121502, "grad_norm": 0.08182959271154387, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005626666167821523, "time_sec": 167.05580401420593 }, { "epoch": 47, "train_loss": 4.5494916119384765, "train_acc": 0.0975, "test_loss": 2.3035491088867186, "test_acc": 0.1, "lyapunov": 2.6250632187289655, "grad_norm": 0.16118104591565238, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005470541566592572, "time_sec": 167.02027297019958 }, { "epoch": 48, "train_loss": 4.527786728515625, "train_acc": 0.09808, "test_loss": 2.303548764038086, "test_acc": 0.1, "lyapunov": 2.6161820851933317, "grad_norm": 0.1522047852768872, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005313952597646569, "time_sec": 167.08899068832397 }, { "epoch": 49, "train_loss": 4.49808083328247, "train_acc": 0.0977, "test_loss": 2.3034967575073244, "test_acc": 0.1, "lyapunov": 2.6051423244769008, "grad_norm": 0.09227111356756569, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005157053795390643, "time_sec": 167.04247641563416 }, { "epoch": 50, "train_loss": 4.506656402282715, "train_acc": 0.09788, "test_loss": 2.3035506187438965, "test_acc": 0.1, "lyapunov": 2.6092079515042514, "grad_norm": 0.0989012749171036, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0005000000000000002, "time_sec": 167.06817507743835 }, { "epoch": 51, "train_loss": 4.518285944213867, "train_acc": 0.09874, "test_loss": 2.303562999343872, "test_acc": 0.1, "lyapunov": 2.6132117506793087, "grad_norm": 0.14702247022618603, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00048429462046093607, "time_sec": 167.00237131118774 }, { "epoch": 52, "train_loss": 4.510767389526367, "train_acc": 0.0985, "test_loss": 2.303548727416992, "test_acc": 0.1, "lyapunov": 2.611425805884554, "grad_norm": 0.12770796891288963, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004686047402353435, "time_sec": 167.03129529953003 }, { "epoch": 53, "train_loss": 4.524528532714844, "train_acc": 0.09758, "test_loss": 2.3034987804412843, "test_acc": 0.1, "lyapunov": 2.6168906950889648, "grad_norm": 0.16221922023587404, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000452945843340743, "time_sec": 167.0302333831787 }, { "epoch": 54, "train_loss": 4.514558558197021, "train_acc": 0.09898, "test_loss": 2.3035224128723146, "test_acc": 0.1, "lyapunov": 2.6116219816915214, "grad_norm": 0.11874932612009399, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00043733338321784806, "time_sec": 167.03262758255005 }, { "epoch": 55, "train_loss": 4.500117692108154, "train_acc": 0.0969, "test_loss": 2.303501333999634, "test_acc": 0.1, "lyapunov": 2.6062854854652033, "grad_norm": 0.10674428233360923, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0004217827674798847, "time_sec": 166.98121881484985 }, { "epoch": 56, "train_loss": 4.51960044921875, "train_acc": 0.09628, "test_loss": 2.30349303855896, "test_acc": 0.1, "lyapunov": 2.616247482616883, "grad_norm": 0.14277503967283073, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00040630934270713783, "time_sec": 167.03360319137573 }, { "epoch": 57, "train_loss": 4.538308909759522, "train_acc": 0.0975, "test_loss": 2.303505461502075, "test_acc": 0.1, "lyapunov": 2.624653117431094, "grad_norm": 0.17354441507562746, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.000390928379301729, "time_sec": 167.00332236289978 }, { "epoch": 58, "train_loss": 4.5402243867492675, "train_acc": 0.09768, "test_loss": 2.3034944499969483, "test_acc": 0.1, "lyapunov": 2.6235652969926213, "grad_norm": 0.18590049129605235, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003756550564175727, "time_sec": 166.94713830947876 }, { "epoch": 59, "train_loss": 4.497288510131836, "train_acc": 0.09656, "test_loss": 2.303503835296631, "test_acc": 0.1, "lyapunov": 2.60465430237753, "grad_norm": 0.08925667815477244, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00036050444698038553, "time_sec": 166.97111773490906 }, { "epoch": 60, "train_loss": 4.520837378082275, "train_acc": 0.09746, "test_loss": 2.3035025501251223, "test_acc": 0.1, "lyapunov": 2.6177086183787, "grad_norm": 0.14390327015753798, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00034549150281252655, "time_sec": 166.95851969718933 }, { "epoch": 61, "train_loss": 4.503204351348877, "train_acc": 0.09616, "test_loss": 2.3035063259124757, "test_acc": 0.1, "lyapunov": 2.6079881752238556, "grad_norm": 0.11060100204296372, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003306310398773544, "time_sec": 167.04684805870056 }, { "epoch": 62, "train_loss": 4.529549421844482, "train_acc": 0.0966, "test_loss": 2.303504373550415, "test_acc": 0.1, "lyapunov": 2.620155497889994, "grad_norm": 0.25260476730678916, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00031593772365766127, "time_sec": 166.9670557975769 }, { "epoch": 63, "train_loss": 4.504642747955322, "train_acc": 0.09824, "test_loss": 2.302585437011719, "test_acc": 0.1, "lyapunov": 2.6090027182303426, "grad_norm": 0.14482467729355822, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0003014260546826097, "time_sec": 167.07136464118958 }, { "epoch": 64, "train_loss": 4.5207818331909175, "train_acc": 0.09658, "test_loss": 2.302585619735718, "test_acc": 0.1, "lyapunov": 2.6153993130949758, "grad_norm": 0.14340140289375716, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002871103542174637, "time_sec": 167.0296709537506 }, { "epoch": 65, "train_loss": 4.514579942321777, "train_acc": 0.09692, "test_loss": 2.302585908126831, "test_acc": 0.1, "lyapunov": 2.612202508370285, "grad_norm": 0.11615853114383813, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002730047501302267, "time_sec": 167.06110525131226 }, { "epoch": 66, "train_loss": 4.539550397949219, "train_acc": 0.09668, "test_loss": 2.3025857189178467, "test_acc": 0.1, "lyapunov": 2.6239442215551194, "grad_norm": 0.24377422344866448, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00025912316294914234, "time_sec": 166.96833562850952 }, { "epoch": 67, "train_loss": 4.520765433959961, "train_acc": 0.09678, "test_loss": 2.3025856506347657, "test_acc": 0.1, "lyapunov": 2.6144380130426352, "grad_norm": 0.17143215114502838, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0002454792921248144, "time_sec": 167.06375288963318 }, { "epoch": 68, "train_loss": 4.501224665222168, "train_acc": 0.09848, "test_loss": 2.3025851860046385, "test_acc": 0.1, "lyapunov": 2.606965447935607, "grad_norm": 0.22167025880962787, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00023208660251050164, "time_sec": 166.97689723968506 }, { "epoch": 69, "train_loss": 4.516330520629883, "train_acc": 0.09716, "test_loss": 2.3025853271484373, "test_acc": 0.1, "lyapunov": 2.6127135893877815, "grad_norm": 0.1178159153430125, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00021895831107393473, "time_sec": 167.03971099853516 }, { "epoch": 70, "train_loss": 4.518335289764404, "train_acc": 0.09628, "test_loss": 2.3025851623535156, "test_acc": 0.1, "lyapunov": 2.614670734576252, "grad_norm": 0.19910468609269888, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00020610737385376356, "time_sec": 167.01087379455566 }, { "epoch": 71, "train_loss": 4.506198991699219, "train_acc": 0.0961, "test_loss": 2.3025853843688964, "test_acc": 0.1, "lyapunov": 2.6081283720557953, "grad_norm": 0.09098734124729495, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00019354647317351177, "time_sec": 167.0194799900055 }, { "epoch": 72, "train_loss": 4.49574895111084, "train_acc": 0.09856, "test_loss": 2.3025853591918946, "test_acc": 0.1, "lyapunov": 2.603733692632612, "grad_norm": 0.08176729544229487, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001812880051256552, "time_sec": 167.05306220054626 }, { "epoch": 73, "train_loss": 4.497463835449219, "train_acc": 0.09886, "test_loss": 2.3025851680755616, "test_acc": 0.1, "lyapunov": 2.604736436053615, "grad_norm": 0.082986396115534, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00016934406733817422, "time_sec": 166.98811650276184 }, { "epoch": 74, "train_loss": 4.4971358953857425, "train_acc": 0.09738, "test_loss": 2.302585493850708, "test_acc": 0.1, "lyapunov": 2.6045719363805278, "grad_norm": 0.08151196821637299, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001577264470356557, "time_sec": 167.01667833328247 }, { "epoch": 75, "train_loss": 4.50925322631836, "train_acc": 0.0967, "test_loss": 2.302585232925415, "test_acc": 0.1, "lyapunov": 2.6094926751178242, "grad_norm": 0.21190207725464844, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00014644660940672634, "time_sec": 166.97911548614502 }, { "epoch": 76, "train_loss": 4.496390933227539, "train_acc": 0.0967, "test_loss": 2.302585297393799, "test_acc": 0.1, "lyapunov": 2.6040706823549002, "grad_norm": 0.08435313407684436, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0001355156862892944, "time_sec": 167.0480306148529 }, { "epoch": 77, "train_loss": 4.496095029296875, "train_acc": 0.0965, "test_loss": 2.3025853218078614, "test_acc": 0.1, "lyapunov": 2.6039189987475306, "grad_norm": 0.1373346720572696, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00012494446518477025, "time_sec": 166.97820734977722 }, { "epoch": 78, "train_loss": 4.499068414611816, "train_acc": 0.096, "test_loss": 2.3025852237701416, "test_acc": 0.1, "lyapunov": 2.605743714305751, "grad_norm": 0.10939849657650327, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00011474337861210548, "time_sec": 166.98934531211853 }, { "epoch": 79, "train_loss": 4.4964453392028805, "train_acc": 0.09828, "test_loss": 2.302585151672363, "test_acc": 0.1, "lyapunov": 2.604178778655694, "grad_norm": 0.08774538011729731, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.00010492249381215483, "time_sec": 167.02672863006592 }, { "epoch": 80, "train_loss": 4.499743932647705, "train_acc": 0.09862, "test_loss": 2.302585228347778, "test_acc": 0.1, "lyapunov": 2.606093951808217, "grad_norm": 0.2420142867175763, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.549150281252637e-05, "time_sec": 167.10957646369934 }, { "epoch": 81, "train_loss": 4.502734872436523, "train_acc": 0.09578, "test_loss": 2.302585201263428, "test_acc": 0.1, "lyapunov": 2.6076697900776975, "grad_norm": 0.13251791023485532, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.645971286271918e-05, "time_sec": 166.9769287109375 }, { "epoch": 82, "train_loss": 4.494626608581543, "train_acc": 0.09758, "test_loss": 2.3025851295471194, "test_acc": 0.1, "lyapunov": 2.6029957383489974, "grad_norm": 0.08170465976084904, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 7.78360372489926e-05, "time_sec": 167.00449562072754 }, { "epoch": 83, "train_loss": 4.495700520019532, "train_acc": 0.09822, "test_loss": 2.3025853286743163, "test_acc": 0.1, "lyapunov": 2.6036597090913816, "grad_norm": 0.1210411913955966, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.962898649802815e-05, "time_sec": 166.96435856819153 }, { "epoch": 84, "train_loss": 4.49369448425293, "train_acc": 0.09848, "test_loss": 2.3025850296020507, "test_acc": 0.1, "lyapunov": 2.6024485061235745, "grad_norm": 0.1169116031555102, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.184665997806824e-05, "time_sec": 166.9589819908142 }, { "epoch": 85, "train_loss": 4.493269319915772, "train_acc": 0.09772, "test_loss": 2.3025851333618164, "test_acc": 0.1, "lyapunov": 2.60219204151417, "grad_norm": 0.08026909865070977, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 5.449673790581613e-05, "time_sec": 167.0204620361328 }, { "epoch": 86, "train_loss": 4.4974218487548825, "train_acc": 0.09802, "test_loss": 2.302585245895386, "test_acc": 0.1, "lyapunov": 2.604730949987231, "grad_norm": 0.08689607041758553, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.758647376699034e-05, "time_sec": 166.964524269104 }, { "epoch": 87, "train_loss": 4.495326493072509, "train_acc": 0.0982, "test_loss": 2.3025850296020507, "test_acc": 0.1, "lyapunov": 2.603457776481843, "grad_norm": 0.09583928752803095, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 4.112268715800956e-05, "time_sec": 167.03006196022034 }, { "epoch": 88, "train_loss": 4.494311538085937, "train_acc": 0.09762, "test_loss": 2.3025852684020998, "test_acc": 0.1, "lyapunov": 2.602831931980065, "grad_norm": 0.08201988600112256, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.511175705587434e-05, "time_sec": 166.98635745048523 }, { "epoch": 89, "train_loss": 4.497406745605469, "train_acc": 0.09872, "test_loss": 2.302585092926025, "test_acc": 0.1, "lyapunov": 2.6046652647540394, "grad_norm": 0.11011286998675665, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.9559615522887284e-05, "time_sec": 167.0066351890564 }, { "epoch": 90, "train_loss": 4.495393841552734, "train_acc": 0.0955, "test_loss": 2.3025851219177245, "test_acc": 0.1, "lyapunov": 2.603500037546963, "grad_norm": 0.08854801622590937, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.447174185242324e-05, "time_sec": 166.98117446899414 }, { "epoch": 91, "train_loss": 4.496799105529785, "train_acc": 0.09778, "test_loss": 2.3025851669311526, "test_acc": 0.1, "lyapunov": 2.6043886601772455, "grad_norm": 0.08317548392372451, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.9853157161528526e-05, "time_sec": 167.05606770515442 }, { "epoch": 92, "train_loss": 4.501456503753662, "train_acc": 0.09732, "test_loss": 2.302585040283203, "test_acc": 0.1, "lyapunov": 2.6069688260402826, "grad_norm": 0.09601255447418665, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.570841943568452e-05, "time_sec": 166.95690035820007 }, { "epoch": 93, "train_loss": 4.4988940646362305, "train_acc": 0.09822, "test_loss": 2.302585070037842, "test_acc": 0.1, "lyapunov": 2.6056473828337685, "grad_norm": 0.11345521860163729, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 1.204161903062634e-05, "time_sec": 167.01007437705994 }, { "epoch": 94, "train_loss": 4.500971371002198, "train_acc": 0.09656, "test_loss": 2.3025852294921876, "test_acc": 0.1, "lyapunov": 2.606662953296281, "grad_norm": 0.10989679012817173, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 8.85637463565564e-06, "time_sec": 166.93790555000305 }, { "epoch": 95, "train_loss": 4.496245345458984, "train_acc": 0.09824, "test_loss": 2.3025850425720216, "test_acc": 0.1, "lyapunov": 2.6040014677950185, "grad_norm": 0.13386825999790872, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 6.155829702431171e-06, "time_sec": 166.99875664710999 }, { "epoch": 96, "train_loss": 4.4964897052001955, "train_acc": 0.09874, "test_loss": 2.302585097122192, "test_acc": 0.1, "lyapunov": 2.6042159268313356, "grad_norm": 0.09409731933962433, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 3.942649342761118e-06, "time_sec": 166.96930813789368 }, { "epoch": 97, "train_loss": 4.499828433837891, "train_acc": 0.1, "test_loss": 2.3025849605560302, "test_acc": 0.1, "lyapunov": 2.6062122037648545, "grad_norm": 0.16887612557601597, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.2190176984600023e-06, "time_sec": 166.9714593887329 }, { "epoch": 98, "train_loss": 4.496156484069824, "train_acc": 0.1, "test_loss": 2.302585231781006, "test_acc": 0.1, "lyapunov": 2.603946977259253, "grad_norm": 0.08139214809285189, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 9.866357858642206e-07, "time_sec": 167.0184144973755 }, { "epoch": 99, "train_loss": 4.497607230377198, "train_acc": 0.1, "test_loss": 2.302585125350952, "test_acc": 0.1, "lyapunov": 2.6048427774473226, "grad_norm": 0.08064979301518677, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 2.467198171342e-07, "time_sec": 166.95221614837646 }, { "epoch": 100, "train_loss": 4.493742803955078, "train_acc": 0.1, "test_loss": 2.302585009765625, "test_acc": 0.1, "lyapunov": 2.602488872035385, "grad_norm": 0.08215126330977654, "grad_max_sv": 0.0, "grad_min_sv": 0.0, "grad_condition": 0.0, "lr": 0.0, "time_sec": 166.99254083633423 } ] } }