diff options
Diffstat (limited to 'runs/depth_scaling/cifar10_20251229-160504')
| -rw-r--r-- | runs/depth_scaling/cifar10_20251229-160504/config.json | 20 | ||||
| -rw-r--r-- | runs/depth_scaling/cifar10_20251229-160504/results.json | 11222 |
2 files changed, 11242 insertions, 0 deletions
diff --git a/runs/depth_scaling/cifar10_20251229-160504/config.json b/runs/depth_scaling/cifar10_20251229-160504/config.json new file mode 100644 index 0000000..c87b8a8 --- /dev/null +++ b/runs/depth_scaling/cifar10_20251229-160504/config.json @@ -0,0 +1,20 @@ +{ + "dataset": "cifar10", + "depths": [ + 4, + 8, + 12, + 16 + ], + "T": 4, + "epochs": 100, + "batch_size": 128, + "lr": 0.001, + "lambda_reg": 0.3, + "lambda_target": -0.1, + "data_dir": "./data", + "out_dir": "runs/depth_scaling", + "device": "cuda", + "seed": 42, + "no_progress": false +}
\ No newline at end of file diff --git a/runs/depth_scaling/cifar10_20251229-160504/results.json b/runs/depth_scaling/cifar10_20251229-160504/results.json new file mode 100644 index 0000000..2e9b6eb --- /dev/null +++ b/runs/depth_scaling/cifar10_20251229-160504/results.json @@ -0,0 +1,11222 @@ +{ + "vanilla": { + "4": [ + { + "epoch": 1, + "train_loss": 1.87523081199646, + "train_acc": 0.3904, + "test_loss": 1.3005033981323242, + "test_acc": 0.538, + "lyapunov": null, + "grad_norm": 7.167065437345997, + "grad_max_sv": 6.2841449797153475, + "grad_min_sv": 2.820393511626662e-07, + "grad_condition": 22637653.325481158, + "lr": 0.0009997532801828658, + "time_sec": 17.83638072013855 + }, + { + "epoch": 2, + "train_loss": 1.330778917236328, + "train_acc": 0.53242, + "test_loss": 1.3051589399337769, + "test_acc": 0.5299, + "lyapunov": null, + "grad_norm": 5.684293544168513, + "grad_max_sv": 4.961454087495804, + "grad_min_sv": 2.2011614504435783e-07, + "grad_condition": 23000049.3006949, + "lr": 0.0009990133642141358, + "time_sec": 15.308318853378296 + }, + { + "epoch": 3, + "train_loss": 1.1224762370300292, + "train_acc": 0.59994, + "test_loss": 1.1229688482284546, + "test_acc": 0.6085, + "lyapunov": null, + "grad_norm": 4.767601837094887, + "grad_max_sv": 4.13027862906456, + "grad_min_sv": 1.9442289698190506e-07, + "grad_condition": 21218061.296424918, + "lr": 0.00099778098230154, + "time_sec": 15.306547403335571 + }, + { + "epoch": 4, + "train_loss": 0.9929985418510437, + "train_acc": 0.6506, + "test_loss": 1.0345463452339172, + "test_acc": 0.6476, + "lyapunov": null, + "grad_norm": 4.154534311876162, + "grad_max_sv": 3.4217750519514083, + "grad_min_sv": 1.738904227721605e-07, + "grad_condition": 19945043.08817544, + "lr": 0.000996057350657239, + "time_sec": 15.302969694137573 + }, + { + "epoch": 5, + "train_loss": 0.8976026094818115, + "train_acc": 0.68438, + "test_loss": 0.8756585054397583, + "test_acc": 0.6914, + "lyapunov": null, + "grad_norm": 3.6333960771107905, + "grad_max_sv": 2.9354925364255906, + "grad_min_sv": 1.6106242668456615e-07, + "grad_condition": 18489046.232839655, + "lr": 0.0009938441702975688, + "time_sec": 15.317728281021118 + }, + { + "epoch": 6, + "train_loss": 0.8413557116317749, + "train_acc": 0.70288, + "test_loss": 1.0890468210220337, + "test_acc": 0.6361, + "lyapunov": null, + "grad_norm": 3.416502916483722, + "grad_max_sv": 2.8772784233093263, + "grad_min_sv": 1.524946609876565e-07, + "grad_condition": 19017545.32666207, + "lr": 0.0009911436253643444, + "time_sec": 15.30530047416687 + }, + { + "epoch": 7, + "train_loss": 0.780380486125946, + "train_acc": 0.72624, + "test_loss": 0.7749503490447998, + "test_acc": 0.7328, + "lyapunov": null, + "grad_norm": 3.046069709126096, + "grad_max_sv": 2.3629971712827684, + "grad_min_sv": 1.380081055657456e-07, + "grad_condition": 17149009.230771504, + "lr": 0.0009879583809693736, + "time_sec": 15.307675838470459 + }, + { + "epoch": 8, + "train_loss": 0.7390781346511841, + "train_acc": 0.7414, + "test_loss": 0.7958005157470703, + "test_acc": 0.7277, + "lyapunov": null, + "grad_norm": 2.7435338958916513, + "grad_max_sv": 2.05181370973587, + "grad_min_sv": 1.2932217341443675e-07, + "grad_condition": 16036517.768211821, + "lr": 0.0009842915805643154, + "time_sec": 15.307319641113281 + }, + { + "epoch": 9, + "train_loss": 0.7052495925521851, + "train_acc": 0.75274, + "test_loss": 1.0447007677078246, + "test_acc": 0.6745, + "lyapunov": null, + "grad_norm": 2.552586529905072, + "grad_max_sv": 2.0337040573358536, + "grad_min_sv": 1.2101497901539914e-07, + "grad_condition": 16963155.872520845, + "lr": 0.0009801468428384714, + "time_sec": 15.290063619613647 + }, + { + "epoch": 10, + "train_loss": 0.6694383864402771, + "train_acc": 0.76588, + "test_loss": 0.9462176066398621, + "test_acc": 0.6842, + "lyapunov": null, + "grad_norm": 2.3520331395340692, + "grad_max_sv": 1.7684333354234696, + "grad_min_sv": 1.1190378259584577e-07, + "grad_condition": 15955738.307438832, + "lr": 0.0009755282581475767, + "time_sec": 15.305615901947021 + }, + { + "epoch": 11, + "train_loss": 0.6340117832756043, + "train_acc": 0.77878, + "test_loss": 0.7613432981491088, + "test_acc": 0.7377, + "lyapunov": null, + "grad_norm": 2.164571307713442, + "grad_max_sv": 1.7057331085205079, + "grad_min_sv": 1.0792852087604387e-07, + "grad_condition": 15783530.208328355, + "lr": 0.0009704403844771127, + "time_sec": 15.29656457901001 + }, + { + "epoch": 12, + "train_loss": 0.6060477030181884, + "train_acc": 0.78728, + "test_loss": 0.7971237164974213, + "test_acc": 0.729, + "lyapunov": null, + "grad_norm": 1.993298876301324, + "grad_max_sv": 1.514353270828724, + "grad_min_sv": 1.009763655801521e-07, + "grad_condition": 14944755.026175302, + "lr": 0.0009648882429441257, + "time_sec": 15.30236530303955 + }, + { + "epoch": 13, + "train_loss": 0.5870892490005493, + "train_acc": 0.79524, + "test_loss": 0.8448094959259034, + "test_acc": 0.7127, + "lyapunov": null, + "grad_norm": 1.8629217723116693, + "grad_max_sv": 1.3949483826756477, + "grad_min_sv": 9.635141964281502e-08, + "grad_condition": 14581029.38399595, + "lr": 0.0009588773128419905, + "time_sec": 15.315025806427002 + }, + { + "epoch": 14, + "train_loss": 0.5539195073699951, + "train_acc": 0.80644, + "test_loss": 0.7561563467979431, + "test_acc": 0.7394, + "lyapunov": null, + "grad_norm": 1.6986166991338625, + "grad_max_sv": 1.245494757592678, + "grad_min_sv": 8.711651755533012e-08, + "grad_condition": 14401234.8235637, + "lr": 0.0009524135262330098, + "time_sec": 15.308890104293823 + }, + { + "epoch": 15, + "train_loss": 0.5333379591941834, + "train_acc": 0.8143, + "test_loss": 0.6968033623695373, + "test_acc": 0.7569, + "lyapunov": null, + "grad_norm": 1.5656089916965232, + "grad_max_sv": 1.1909169003367424, + "grad_min_sv": 8.488269482853639e-08, + "grad_condition": 14106351.27298153, + "lr": 0.0009455032620941839, + "time_sec": 15.311123609542847 + }, + { + "epoch": 16, + "train_loss": 0.5167095581436157, + "train_acc": 0.82042, + "test_loss": 0.849514400100708, + "test_acc": 0.7133, + "lyapunov": null, + "grad_norm": 1.496171987836298, + "grad_max_sv": 1.0258999049663544, + "grad_min_sv": 8.006283778172473e-08, + "grad_condition": 12841377.110361751, + "lr": 0.0009381533400219318, + "time_sec": 15.310609817504883 + }, + { + "epoch": 17, + "train_loss": 0.49894729826927187, + "train_acc": 0.8262, + "test_loss": 0.7154086270809173, + "test_acc": 0.7552, + "lyapunov": null, + "grad_norm": 1.3884031919720434, + "grad_max_sv": 0.9819801226258278, + "grad_min_sv": 7.953692726658801e-08, + "grad_condition": 12477520.833613167, + "lr": 0.0009303710135019719, + "time_sec": 15.301868200302124 + }, + { + "epoch": 18, + "train_loss": 0.4833205630302429, + "train_acc": 0.83074, + "test_loss": 0.8212436129570008, + "test_acc": 0.7372, + "lyapunov": null, + "grad_norm": 1.322943153444315, + "grad_max_sv": 0.9954353883862496, + "grad_min_sv": 7.706266931251094e-08, + "grad_condition": 12928888.561653998, + "lr": 0.0009221639627510076, + "time_sec": 15.304028987884521 + }, + { + "epoch": 19, + "train_loss": 0.46378349807739255, + "train_acc": 0.8371, + "test_loss": 0.6447551451683045, + "test_acc": 0.789, + "lyapunov": null, + "grad_norm": 1.231933968586028, + "grad_max_sv": 0.7683330580592156, + "grad_min_sv": 6.892571695615856e-08, + "grad_condition": 11194075.895721275, + "lr": 0.000913540287137281, + "time_sec": 15.304960489273071 + }, + { + "epoch": 20, + "train_loss": 0.44474551233291626, + "train_acc": 0.84504, + "test_loss": 0.6990101715087891, + "test_acc": 0.7693, + "lyapunov": null, + "grad_norm": 1.1785280692983833, + "grad_max_sv": 0.8134334728121757, + "grad_min_sv": 6.934622298615523e-08, + "grad_condition": 11771827.214910198, + "lr": 0.0009045084971874739, + "time_sec": 15.309978008270264 + }, + { + "epoch": 21, + "train_loss": 0.4328971823978424, + "train_acc": 0.8493, + "test_loss": 0.605803295135498, + "test_acc": 0.7971, + "lyapunov": null, + "grad_norm": 1.1010893792673297, + "grad_max_sv": 0.74788568764925, + "grad_min_sv": 6.635127869358826e-08, + "grad_condition": 11337903.371089932, + "lr": 0.0008950775061878452, + "time_sec": 15.304766416549683 + }, + { + "epoch": 22, + "train_loss": 0.42013943620681765, + "train_acc": 0.85398, + "test_loss": 0.6351155483245849, + "test_acc": 0.7873, + "lyapunov": null, + "grad_norm": 1.050275059187082, + "grad_max_sv": 0.733056052774191, + "grad_min_sv": 6.172693325368073e-08, + "grad_condition": 11926578.893480929, + "lr": 0.0008852566213878947, + "time_sec": 15.304250001907349 + }, + { + "epoch": 23, + "train_loss": 0.4068706720542908, + "train_acc": 0.85872, + "test_loss": 0.6962938892364502, + "test_acc": 0.7771, + "lyapunov": null, + "grad_norm": 1.0041008989601972, + "grad_max_sv": 0.6977266952395439, + "grad_min_sv": 6.174876086006975e-08, + "grad_condition": 11375115.065625418, + "lr": 0.0008750555348152298, + "time_sec": 15.29546570777893 + }, + { + "epoch": 24, + "train_loss": 0.3927080359458923, + "train_acc": 0.86198, + "test_loss": 0.6316822688102722, + "test_acc": 0.797, + "lyapunov": null, + "grad_norm": 0.9591057928108919, + "grad_max_sv": 0.6601924143731595, + "grad_min_sv": 5.981677704269828e-08, + "grad_condition": 10958128.320144685, + "lr": 0.0008644843137107057, + "time_sec": 15.319843292236328 + }, + { + "epoch": 25, + "train_loss": 0.37991392849445343, + "train_acc": 0.8662, + "test_loss": 0.7685016389846802, + "test_acc": 0.7528, + "lyapunov": null, + "grad_norm": 0.9185108543931831, + "grad_max_sv": 0.5813446715474129, + "grad_min_sv": 5.7562914257403006e-08, + "grad_condition": 10132723.13073414, + "lr": 0.0008535533905932737, + "time_sec": 15.314316272735596 + }, + { + "epoch": 26, + "train_loss": 0.3740078569984436, + "train_acc": 0.86904, + "test_loss": 0.6302923937797547, + "test_acc": 0.7894, + "lyapunov": null, + "grad_norm": 0.896823092741051, + "grad_max_sv": 0.5897809371352196, + "grad_min_sv": 5.612208120453488e-08, + "grad_condition": 10555219.724126566, + "lr": 0.0008422735529643444, + "time_sec": 15.295911312103271 + }, + { + "epoch": 27, + "train_loss": 0.35986615454673765, + "train_acc": 0.8722, + "test_loss": 0.5293433817148209, + "test_acc": 0.8255, + "lyapunov": null, + "grad_norm": 0.8414160526480361, + "grad_max_sv": 0.5433246113359929, + "grad_min_sv": 5.460546566027347e-08, + "grad_condition": 10029361.12551422, + "lr": 0.0008306559326618259, + "time_sec": 15.296611309051514 + }, + { + "epoch": 28, + "train_loss": 0.34749350198745727, + "train_acc": 0.87846, + "test_loss": 0.6013012096405029, + "test_acc": 0.8077, + "lyapunov": null, + "grad_norm": 0.8012028361027335, + "grad_max_sv": 0.5324302047491074, + "grad_min_sv": 5.343053706141632e-08, + "grad_condition": 9995030.902296156, + "lr": 0.0008187119948743449, + "time_sec": 15.314170122146606 + }, + { + "epoch": 29, + "train_loss": 0.33312201313018797, + "train_acc": 0.88212, + "test_loss": 0.5545183982849121, + "test_acc": 0.8162, + "lyapunov": null, + "grad_norm": 0.7852771005330633, + "grad_max_sv": 0.5164767228066921, + "grad_min_sv": 5.198521888516439e-08, + "grad_condition": 10107248.49432898, + "lr": 0.0008064535268264883, + "time_sec": 15.311892986297607 + }, + { + "epoch": 30, + "train_loss": 0.3230313647842407, + "train_acc": 0.88538, + "test_loss": 0.658975659275055, + "test_acc": 0.7951, + "lyapunov": null, + "grad_norm": 0.7620779575769897, + "grad_max_sv": 0.5038670122623443, + "grad_min_sv": 5.0398949014152095e-08, + "grad_condition": 10038873.739317197, + "lr": 0.0007938926261462367, + "time_sec": 15.305739402770996 + }, + { + "epoch": 31, + "train_loss": 0.318023904876709, + "train_acc": 0.88796, + "test_loss": 0.6099616609573364, + "test_acc": 0.8127, + "lyapunov": null, + "grad_norm": 0.7501021639283835, + "grad_max_sv": 0.48214229866862296, + "grad_min_sv": 5.136175964537415e-08, + "grad_condition": 9343056.264591306, + "lr": 0.0007810416889260654, + "time_sec": 15.325766324996948 + }, + { + "epoch": 32, + "train_loss": 0.31232675287246703, + "train_acc": 0.89082, + "test_loss": 0.5936648756027222, + "test_acc": 0.8109, + "lyapunov": null, + "grad_norm": 0.7279129448401558, + "grad_max_sv": 0.4431505911052227, + "grad_min_sv": 4.812153910904726e-08, + "grad_condition": 9245973.275864627, + "lr": 0.0007679133974894983, + "time_sec": 15.317164897918701 + }, + { + "epoch": 33, + "train_loss": 0.29341697571754455, + "train_acc": 0.8967, + "test_loss": 0.5134524160385132, + "test_acc": 0.8357, + "lyapunov": null, + "grad_norm": 0.6884958324446571, + "grad_max_sv": 0.4426784858107567, + "grad_min_sv": 4.9337259699910875e-08, + "grad_condition": 9173234.108017813, + "lr": 0.0007545207078751857, + "time_sec": 15.312905311584473 + }, + { + "epoch": 34, + "train_loss": 0.2897170938873291, + "train_acc": 0.89828, + "test_loss": 0.5332132309913635, + "test_acc": 0.8335, + "lyapunov": null, + "grad_norm": 0.6750271636840882, + "grad_max_sv": 0.4532689817249775, + "grad_min_sv": 4.866335441278125e-08, + "grad_condition": 9412153.339201316, + "lr": 0.0007408768370508577, + "time_sec": 15.313745260238647 + }, + { + "epoch": 35, + "train_loss": 0.28602589085578917, + "train_acc": 0.89756, + "test_loss": 0.6111867341041565, + "test_acc": 0.8164, + "lyapunov": null, + "grad_norm": 0.6693786571127541, + "grad_max_sv": 0.4255728892982006, + "grad_min_sv": 4.737296563916971e-08, + "grad_condition": 9020003.170186436, + "lr": 0.0007269952498697734, + "time_sec": 15.32437539100647 + }, + { + "epoch": 36, + "train_loss": 0.2724088624763489, + "train_acc": 0.90408, + "test_loss": 0.5054482436180114, + "test_acc": 0.8387, + "lyapunov": null, + "grad_norm": 0.6416324201224461, + "grad_max_sv": 0.4291106700897217, + "grad_min_sv": 4.6136759568327077e-08, + "grad_condition": 9385408.654433403, + "lr": 0.0007128896457825364, + "time_sec": 15.322253704071045 + }, + { + "epoch": 37, + "train_loss": 0.26598569943904876, + "train_acc": 0.90576, + "test_loss": 0.5292941621780396, + "test_acc": 0.8315, + "lyapunov": null, + "grad_norm": 0.6311835178833255, + "grad_max_sv": 0.372799988463521, + "grad_min_sv": 4.42526025601353e-08, + "grad_condition": 8432960.688056583, + "lr": 0.0006985739453173903, + "time_sec": 15.330822467803955 + }, + { + "epoch": 38, + "train_loss": 0.2548411606884003, + "train_acc": 0.90972, + "test_loss": 0.5889158064842224, + "test_acc": 0.8304, + "lyapunov": null, + "grad_norm": 0.6075907586779873, + "grad_max_sv": 0.40464401319622995, + "grad_min_sv": 4.5029356776638e-08, + "grad_condition": 9144084.308266882, + "lr": 0.0006840622763423391, + "time_sec": 15.306779623031616 + }, + { + "epoch": 39, + "train_loss": 0.2488733386993408, + "train_acc": 0.91114, + "test_loss": 0.5380938538551331, + "test_acc": 0.8325, + "lyapunov": null, + "grad_norm": 0.6071846116294305, + "grad_max_sv": 0.3960565410554409, + "grad_min_sv": 4.6051877067299075e-08, + "grad_condition": 8601152.95310002, + "lr": 0.0006693689601226458, + "time_sec": 15.341014862060547 + }, + { + "epoch": 40, + "train_loss": 0.24494112944602967, + "train_acc": 0.91272, + "test_loss": 0.5513611147403717, + "test_acc": 0.8299, + "lyapunov": null, + "grad_norm": 0.592226155692726, + "grad_max_sv": 0.3729955680668354, + "grad_min_sv": 4.293505284636012e-08, + "grad_condition": 8794710.30872355, + "lr": 0.0006545084971874737, + "time_sec": 15.389995813369751 + }, + { + "epoch": 41, + "train_loss": 0.23727083059310913, + "train_acc": 0.9153, + "test_loss": 0.516801796245575, + "test_acc": 0.8461, + "lyapunov": null, + "grad_norm": 0.5812900748217327, + "grad_max_sv": 0.38579080179333686, + "grad_min_sv": 4.4259539766500214e-08, + "grad_condition": 8748753.244401883, + "lr": 0.0006394955530196147, + "time_sec": 15.318362474441528 + }, + { + "epoch": 42, + "train_loss": 0.22481181490898133, + "train_acc": 0.92022, + "test_loss": 0.5416705925941467, + "test_acc": 0.8322, + "lyapunov": null, + "grad_norm": 0.5619779097810216, + "grad_max_sv": 0.35356797464191914, + "grad_min_sv": 4.2614826689657547e-08, + "grad_condition": 8335709.16485816, + "lr": 0.0006243449435824273, + "time_sec": 15.315505743026733 + }, + { + "epoch": 43, + "train_loss": 0.22531912160873413, + "train_acc": 0.9199, + "test_loss": 0.5833574778556824, + "test_acc": 0.8338, + "lyapunov": null, + "grad_norm": 0.557199013327348, + "grad_max_sv": 0.33938006646931174, + "grad_min_sv": 4.300346327923421e-08, + "grad_condition": 7932422.911212927, + "lr": 0.0006090716206982714, + "time_sec": 15.32206392288208 + }, + { + "epoch": 44, + "train_loss": 0.216223452000618, + "train_acc": 0.92378, + "test_loss": 0.5012358224868775, + "test_acc": 0.8491, + "lyapunov": null, + "grad_norm": 0.5383308349401124, + "grad_max_sv": 0.3396204937249422, + "grad_min_sv": 4.201267005399245e-08, + "grad_condition": 8110585.992247519, + "lr": 0.0005936906572928625, + "time_sec": 15.314954042434692 + }, + { + "epoch": 45, + "train_loss": 0.21238275866508483, + "train_acc": 0.92506, + "test_loss": 0.5394745681762695, + "test_acc": 0.8426, + "lyapunov": null, + "grad_norm": 0.5338537929467614, + "grad_max_sv": 0.34414798244833944, + "grad_min_sv": 4.2673109312829635e-08, + "grad_condition": 8155102.629835799, + "lr": 0.0005782172325201156, + "time_sec": 15.313148975372314 + }, + { + "epoch": 46, + "train_loss": 0.2043999564409256, + "train_acc": 0.9264, + "test_loss": 0.4982535705089569, + "test_acc": 0.851, + "lyapunov": null, + "grad_norm": 0.518001070564685, + "grad_max_sv": 0.3181751623749733, + "grad_min_sv": 4.258852284166892e-08, + "grad_condition": 7586177.211236173, + "lr": 0.0005626666167821523, + "time_sec": 15.31693696975708 + }, + { + "epoch": 47, + "train_loss": 0.19748862716674806, + "train_acc": 0.93056, + "test_loss": 0.511198134803772, + "test_acc": 0.8512, + "lyapunov": null, + "grad_norm": 0.5066091467854666, + "grad_max_sv": 0.3097307480871677, + "grad_min_sv": 4.0578768167875976e-08, + "grad_condition": 7694719.511876054, + "lr": 0.0005470541566592572, + "time_sec": 15.311876773834229 + }, + { + "epoch": 48, + "train_loss": 0.18840614411354065, + "train_acc": 0.93296, + "test_loss": 0.5223799973011017, + "test_acc": 0.8486, + "lyapunov": null, + "grad_norm": 0.4947799501006328, + "grad_max_sv": 0.32398409508168696, + "grad_min_sv": 3.967475805666254e-08, + "grad_condition": 8181991.0382896485, + "lr": 0.0005313952597646569, + "time_sec": 15.324450016021729 + }, + { + "epoch": 49, + "train_loss": 0.1852111140346527, + "train_acc": 0.93434, + "test_loss": 0.5372783863067627, + "test_acc": 0.8442, + "lyapunov": null, + "grad_norm": 0.49013002688624263, + "grad_max_sv": 0.3128523100167513, + "grad_min_sv": 4.042725132435976e-08, + "grad_condition": 7786375.414612537, + "lr": 0.0005157053795390643, + "time_sec": 15.311121940612793 + }, + { + "epoch": 50, + "train_loss": 0.17850845782279967, + "train_acc": 0.9363, + "test_loss": 0.5162768915176391, + "test_acc": 0.8514, + "lyapunov": null, + "grad_norm": 0.4757476361255021, + "grad_max_sv": 0.3146433509886265, + "grad_min_sv": 3.966314778836022e-08, + "grad_condition": 7931529.673702802, + "lr": 0.0005000000000000002, + "time_sec": 15.3083016872406 + }, + { + "epoch": 51, + "train_loss": 0.17266313230514527, + "train_acc": 0.9392, + "test_loss": 0.5169307453155517, + "test_acc": 0.8514, + "lyapunov": null, + "grad_norm": 0.47267825902613214, + "grad_max_sv": 0.30655047073960306, + "grad_min_sv": 3.728870501262804e-08, + "grad_condition": 8340291.307145154, + "lr": 0.00048429462046093607, + "time_sec": 15.306477308273315 + }, + { + "epoch": 52, + "train_loss": 0.1663313666152954, + "train_acc": 0.94122, + "test_loss": 0.5442662063598633, + "test_acc": 0.8474, + "lyapunov": null, + "grad_norm": 0.46294043228921017, + "grad_max_sv": 0.31195108480751516, + "grad_min_sv": 3.8414651104545784e-08, + "grad_condition": 8124213.069898104, + "lr": 0.0004686047402353435, + "time_sec": 15.31308388710022 + }, + { + "epoch": 53, + "train_loss": 0.16149800906658174, + "train_acc": 0.94246, + "test_loss": 0.580558476114273, + "test_acc": 0.8416, + "lyapunov": null, + "grad_norm": 0.4519494684602909, + "grad_max_sv": 0.2916812110692263, + "grad_min_sv": 3.7287610199499e-08, + "grad_condition": 7889287.089630139, + "lr": 0.000452945843340743, + "time_sec": 15.30961537361145 + }, + { + "epoch": 54, + "train_loss": 0.16166152165412903, + "train_acc": 0.94208, + "test_loss": 0.5555281185150146, + "test_acc": 0.8473, + "lyapunov": null, + "grad_norm": 0.45553329333157905, + "grad_max_sv": 0.2948467206209898, + "grad_min_sv": 3.7315171308449634e-08, + "grad_condition": 7971105.5751351025, + "lr": 0.00043733338321784806, + "time_sec": 15.302156925201416 + }, + { + "epoch": 55, + "train_loss": 0.1565243923521042, + "train_acc": 0.94508, + "test_loss": 0.5074358646392823, + "test_acc": 0.8554, + "lyapunov": null, + "grad_norm": 0.4482394365745094, + "grad_max_sv": 0.2973413269966841, + "grad_min_sv": 3.757956048566768e-08, + "grad_condition": 8002347.089848238, + "lr": 0.0004217827674798847, + "time_sec": 15.313871145248413 + }, + { + "epoch": 56, + "train_loss": 0.14638519546031953, + "train_acc": 0.94786, + "test_loss": 0.4880453747272491, + "test_acc": 0.8653, + "lyapunov": null, + "grad_norm": 0.4314707571224286, + "grad_max_sv": 0.2860257361084223, + "grad_min_sv": 3.907978447514893e-08, + "grad_condition": 7325521.391552436, + "lr": 0.00040630934270713783, + "time_sec": 15.315257549285889 + }, + { + "epoch": 57, + "train_loss": 0.14646475307941437, + "train_acc": 0.94766, + "test_loss": 0.576962650680542, + "test_acc": 0.847, + "lyapunov": null, + "grad_norm": 0.4344661359835185, + "grad_max_sv": 0.27631179951131346, + "grad_min_sv": 3.824539080987677e-08, + "grad_condition": 7229591.786889655, + "lr": 0.000390928379301729, + "time_sec": 15.307274341583252 + }, + { + "epoch": 58, + "train_loss": 0.13712914622783662, + "train_acc": 0.95096, + "test_loss": 0.577113539648056, + "test_acc": 0.8499, + "lyapunov": null, + "grad_norm": 0.42148317642657124, + "grad_max_sv": 0.2975440930575132, + "grad_min_sv": 3.797022123386284e-08, + "grad_condition": 7915512.058803884, + "lr": 0.0003756550564175727, + "time_sec": 15.30914568901062 + }, + { + "epoch": 59, + "train_loss": 0.13448802095890044, + "train_acc": 0.95234, + "test_loss": 0.5032788132190704, + "test_acc": 0.8625, + "lyapunov": null, + "grad_norm": 0.4112977684378401, + "grad_max_sv": 0.2814919870346785, + "grad_min_sv": 3.85102704836271e-08, + "grad_condition": 7377336.951999759, + "lr": 0.00036050444698038553, + "time_sec": 15.317845106124878 + }, + { + "epoch": 60, + "train_loss": 0.13363940123558044, + "train_acc": 0.952, + "test_loss": 0.5432449889659882, + "test_acc": 0.854, + "lyapunov": null, + "grad_norm": 0.4126784436246539, + "grad_max_sv": 0.2804244253784418, + "grad_min_sv": 3.7023297405625045e-08, + "grad_condition": 7621956.91724248, + "lr": 0.00034549150281252655, + "time_sec": 15.322251796722412 + }, + { + "epoch": 61, + "train_loss": 0.12653651702404023, + "train_acc": 0.9556, + "test_loss": 0.49968673663139346, + "test_acc": 0.8678, + "lyapunov": null, + "grad_norm": 0.4007355103640766, + "grad_max_sv": 0.27012523673474786, + "grad_min_sv": 3.795508094484035e-08, + "grad_condition": 7141541.257203001, + "lr": 0.0003306310398773544, + "time_sec": 15.314436435699463 + }, + { + "epoch": 62, + "train_loss": 0.12188665760755539, + "train_acc": 0.9566, + "test_loss": 0.5593991501808167, + "test_acc": 0.8565, + "lyapunov": null, + "grad_norm": 0.3921398359098778, + "grad_max_sv": 0.27338829450309277, + "grad_min_sv": 3.639061785243314e-08, + "grad_condition": 7584044.263979311, + "lr": 0.00031593772365766127, + "time_sec": 15.302758693695068 + }, + { + "epoch": 63, + "train_loss": 0.1223608536529541, + "train_acc": 0.95622, + "test_loss": 0.5149862161636353, + "test_acc": 0.8612, + "lyapunov": null, + "grad_norm": 0.39447951861080405, + "grad_max_sv": 0.2628227811306715, + "grad_min_sv": 3.7084175330548416e-08, + "grad_condition": 7085494.638547185, + "lr": 0.0003014260546826097, + "time_sec": 15.300389051437378 + }, + { + "epoch": 64, + "train_loss": 0.11717436948299408, + "train_acc": 0.95768, + "test_loss": 0.5029231981754303, + "test_acc": 0.8645, + "lyapunov": null, + "grad_norm": 0.3837842917710247, + "grad_max_sv": 0.2503308400511742, + "grad_min_sv": 3.676226967286311e-08, + "grad_condition": 6852674.209660569, + "lr": 0.0002871103542174637, + "time_sec": 15.306849479675293 + }, + { + "epoch": 65, + "train_loss": 0.1104171419763565, + "train_acc": 0.96138, + "test_loss": 0.5105278373241424, + "test_acc": 0.8621, + "lyapunov": null, + "grad_norm": 0.37324824392122696, + "grad_max_sv": 0.24798878654837608, + "grad_min_sv": 3.5933988673519934e-08, + "grad_condition": 6928104.161500673, + "lr": 0.0002730047501302267, + "time_sec": 15.306128978729248 + }, + { + "epoch": 66, + "train_loss": 0.11005497314453125, + "train_acc": 0.9604, + "test_loss": 0.5454881217956543, + "test_acc": 0.8593, + "lyapunov": null, + "grad_norm": 0.3740796827280413, + "grad_max_sv": 0.25094335451722144, + "grad_min_sv": 3.760543059172505e-08, + "grad_condition": 6680130.259128613, + "lr": 0.00025912316294914234, + "time_sec": 15.311371803283691 + }, + { + "epoch": 67, + "train_loss": 0.1054667473077774, + "train_acc": 0.96206, + "test_loss": 0.5242725006103516, + "test_acc": 0.8654, + "lyapunov": null, + "grad_norm": 0.368892738378212, + "grad_max_sv": 0.25266984924674035, + "grad_min_sv": 3.633599621188921e-08, + "grad_condition": 7013352.02049877, + "lr": 0.0002454792921248144, + "time_sec": 15.30515193939209 + }, + { + "epoch": 68, + "train_loss": 0.10004293047904968, + "train_acc": 0.96412, + "test_loss": 0.5743433611869811, + "test_acc": 0.8538, + "lyapunov": null, + "grad_norm": 0.3572601369548122, + "grad_max_sv": 0.24928448162972927, + "grad_min_sv": 3.5534662101710524e-08, + "grad_condition": 7054160.907809177, + "lr": 0.00023208660251050164, + "time_sec": 15.31411099433899 + }, + { + "epoch": 69, + "train_loss": 0.09898206293821335, + "train_acc": 0.96434, + "test_loss": 0.5453432657718659, + "test_acc": 0.8647, + "lyapunov": null, + "grad_norm": 0.3575462219401736, + "grad_max_sv": 0.22338325902819633, + "grad_min_sv": 3.5619033011968784e-08, + "grad_condition": 6388845.433191194, + "lr": 0.00021895831107393473, + "time_sec": 15.320244789123535 + }, + { + "epoch": 70, + "train_loss": 0.09576731202960015, + "train_acc": 0.96662, + "test_loss": 0.5289871492862701, + "test_acc": 0.8673, + "lyapunov": null, + "grad_norm": 0.3475548635629844, + "grad_max_sv": 0.22887863107025624, + "grad_min_sv": 3.558577605922153e-08, + "grad_condition": 6520932.801253774, + "lr": 0.00020610737385376356, + "time_sec": 15.312981367111206 + }, + { + "epoch": 71, + "train_loss": 0.09435438349246979, + "train_acc": 0.96552, + "test_loss": 0.5673801244735718, + "test_acc": 0.8597, + "lyapunov": null, + "grad_norm": 0.35002047617094667, + "grad_max_sv": 0.24012817665934563, + "grad_min_sv": 3.424292120968175e-08, + "grad_condition": 7037803.21914607, + "lr": 0.00019354647317351177, + "time_sec": 15.323097705841064 + }, + { + "epoch": 72, + "train_loss": 0.0899286351108551, + "train_acc": 0.96766, + "test_loss": 0.5408580667495727, + "test_acc": 0.8662, + "lyapunov": null, + "grad_norm": 0.34100528699001653, + "grad_max_sv": 0.22443376183509828, + "grad_min_sv": 3.460758826179244e-08, + "grad_condition": 6548190.204110672, + "lr": 0.0001812880051256552, + "time_sec": 15.303936243057251 + }, + { + "epoch": 73, + "train_loss": 0.08644640971183777, + "train_acc": 0.9696, + "test_loss": 0.5231532414436341, + "test_acc": 0.8687, + "lyapunov": null, + "grad_norm": 0.3297853844853395, + "grad_max_sv": 0.23831307105720043, + "grad_min_sv": 3.648763895469642e-08, + "grad_condition": 6564265.399345921, + "lr": 0.00016934406733817422, + "time_sec": 15.323826313018799 + }, + { + "epoch": 74, + "train_loss": 0.08675267961740493, + "train_acc": 0.96966, + "test_loss": 0.531370454120636, + "test_acc": 0.8724, + "lyapunov": null, + "grad_norm": 0.33474921077291964, + "grad_max_sv": 0.23228033129125833, + "grad_min_sv": 3.54595965035287e-08, + "grad_condition": 6646670.669053013, + "lr": 0.0001577264470356557, + "time_sec": 15.305448532104492 + }, + { + "epoch": 75, + "train_loss": 0.08520255417346954, + "train_acc": 0.96946, + "test_loss": 0.5489996848106384, + "test_acc": 0.8629, + "lyapunov": null, + "grad_norm": 0.333062577424503, + "grad_max_sv": 0.23861498832702638, + "grad_min_sv": 3.416034828340742e-08, + "grad_condition": 7057996.098654354, + "lr": 0.00014644660940672634, + "time_sec": 15.307157516479492 + }, + { + "epoch": 76, + "train_loss": 0.08347911696434021, + "train_acc": 0.97006, + "test_loss": 0.5250146618843079, + "test_acc": 0.8686, + "lyapunov": null, + "grad_norm": 0.3315871550000043, + "grad_max_sv": 0.23978985324501992, + "grad_min_sv": 3.5313697566152766e-08, + "grad_condition": 6836692.7541990755, + "lr": 0.0001355156862892944, + "time_sec": 15.2927827835083 + }, + { + "epoch": 77, + "train_loss": 0.08182602140903474, + "train_acc": 0.97104, + "test_loss": 0.5350998015880585, + "test_acc": 0.8704, + "lyapunov": null, + "grad_norm": 0.3273538350101595, + "grad_max_sv": 0.23843283373862506, + "grad_min_sv": 3.504422023681286e-08, + "grad_condition": 6836027.998268524, + "lr": 0.00012494446518477025, + "time_sec": 15.317047834396362 + }, + { + "epoch": 78, + "train_loss": 0.07884973392605782, + "train_acc": 0.9722, + "test_loss": 0.543610359621048, + "test_acc": 0.869, + "lyapunov": null, + "grad_norm": 0.318085721614815, + "grad_max_sv": 0.2306290850043297, + "grad_min_sv": 3.51138401910589e-08, + "grad_condition": 6598865.01839647, + "lr": 0.00011474337861210548, + "time_sec": 15.346408605575562 + }, + { + "epoch": 79, + "train_loss": 0.07515444636344909, + "train_acc": 0.97302, + "test_loss": 0.5453424057006836, + "test_acc": 0.8685, + "lyapunov": null, + "grad_norm": 0.30764732453726595, + "grad_max_sv": 0.23328058049082756, + "grad_min_sv": 3.4018917194345025e-08, + "grad_condition": 6898312.859708968, + "lr": 0.00010492249381215483, + "time_sec": 15.312849998474121 + }, + { + "epoch": 80, + "train_loss": 0.07553981874942779, + "train_acc": 0.97342, + "test_loss": 0.5447598055839539, + "test_acc": 0.8687, + "lyapunov": null, + "grad_norm": 0.3126827627293077, + "grad_max_sv": 0.22440926413983106, + "grad_min_sv": 3.5051727831358904e-08, + "grad_condition": 6508990.801328001, + "lr": 9.549150281252637e-05, + "time_sec": 15.31579327583313 + }, + { + "epoch": 81, + "train_loss": 0.0691981615459919, + "train_acc": 0.9767, + "test_loss": 0.6010801038742065, + "test_acc": 0.8592, + "lyapunov": null, + "grad_norm": 0.2964655372784287, + "grad_max_sv": 0.20926067158579825, + "grad_min_sv": 3.334633209561844e-08, + "grad_condition": 6336645.734981732, + "lr": 8.645971286271918e-05, + "time_sec": 15.311565399169922 + }, + { + "epoch": 82, + "train_loss": 0.07134237255096436, + "train_acc": 0.97564, + "test_loss": 0.5511228674888611, + "test_acc": 0.8685, + "lyapunov": null, + "grad_norm": 0.3035210287863858, + "grad_max_sv": 0.2166539143770933, + "grad_min_sv": 3.444789098416834e-08, + "grad_condition": 6316501.5285459785, + "lr": 7.78360372489926e-05, + "time_sec": 15.321164846420288 + }, + { + "epoch": 83, + "train_loss": 0.06894262619018554, + "train_acc": 0.97574, + "test_loss": 0.5341768414020538, + "test_acc": 0.8666, + "lyapunov": null, + "grad_norm": 0.3006016750160245, + "grad_max_sv": 0.214569428935647, + "grad_min_sv": 3.390297984573465e-08, + "grad_condition": 6347736.579489769, + "lr": 6.962898649802815e-05, + "time_sec": 15.31421685218811 + }, + { + "epoch": 84, + "train_loss": 0.06843596329629421, + "train_acc": 0.97558, + "test_loss": 0.5208944204807282, + "test_acc": 0.8703, + "lyapunov": null, + "grad_norm": 0.2931609715468412, + "grad_max_sv": 0.2041362512856722, + "grad_min_sv": 3.608063616766799e-08, + "grad_condition": 5852493.960090882, + "lr": 6.184665997806824e-05, + "time_sec": 15.313952445983887 + }, + { + "epoch": 85, + "train_loss": 0.06798111920118331, + "train_acc": 0.97708, + "test_loss": 0.5408778586387635, + "test_acc": 0.869, + "lyapunov": null, + "grad_norm": 0.2949462881166867, + "grad_max_sv": 0.2191694311797619, + "grad_min_sv": 3.3161099466383345e-08, + "grad_condition": 6683084.915046187, + "lr": 5.449673790581613e-05, + "time_sec": 15.323522567749023 + }, + { + "epoch": 86, + "train_loss": 0.06374187029123306, + "train_acc": 0.97854, + "test_loss": 0.534241654920578, + "test_acc": 0.8701, + "lyapunov": null, + "grad_norm": 0.28381214745100436, + "grad_max_sv": 0.21770549267530442, + "grad_min_sv": 3.4639007706616096e-08, + "grad_condition": 6392279.068014438, + "lr": 4.758647376699034e-05, + "time_sec": 15.312573432922363 + }, + { + "epoch": 87, + "train_loss": 0.06471459998726845, + "train_acc": 0.97748, + "test_loss": 0.5297845101356506, + "test_acc": 0.8726, + "lyapunov": null, + "grad_norm": 0.28897487313019665, + "grad_max_sv": 0.19332378804683686, + "grad_min_sv": 3.343392815935431e-08, + "grad_condition": 5824270.640002059, + "lr": 4.112268715800956e-05, + "time_sec": 15.310936450958252 + }, + { + "epoch": 88, + "train_loss": 0.06347171569228173, + "train_acc": 0.97814, + "test_loss": 0.5321846860408783, + "test_acc": 0.8722, + "lyapunov": null, + "grad_norm": 0.2861217885894181, + "grad_max_sv": 0.18890463691204787, + "grad_min_sv": 3.443075908826643e-08, + "grad_condition": 5578610.167209303, + "lr": 3.511175705587434e-05, + "time_sec": 15.30883502960205 + }, + { + "epoch": 89, + "train_loss": 0.06456126765966415, + "train_acc": 0.97732, + "test_loss": 0.5306058297157288, + "test_acc": 0.8724, + "lyapunov": null, + "grad_norm": 0.2911671580013793, + "grad_max_sv": 0.20169610902667046, + "grad_min_sv": 3.3340199756537456e-08, + "grad_condition": 6113921.310843622, + "lr": 2.9559615522887284e-05, + "time_sec": 15.325217247009277 + }, + { + "epoch": 90, + "train_loss": 0.05981739419221878, + "train_acc": 0.97936, + "test_loss": 0.5510406871795654, + "test_acc": 0.8698, + "lyapunov": null, + "grad_norm": 0.27406962038993515, + "grad_max_sv": 0.20393476765602828, + "grad_min_sv": 3.436182409721766e-08, + "grad_condition": 6006804.61096659, + "lr": 2.447174185242324e-05, + "time_sec": 15.308394432067871 + }, + { + "epoch": 91, + "train_loss": 0.05843851445674896, + "train_acc": 0.97988, + "test_loss": 0.5369569517612457, + "test_acc": 0.8726, + "lyapunov": null, + "grad_norm": 0.270215680703968, + "grad_max_sv": 0.19462423361837863, + "grad_min_sv": 3.2800926286213895e-08, + "grad_condition": 5976870.852957519, + "lr": 1.9853157161528526e-05, + "time_sec": 15.312544584274292 + }, + { + "epoch": 92, + "train_loss": 0.06141342503786087, + "train_acc": 0.9789, + "test_loss": 0.5492124430656433, + "test_acc": 0.8715, + "lyapunov": null, + "grad_norm": 0.28355491226552393, + "grad_max_sv": 0.20141606461256742, + "grad_min_sv": 3.389024190170176e-08, + "grad_condition": 6025484.075561702, + "lr": 1.570841943568452e-05, + "time_sec": 15.318751096725464 + }, + { + "epoch": 93, + "train_loss": 0.06185958398580551, + "train_acc": 0.9791, + "test_loss": 0.5353557282447815, + "test_acc": 0.8734, + "lyapunov": null, + "grad_norm": 0.28019086696986784, + "grad_max_sv": 0.20358563121408224, + "grad_min_sv": 3.4872499954374805e-08, + "grad_condition": 5972181.870711091, + "lr": 1.204161903062634e-05, + "time_sec": 15.310726404190063 + }, + { + "epoch": 94, + "train_loss": 0.061077375268936154, + "train_acc": 0.97862, + "test_loss": 0.5403136486530304, + "test_acc": 0.8726, + "lyapunov": null, + "grad_norm": 0.27793458972654056, + "grad_max_sv": 0.21468139700591565, + "grad_min_sv": 3.314470546911252e-08, + "grad_condition": 6531953.716980138, + "lr": 8.85637463565564e-06, + "time_sec": 15.322482585906982 + }, + { + "epoch": 95, + "train_loss": 0.059067166829109195, + "train_acc": 0.9801, + "test_loss": 0.5499792334079743, + "test_acc": 0.8706, + "lyapunov": null, + "grad_norm": 0.2726950869177449, + "grad_max_sv": 0.1847312103956938, + "grad_min_sv": 3.442832863242984e-08, + "grad_condition": 5484378.490748374, + "lr": 6.155829702431171e-06, + "time_sec": 15.331462860107422 + }, + { + "epoch": 96, + "train_loss": 0.058869197854995725, + "train_acc": 0.97992, + "test_loss": 0.5609679688453675, + "test_acc": 0.8699, + "lyapunov": null, + "grad_norm": 0.2733600212103379, + "grad_max_sv": 0.203422649204731, + "grad_min_sv": 3.4962690476092464e-08, + "grad_condition": 5877045.15462194, + "lr": 3.942649342761118e-06, + "time_sec": 15.318592071533203 + }, + { + "epoch": 97, + "train_loss": 0.05934914319038391, + "train_acc": 0.97972, + "test_loss": 0.5556031215667725, + "test_acc": 0.8687, + "lyapunov": null, + "grad_norm": 0.2765716324142509, + "grad_max_sv": 0.1996933190152049, + "grad_min_sv": 3.3284164402402895e-08, + "grad_condition": 6129925.740326188, + "lr": 2.2190176984600023e-06, + "time_sec": 15.329679727554321 + }, + { + "epoch": 98, + "train_loss": 0.05874215810537338, + "train_acc": 0.97992, + "test_loss": 0.5451333051681518, + "test_acc": 0.8712, + "lyapunov": null, + "grad_norm": 0.2696205462857481, + "grad_max_sv": 0.19026922769844531, + "grad_min_sv": 3.324827377859663e-08, + "grad_condition": 5756655.141047328, + "lr": 9.866357858642206e-07, + "time_sec": 15.31182599067688 + }, + { + "epoch": 99, + "train_loss": 0.059339061715602874, + "train_acc": 0.98046, + "test_loss": 0.5511723966598511, + "test_acc": 0.8694, + "lyapunov": null, + "grad_norm": 0.2722387278016211, + "grad_max_sv": 0.17949199080467224, + "grad_min_sv": 3.178271090753526e-08, + "grad_condition": 5671386.367227938, + "lr": 2.467198171342e-07, + "time_sec": 15.313301801681519 + }, + { + "epoch": 100, + "train_loss": 0.05937783687353134, + "train_acc": 0.97908, + "test_loss": 0.5341217585086823, + "test_acc": 0.8723, + "lyapunov": null, + "grad_norm": 0.275408042809645, + "grad_max_sv": 0.19940215721726418, + "grad_min_sv": 3.299201711826072e-08, + "grad_condition": 6121670.713258359, + "lr": 0.0, + "time_sec": 15.337401151657104 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 2.1551968896484377, + "train_acc": 0.2953, + "test_loss": 1.8477057243347168, + "test_acc": 0.3437, + "lyapunov": null, + "grad_norm": 8.144943624656428, + "grad_max_sv": 7.675079941749573, + "grad_min_sv": 2.827612160416493e-07, + "grad_condition": 28317355.270070046, + "lr": 0.0009997532801828658, + "time_sec": 32.46485447883606 + }, + { + "epoch": 2, + "train_loss": 1.6082625040054321, + "train_acc": 0.42284, + "test_loss": 1.6673745800018311, + "test_acc": 0.406, + "lyapunov": null, + "grad_norm": 6.065037474589551, + "grad_max_sv": 5.5711340546607975, + "grad_min_sv": 2.234880795981553e-07, + "grad_condition": 25327173.99046154, + "lr": 0.0009990133642141358, + "time_sec": 32.39758110046387 + }, + { + "epoch": 3, + "train_loss": 1.4377277154159547, + "train_acc": 0.48488, + "test_loss": 1.5402760635375976, + "test_acc": 0.4555, + "lyapunov": null, + "grad_norm": 5.494687491087257, + "grad_max_sv": 4.691517299413681, + "grad_min_sv": 1.9618108950680835e-07, + "grad_condition": 24150344.903272796, + "lr": 0.00099778098230154, + "time_sec": 32.400826930999756 + }, + { + "epoch": 4, + "train_loss": 1.2879639573669435, + "train_acc": 0.53716, + "test_loss": 1.8371749683380127, + "test_acc": 0.4098, + "lyapunov": null, + "grad_norm": 4.741620609793776, + "grad_max_sv": 4.525534170866012, + "grad_min_sv": 1.8297150106150184e-07, + "grad_condition": 24870782.059164062, + "lr": 0.000996057350657239, + "time_sec": 32.39713406562805 + }, + { + "epoch": 5, + "train_loss": 1.196011114768982, + "train_acc": 0.5717, + "test_loss": 1.1917746976852417, + "test_acc": 0.5662, + "lyapunov": null, + "grad_norm": 4.225084445671327, + "grad_max_sv": 3.8811924695968627, + "grad_min_sv": 1.7304786759098079e-07, + "grad_condition": 22788363.03168846, + "lr": 0.0009938441702975688, + "time_sec": 32.39927625656128 + }, + { + "epoch": 6, + "train_loss": 1.1017011584854126, + "train_acc": 0.60624, + "test_loss": 1.2156044723510742, + "test_acc": 0.5524, + "lyapunov": null, + "grad_norm": 3.8500733224578765, + "grad_max_sv": 3.3867243230342865, + "grad_min_sv": 1.5910630946081028e-07, + "grad_condition": 21517993.207089722, + "lr": 0.0009911436253643444, + "time_sec": 32.41104435920715 + }, + { + "epoch": 7, + "train_loss": 1.019956372566223, + "train_acc": 0.63884, + "test_loss": 1.0341911317825316, + "test_acc": 0.6312, + "lyapunov": null, + "grad_norm": 3.4050623209558424, + "grad_max_sv": 2.8642074435949327, + "grad_min_sv": 1.3970929391149411e-07, + "grad_condition": 20503012.26948414, + "lr": 0.0009879583809693736, + "time_sec": 32.39900183677673 + }, + { + "epoch": 8, + "train_loss": 0.952932172832489, + "train_acc": 0.66154, + "test_loss": 0.9561027820587158, + "test_acc": 0.6654, + "lyapunov": null, + "grad_norm": 3.069081296040065, + "grad_max_sv": 2.5316490083932877, + "grad_min_sv": 1.2806189264580325e-07, + "grad_condition": 19934874.23822563, + "lr": 0.0009842915805643154, + "time_sec": 32.39242911338806 + }, + { + "epoch": 9, + "train_loss": 0.8849921081352234, + "train_acc": 0.68628, + "test_loss": 1.0301121936798097, + "test_acc": 0.6342, + "lyapunov": null, + "grad_norm": 2.63645918277651, + "grad_max_sv": 2.232751601934433, + "grad_min_sv": 1.2227004724252312e-07, + "grad_condition": 18401740.489395566, + "lr": 0.0009801468428384714, + "time_sec": 32.409496545791626 + }, + { + "epoch": 10, + "train_loss": 0.8236279186630249, + "train_acc": 0.70854, + "test_loss": 0.8807288621902466, + "test_acc": 0.682, + "lyapunov": null, + "grad_norm": 2.300239690915013, + "grad_max_sv": 1.9658639460802079, + "grad_min_sv": 1.1437598530505966e-07, + "grad_condition": 17605252.06510754, + "lr": 0.0009755282581475767, + "time_sec": 32.40023136138916 + }, + { + "epoch": 11, + "train_loss": 0.788265288658142, + "train_acc": 0.72186, + "test_loss": 0.8550062474250794, + "test_acc": 0.6904, + "lyapunov": null, + "grad_norm": 2.12020034951075, + "grad_max_sv": 1.6186737358570098, + "grad_min_sv": 1.0332133957291489e-07, + "grad_condition": 15780748.729030486, + "lr": 0.0009704403844771127, + "time_sec": 32.40667533874512 + }, + { + "epoch": 12, + "train_loss": 0.7433690148735046, + "train_acc": 0.73772, + "test_loss": 0.8008458862304687, + "test_acc": 0.7171, + "lyapunov": null, + "grad_norm": 1.8897751819834427, + "grad_max_sv": 1.448184822499752, + "grad_min_sv": 9.324852872083511e-08, + "grad_condition": 15545592.26156075, + "lr": 0.0009648882429441257, + "time_sec": 32.4004065990448 + }, + { + "epoch": 13, + "train_loss": 0.7159804575920105, + "train_acc": 0.74844, + "test_loss": 0.8449424732208252, + "test_acc": 0.7107, + "lyapunov": null, + "grad_norm": 1.7162684736286458, + "grad_max_sv": 1.387939277291298, + "grad_min_sv": 9.02613965791943e-08, + "grad_condition": 15516859.545498159, + "lr": 0.0009588773128419905, + "time_sec": 32.39161419868469 + }, + { + "epoch": 14, + "train_loss": 0.6710689739608765, + "train_acc": 0.7652, + "test_loss": 0.8030969514846802, + "test_acc": 0.7199, + "lyapunov": null, + "grad_norm": 1.5415310022642745, + "grad_max_sv": 1.124143162369728, + "grad_min_sv": 7.788519358342683e-08, + "grad_condition": 14586378.513744438, + "lr": 0.0009524135262330098, + "time_sec": 32.40552067756653 + }, + { + "epoch": 15, + "train_loss": 0.6438176040267944, + "train_acc": 0.77396, + "test_loss": 0.7497868657112121, + "test_acc": 0.7401, + "lyapunov": null, + "grad_norm": 1.4186644873786285, + "grad_max_sv": 1.0314671725034714, + "grad_min_sv": 7.5272734179066e-08, + "grad_condition": 13653093.352212925, + "lr": 0.0009455032620941839, + "time_sec": 32.40474534034729 + }, + { + "epoch": 16, + "train_loss": 0.615869576702118, + "train_acc": 0.7829, + "test_loss": 0.7672984195709228, + "test_acc": 0.7337, + "lyapunov": null, + "grad_norm": 1.2847059491767132, + "grad_max_sv": 0.8981582961976529, + "grad_min_sv": 7.069710665774664e-08, + "grad_condition": 12774971.99569363, + "lr": 0.0009381533400219318, + "time_sec": 32.411378145217896 + }, + { + "epoch": 17, + "train_loss": 0.5916317593765259, + "train_acc": 0.79332, + "test_loss": 0.6773865149497986, + "test_acc": 0.7673, + "lyapunov": null, + "grad_norm": 1.1905850089737686, + "grad_max_sv": 0.8305475980043411, + "grad_min_sv": 6.581527465243652e-08, + "grad_condition": 12649477.259974267, + "lr": 0.0009303710135019719, + "time_sec": 32.40375375747681 + }, + { + "epoch": 18, + "train_loss": 0.5710988390541076, + "train_acc": 0.80148, + "test_loss": 0.6730817820549011, + "test_acc": 0.7658, + "lyapunov": null, + "grad_norm": 1.1184745092261044, + "grad_max_sv": 0.8092691361904144, + "grad_min_sv": 6.20087442726458e-08, + "grad_condition": 13237272.581055809, + "lr": 0.0009221639627510076, + "time_sec": 32.403624534606934 + }, + { + "epoch": 19, + "train_loss": 0.5524461611747742, + "train_acc": 0.80704, + "test_loss": 0.7162760413169861, + "test_acc": 0.7602, + "lyapunov": null, + "grad_norm": 1.023562615452227, + "grad_max_sv": 0.6794823326170445, + "grad_min_sv": 5.88299432280337e-08, + "grad_condition": 11704217.317878243, + "lr": 0.000913540287137281, + "time_sec": 32.39382600784302 + }, + { + "epoch": 20, + "train_loss": 0.5298428584098815, + "train_acc": 0.81452, + "test_loss": 0.7450216589927673, + "test_acc": 0.752, + "lyapunov": null, + "grad_norm": 0.9359144343942514, + "grad_max_sv": 0.5905756287276744, + "grad_min_sv": 5.571528873815623e-08, + "grad_condition": 10693233.182217773, + "lr": 0.0009045084971874739, + "time_sec": 32.40094780921936 + }, + { + "epoch": 21, + "train_loss": 0.5077325123977661, + "train_acc": 0.82174, + "test_loss": 0.63943037815094, + "test_acc": 0.7812, + "lyapunov": null, + "grad_norm": 0.8805285251076611, + "grad_max_sv": 0.615053903311491, + "grad_min_sv": 5.4429192175575734e-08, + "grad_condition": 11327012.575821584, + "lr": 0.0008950775061878452, + "time_sec": 32.38740086555481 + }, + { + "epoch": 22, + "train_loss": 0.4933246819114685, + "train_acc": 0.8259, + "test_loss": 0.718407027053833, + "test_acc": 0.7614, + "lyapunov": null, + "grad_norm": 0.8303617086611039, + "grad_max_sv": 0.5229416653513909, + "grad_min_sv": 5.0371477122723717e-08, + "grad_condition": 10417728.60900723, + "lr": 0.0008852566213878947, + "time_sec": 32.404406785964966 + }, + { + "epoch": 23, + "train_loss": 0.47660592782020567, + "train_acc": 0.83498, + "test_loss": 0.6119730060577393, + "test_acc": 0.7951, + "lyapunov": null, + "grad_norm": 0.7772569962051041, + "grad_max_sv": 0.5228113703429699, + "grad_min_sv": 4.883190189985953e-08, + "grad_condition": 10840281.592058718, + "lr": 0.0008750555348152298, + "time_sec": 32.41756844520569 + }, + { + "epoch": 24, + "train_loss": 0.4621484722900391, + "train_acc": 0.8354, + "test_loss": 0.6255874982833862, + "test_acc": 0.7921, + "lyapunov": null, + "grad_norm": 0.7435129116165293, + "grad_max_sv": 0.5028938911855221, + "grad_min_sv": 4.940657198915232e-08, + "grad_condition": 10262672.7433966, + "lr": 0.0008644843137107057, + "time_sec": 32.40160775184631 + }, + { + "epoch": 25, + "train_loss": 0.44543547362804414, + "train_acc": 0.84322, + "test_loss": 0.6244046552658081, + "test_acc": 0.8003, + "lyapunov": null, + "grad_norm": 0.7057766135770664, + "grad_max_sv": 0.45453565418720243, + "grad_min_sv": 4.47153126970079e-08, + "grad_condition": 10235918.99223967, + "lr": 0.0008535533905932737, + "time_sec": 32.397634983062744 + }, + { + "epoch": 26, + "train_loss": 0.4291659313964844, + "train_acc": 0.85028, + "test_loss": 0.586253802204132, + "test_acc": 0.8053, + "lyapunov": null, + "grad_norm": 0.6653011352683553, + "grad_max_sv": 0.40432176999747754, + "grad_min_sv": 4.4079006933372964e-08, + "grad_condition": 9263382.4971398, + "lr": 0.0008422735529643444, + "time_sec": 32.408364057540894 + }, + { + "epoch": 27, + "train_loss": 0.41755434021949767, + "train_acc": 0.8537, + "test_loss": 0.6190900807380676, + "test_acc": 0.8031, + "lyapunov": null, + "grad_norm": 0.634844213604884, + "grad_max_sv": 0.38489293307065964, + "grad_min_sv": 4.278397165435877e-08, + "grad_condition": 9083713.307072137, + "lr": 0.0008306559326618259, + "time_sec": 32.3781955242157 + }, + { + "epoch": 28, + "train_loss": 0.409987173576355, + "train_acc": 0.85588, + "test_loss": 0.6381987627029418, + "test_acc": 0.7967, + "lyapunov": null, + "grad_norm": 0.6208575070285024, + "grad_max_sv": 0.3849256232380867, + "grad_min_sv": 4.156698754087529e-08, + "grad_condition": 9343591.955088045, + "lr": 0.0008187119948743449, + "time_sec": 32.424397468566895 + }, + { + "epoch": 29, + "train_loss": 0.39254301443099976, + "train_acc": 0.86148, + "test_loss": 0.6114391220092773, + "test_acc": 0.8072, + "lyapunov": null, + "grad_norm": 0.5930731028782803, + "grad_max_sv": 0.35281661339104176, + "grad_min_sv": 3.97135552887562e-08, + "grad_condition": 8878121.049382607, + "lr": 0.0008064535268264883, + "time_sec": 32.40766763687134 + }, + { + "epoch": 30, + "train_loss": 0.3785347310256958, + "train_acc": 0.86726, + "test_loss": 0.6049399808883666, + "test_acc": 0.811, + "lyapunov": null, + "grad_norm": 0.5794796026042499, + "grad_max_sv": 0.36831745132803917, + "grad_min_sv": 4.032110121343635e-08, + "grad_condition": 9212028.38827365, + "lr": 0.0007938926261462367, + "time_sec": 32.40119290351868 + }, + { + "epoch": 31, + "train_loss": 0.3689020803642273, + "train_acc": 0.87034, + "test_loss": 0.6224831011772156, + "test_acc": 0.8103, + "lyapunov": null, + "grad_norm": 0.5518777770693967, + "grad_max_sv": 0.34497435614466665, + "grad_min_sv": 3.993250263789605e-08, + "grad_condition": 8691890.072923485, + "lr": 0.0007810416889260654, + "time_sec": 32.42319178581238 + }, + { + "epoch": 32, + "train_loss": 0.3600490350532532, + "train_acc": 0.87378, + "test_loss": 0.6563146770000458, + "test_acc": 0.7989, + "lyapunov": null, + "grad_norm": 0.5344416918727563, + "grad_max_sv": 0.3161147892475128, + "grad_min_sv": 3.79914633530376e-08, + "grad_condition": 8391808.948301231, + "lr": 0.0007679133974894983, + "time_sec": 32.40037226676941 + }, + { + "epoch": 33, + "train_loss": 0.3552369830417633, + "train_acc": 0.876, + "test_loss": 0.5918597935676575, + "test_acc": 0.8191, + "lyapunov": null, + "grad_norm": 0.5223477954823382, + "grad_max_sv": 0.32091905549168587, + "grad_min_sv": 3.692389771714488e-08, + "grad_condition": 8735655.499988783, + "lr": 0.0007545207078751857, + "time_sec": 32.39385366439819 + }, + { + "epoch": 34, + "train_loss": 0.3357627202987671, + "train_acc": 0.88192, + "test_loss": 0.6601162696361542, + "test_acc": 0.8074, + "lyapunov": null, + "grad_norm": 0.5010170887656177, + "grad_max_sv": 0.3139246258884668, + "grad_min_sv": 3.658822085306213e-08, + "grad_condition": 8606732.681616401, + "lr": 0.0007408768370508577, + "time_sec": 32.40888476371765 + }, + { + "epoch": 35, + "train_loss": 0.32540871870040894, + "train_acc": 0.88428, + "test_loss": 0.6114396753549576, + "test_acc": 0.8112, + "lyapunov": null, + "grad_norm": 0.4852002465463357, + "grad_max_sv": 0.3033136323094368, + "grad_min_sv": 3.599271058973841e-08, + "grad_condition": 8499862.031601336, + "lr": 0.0007269952498697734, + "time_sec": 32.40857720375061 + }, + { + "epoch": 36, + "train_loss": 0.32421252524375915, + "train_acc": 0.8847, + "test_loss": 0.6881836595535278, + "test_acc": 0.8116, + "lyapunov": null, + "grad_norm": 0.47585625371919826, + "grad_max_sv": 0.28932417593896387, + "grad_min_sv": 3.663087517757902e-08, + "grad_condition": 7933220.2527872, + "lr": 0.0007128896457825364, + "time_sec": 32.39529776573181 + }, + { + "epoch": 37, + "train_loss": 0.3108924944496155, + "train_acc": 0.88942, + "test_loss": 0.7008573976516723, + "test_acc": 0.8098, + "lyapunov": null, + "grad_norm": 0.46276747011208014, + "grad_max_sv": 0.2795715734362602, + "grad_min_sv": 3.448033547570617e-08, + "grad_condition": 8262563.079640454, + "lr": 0.0006985739453173903, + "time_sec": 32.38434648513794 + }, + { + "epoch": 38, + "train_loss": 0.31133034090042117, + "train_acc": 0.88992, + "test_loss": 0.6698009629249573, + "test_acc": 0.81, + "lyapunov": null, + "grad_norm": 0.4586602799362298, + "grad_max_sv": 0.2844005227088928, + "grad_min_sv": 3.324500559287458e-08, + "grad_condition": 8714467.747357922, + "lr": 0.0006840622763423391, + "time_sec": 32.396021366119385 + }, + { + "epoch": 39, + "train_loss": 0.29518098635673523, + "train_acc": 0.89552, + "test_loss": 0.7677701180458069, + "test_acc": 0.7991, + "lyapunov": null, + "grad_norm": 0.43830085967668675, + "grad_max_sv": 0.2725641973316669, + "grad_min_sv": 3.3406064270380397e-08, + "grad_condition": 8255466.038533419, + "lr": 0.0006693689601226458, + "time_sec": 32.40195083618164 + }, + { + "epoch": 40, + "train_loss": 0.2831247230243683, + "train_acc": 0.89996, + "test_loss": 0.6842746494293213, + "test_acc": 0.8148, + "lyapunov": null, + "grad_norm": 0.4331819538283316, + "grad_max_sv": 0.26449211575090886, + "grad_min_sv": 3.399684476157461e-08, + "grad_condition": 7879060.46068686, + "lr": 0.0006545084971874737, + "time_sec": 32.418256521224976 + }, + { + "epoch": 41, + "train_loss": 0.27670828733444214, + "train_acc": 0.90256, + "test_loss": 0.701638517665863, + "test_acc": 0.8105, + "lyapunov": null, + "grad_norm": 0.42402034759846713, + "grad_max_sv": 0.26597036607563496, + "grad_min_sv": 3.2260157212249396e-08, + "grad_condition": 8290157.649110466, + "lr": 0.0006394955530196147, + "time_sec": 32.40391206741333 + }, + { + "epoch": 42, + "train_loss": 0.26722780378341676, + "train_acc": 0.90478, + "test_loss": 0.676421770954132, + "test_acc": 0.8152, + "lyapunov": null, + "grad_norm": 0.41593559749987674, + "grad_max_sv": 0.26356035731732846, + "grad_min_sv": 3.2800773563934625e-08, + "grad_condition": 8080555.103613043, + "lr": 0.0006243449435824273, + "time_sec": 32.413851737976074 + }, + { + "epoch": 43, + "train_loss": 0.2611290577888489, + "train_acc": 0.9069, + "test_loss": 0.7091101724147797, + "test_acc": 0.8165, + "lyapunov": null, + "grad_norm": 0.40890139043798995, + "grad_max_sv": 0.2530216708779335, + "grad_min_sv": 3.0997858102566053e-08, + "grad_condition": 8224218.543131987, + "lr": 0.0006090716206982714, + "time_sec": 32.60969662666321 + }, + { + "epoch": 44, + "train_loss": 0.2530948238658905, + "train_acc": 0.90982, + "test_loss": 0.6961516171455383, + "test_acc": 0.8214, + "lyapunov": null, + "grad_norm": 0.39919304872434885, + "grad_max_sv": 0.24201009832322598, + "grad_min_sv": 3.264100985056473e-08, + "grad_condition": 7496864.741894746, + "lr": 0.0005936906572928625, + "time_sec": 32.40188717842102 + }, + { + "epoch": 45, + "train_loss": 0.23889887328147888, + "train_acc": 0.91386, + "test_loss": 0.7265622617721558, + "test_acc": 0.8196, + "lyapunov": null, + "grad_norm": 0.39216552760863915, + "grad_max_sv": 0.25172842368483545, + "grad_min_sv": 3.196390450099784e-08, + "grad_condition": 7939664.340514863, + "lr": 0.0005782172325201156, + "time_sec": 32.40084266662598 + }, + { + "epoch": 46, + "train_loss": 0.23805784145355224, + "train_acc": 0.91674, + "test_loss": 0.6975640031337738, + "test_acc": 0.8226, + "lyapunov": null, + "grad_norm": 0.3825430754006707, + "grad_max_sv": 0.23831223957240583, + "grad_min_sv": 2.971923072081495e-08, + "grad_condition": 8085204.090791678, + "lr": 0.0005626666167821523, + "time_sec": 32.42257380485535 + }, + { + "epoch": 47, + "train_loss": 0.23282361968994142, + "train_acc": 0.91824, + "test_loss": 0.6992193672657013, + "test_acc": 0.8311, + "lyapunov": null, + "grad_norm": 0.3814486121413188, + "grad_max_sv": 0.23424655832350255, + "grad_min_sv": 3.104032040290861e-08, + "grad_condition": 7643726.892298067, + "lr": 0.0005470541566592572, + "time_sec": 32.40861511230469 + }, + { + "epoch": 48, + "train_loss": 0.22799833922863005, + "train_acc": 0.91886, + "test_loss": 0.6951349193096161, + "test_acc": 0.8282, + "lyapunov": null, + "grad_norm": 0.38166215011498245, + "grad_max_sv": 0.24571430422365664, + "grad_min_sv": 3.0606541878697156e-08, + "grad_condition": 8099711.568480073, + "lr": 0.0005313952597646569, + "time_sec": 32.382601499557495 + }, + { + "epoch": 49, + "train_loss": 0.21888560410499572, + "train_acc": 0.92208, + "test_loss": 0.6775056694984436, + "test_acc": 0.8377, + "lyapunov": null, + "grad_norm": 0.3681781600012364, + "grad_max_sv": 0.22858488224446774, + "grad_min_sv": 3.0608208811955254e-08, + "grad_condition": 7499521.525014189, + "lr": 0.0005157053795390643, + "time_sec": 32.38293170928955 + }, + { + "epoch": 50, + "train_loss": 0.2106206985092163, + "train_acc": 0.9252, + "test_loss": 0.6563802011966705, + "test_acc": 0.8396, + "lyapunov": null, + "grad_norm": 0.36053809946906845, + "grad_max_sv": 0.2215539276599884, + "grad_min_sv": 2.9670953960447833e-08, + "grad_condition": 7567975.97315415, + "lr": 0.0005000000000000002, + "time_sec": 32.3891761302948 + }, + { + "epoch": 51, + "train_loss": 0.19901366895198822, + "train_acc": 0.92832, + "test_loss": 0.6814763808727264, + "test_acc": 0.837, + "lyapunov": null, + "grad_norm": 0.3509310663538234, + "grad_max_sv": 0.21552756875753404, + "grad_min_sv": 3.0066001732720335e-08, + "grad_condition": 7264544.488552595, + "lr": 0.00048429462046093607, + "time_sec": 32.41236758232117 + }, + { + "epoch": 52, + "train_loss": 0.19969978581905365, + "train_acc": 0.9285, + "test_loss": 0.6935202028274536, + "test_acc": 0.8339, + "lyapunov": null, + "grad_norm": 0.3520257382758021, + "grad_max_sv": 0.22391790114343166, + "grad_min_sv": 3.0129751982244104e-08, + "grad_condition": 7509087.830538243, + "lr": 0.0004686047402353435, + "time_sec": 32.39413237571716 + }, + { + "epoch": 53, + "train_loss": 0.19100741683721542, + "train_acc": 0.93138, + "test_loss": 0.686068691778183, + "test_acc": 0.8361, + "lyapunov": null, + "grad_norm": 0.3426294963785598, + "grad_max_sv": 0.22632624246180058, + "grad_min_sv": 2.9659243594437613e-08, + "grad_condition": 7652635.339128266, + "lr": 0.000452945843340743, + "time_sec": 32.40613842010498 + }, + { + "epoch": 54, + "train_loss": 0.18032077651500703, + "train_acc": 0.9362, + "test_loss": 0.7067575240373611, + "test_acc": 0.8336, + "lyapunov": null, + "grad_norm": 0.3322012382733825, + "grad_max_sv": 0.20586859565228224, + "grad_min_sv": 2.850985989510946e-08, + "grad_condition": 7314687.938871255, + "lr": 0.00043733338321784806, + "time_sec": 32.4026734828949 + }, + { + "epoch": 55, + "train_loss": 0.17773653375148774, + "train_acc": 0.93586, + "test_loss": 0.7423279015541077, + "test_acc": 0.8264, + "lyapunov": null, + "grad_norm": 0.3304441924446054, + "grad_max_sv": 0.21223607212305068, + "grad_min_sv": 2.8433270138350508e-08, + "grad_condition": 7539548.749518724, + "lr": 0.0004217827674798847, + "time_sec": 32.404977560043335 + }, + { + "epoch": 56, + "train_loss": 0.17266820957183837, + "train_acc": 0.93834, + "test_loss": 0.7072871742248535, + "test_acc": 0.8362, + "lyapunov": null, + "grad_norm": 0.3213443005744008, + "grad_max_sv": 0.20142054706811904, + "grad_min_sv": 2.726542889242012e-08, + "grad_condition": 7440941.08660387, + "lr": 0.00040630934270713783, + "time_sec": 32.39922308921814 + }, + { + "epoch": 57, + "train_loss": 0.16320502066612244, + "train_acc": 0.9411, + "test_loss": 0.7605734568834305, + "test_acc": 0.8318, + "lyapunov": null, + "grad_norm": 0.31657510227372176, + "grad_max_sv": 0.20284682027995588, + "grad_min_sv": 2.7356661469468692e-08, + "grad_condition": 7474082.923928386, + "lr": 0.000390928379301729, + "time_sec": 32.39910292625427 + }, + { + "epoch": 58, + "train_loss": 0.15670019901275634, + "train_acc": 0.94476, + "test_loss": 0.784366103553772, + "test_acc": 0.8311, + "lyapunov": null, + "grad_norm": 0.30805235096734923, + "grad_max_sv": 0.20260103438049554, + "grad_min_sv": 2.8483807401613605e-08, + "grad_condition": 7164125.0338090565, + "lr": 0.0003756550564175727, + "time_sec": 32.38076663017273 + }, + { + "epoch": 59, + "train_loss": 0.1490273987340927, + "train_acc": 0.94576, + "test_loss": 0.7455846133232117, + "test_acc": 0.8376, + "lyapunov": null, + "grad_norm": 0.303406267580447, + "grad_max_sv": 0.19556450732052327, + "grad_min_sv": 2.8112297023596967e-08, + "grad_condition": 7040746.144049543, + "lr": 0.00036050444698038553, + "time_sec": 32.39811587333679 + }, + { + "epoch": 60, + "train_loss": 0.14525161782741547, + "train_acc": 0.94758, + "test_loss": 0.7790617815971375, + "test_acc": 0.8344, + "lyapunov": null, + "grad_norm": 0.30155039989577326, + "grad_max_sv": 0.19981648530811072, + "grad_min_sv": 2.756223151934023e-08, + "grad_condition": 7325326.926472412, + "lr": 0.00034549150281252655, + "time_sec": 32.389100313186646 + }, + { + "epoch": 61, + "train_loss": 0.1412713815355301, + "train_acc": 0.94936, + "test_loss": 0.7642439495563507, + "test_acc": 0.836, + "lyapunov": null, + "grad_norm": 0.29749874721325253, + "grad_max_sv": 0.19452713318169118, + "grad_min_sv": 2.9010603075363407e-08, + "grad_condition": 6769308.704484415, + "lr": 0.0003306310398773544, + "time_sec": 32.38328981399536 + }, + { + "epoch": 62, + "train_loss": 0.1323081604719162, + "train_acc": 0.95234, + "test_loss": 0.7581991817474365, + "test_acc": 0.8398, + "lyapunov": null, + "grad_norm": 0.29116698502726973, + "grad_max_sv": 0.18757329024374486, + "grad_min_sv": 2.7799571622466603e-08, + "grad_condition": 6802391.979822846, + "lr": 0.00031593772365766127, + "time_sec": 32.38175868988037 + }, + { + "epoch": 63, + "train_loss": 0.12890920341968537, + "train_acc": 0.95402, + "test_loss": 0.7480168062210083, + "test_acc": 0.8421, + "lyapunov": null, + "grad_norm": 0.286611612578029, + "grad_max_sv": 0.1843133084475994, + "grad_min_sv": 2.6867626612414597e-08, + "grad_condition": 6929516.973504146, + "lr": 0.0003014260546826097, + "time_sec": 32.42565321922302 + }, + { + "epoch": 64, + "train_loss": 0.1265330140542984, + "train_acc": 0.9554, + "test_loss": 0.8281557668209076, + "test_acc": 0.8301, + "lyapunov": null, + "grad_norm": 0.2827852267700905, + "grad_max_sv": 0.18494715746492146, + "grad_min_sv": 2.7603675123444305e-08, + "grad_condition": 6836444.701068824, + "lr": 0.0002871103542174637, + "time_sec": 32.41487503051758 + }, + { + "epoch": 65, + "train_loss": 0.1179364563369751, + "train_acc": 0.95766, + "test_loss": 0.8201508460521698, + "test_acc": 0.8301, + "lyapunov": null, + "grad_norm": 0.27559434018913526, + "grad_max_sv": 0.1801072470843792, + "grad_min_sv": 2.659138749194767e-08, + "grad_condition": 6847688.983849314, + "lr": 0.0002730047501302267, + "time_sec": 32.39773344993591 + }, + { + "epoch": 66, + "train_loss": 0.11676965503931046, + "train_acc": 0.9583, + "test_loss": 0.8626040154457092, + "test_acc": 0.8299, + "lyapunov": null, + "grad_norm": 0.2739785879338369, + "grad_max_sv": 0.181886912509799, + "grad_min_sv": 2.726705781164185e-08, + "grad_condition": 6765344.039900659, + "lr": 0.00025912316294914234, + "time_sec": 32.3981568813324 + }, + { + "epoch": 67, + "train_loss": 0.1134087336063385, + "train_acc": 0.95968, + "test_loss": 0.8600147367477416, + "test_acc": 0.8307, + "lyapunov": null, + "grad_norm": 0.27359780558028896, + "grad_max_sv": 0.17809443082660437, + "grad_min_sv": 2.617720586961525e-08, + "grad_condition": 6850097.709154141, + "lr": 0.0002454792921248144, + "time_sec": 32.39709424972534 + }, + { + "epoch": 68, + "train_loss": 0.10615333132266998, + "train_acc": 0.96164, + "test_loss": 0.7972221804141998, + "test_acc": 0.8376, + "lyapunov": null, + "grad_norm": 0.2659183144921437, + "grad_max_sv": 0.18308131918311119, + "grad_min_sv": 2.689645892672843e-08, + "grad_condition": 6797772.602815667, + "lr": 0.00023208660251050164, + "time_sec": 32.41845703125 + }, + { + "epoch": 69, + "train_loss": 0.10183365075588226, + "train_acc": 0.9635, + "test_loss": 0.826421448802948, + "test_acc": 0.8419, + "lyapunov": null, + "grad_norm": 0.25781252098700996, + "grad_max_sv": 0.16897555273026227, + "grad_min_sv": 2.6931133589869206e-08, + "grad_condition": 6306456.524677806, + "lr": 0.00021895831107393473, + "time_sec": 32.397175788879395 + }, + { + "epoch": 70, + "train_loss": 0.10107698081731796, + "train_acc": 0.96376, + "test_loss": 0.8561173896312714, + "test_acc": 0.831, + "lyapunov": null, + "grad_norm": 0.25760306881898437, + "grad_max_sv": 0.17646125555038453, + "grad_min_sv": 2.669760297280277e-08, + "grad_condition": 6679362.317952393, + "lr": 0.00020610737385376356, + "time_sec": 32.403748512268066 + }, + { + "epoch": 71, + "train_loss": 0.09157823500394821, + "train_acc": 0.9672, + "test_loss": 0.819078180027008, + "test_acc": 0.8435, + "lyapunov": null, + "grad_norm": 0.24819829552233322, + "grad_max_sv": 0.1644124612212181, + "grad_min_sv": 2.60399903861952e-08, + "grad_condition": 6357922.646001594, + "lr": 0.00019354647317351177, + "time_sec": 32.40361571311951 + }, + { + "epoch": 72, + "train_loss": 0.09161295493125915, + "train_acc": 0.9674, + "test_loss": 0.8579238404273987, + "test_acc": 0.8382, + "lyapunov": null, + "grad_norm": 0.2471838058669454, + "grad_max_sv": 0.18323104958981276, + "grad_min_sv": 2.6274890752020497e-08, + "grad_condition": 7043842.298456557, + "lr": 0.0001812880051256552, + "time_sec": 32.40220522880554 + }, + { + "epoch": 73, + "train_loss": 0.08914089821338654, + "train_acc": 0.9689, + "test_loss": 0.822793147277832, + "test_acc": 0.8428, + "lyapunov": null, + "grad_norm": 0.24800643716145856, + "grad_max_sv": 0.17686894070357084, + "grad_min_sv": 2.5135920411756273e-08, + "grad_condition": 7047438.025677231, + "lr": 0.00016934406733817422, + "time_sec": 32.38602375984192 + }, + { + "epoch": 74, + "train_loss": 0.08674161068916321, + "train_acc": 0.96972, + "test_loss": 0.9136243630409241, + "test_acc": 0.832, + "lyapunov": null, + "grad_norm": 0.24475644922641637, + "grad_max_sv": 0.1730644192546606, + "grad_min_sv": 2.701796373294485e-08, + "grad_condition": 6442891.2485314775, + "lr": 0.0001577264470356557, + "time_sec": 32.388394594192505 + }, + { + "epoch": 75, + "train_loss": 0.08695965735673905, + "train_acc": 0.96928, + "test_loss": 0.8845508131980896, + "test_acc": 0.8384, + "lyapunov": null, + "grad_norm": 0.2459968799202821, + "grad_max_sv": 0.17426501363515853, + "grad_min_sv": 2.6569961386613273e-08, + "grad_condition": 6640201.158479671, + "lr": 0.00014644660940672634, + "time_sec": 32.41233015060425 + }, + { + "epoch": 76, + "train_loss": 0.08056579726457595, + "train_acc": 0.97162, + "test_loss": 0.8616433102607727, + "test_acc": 0.843, + "lyapunov": null, + "grad_norm": 0.2370989720124241, + "grad_max_sv": 0.17729146480560304, + "grad_min_sv": 2.568868753272113e-08, + "grad_condition": 6934864.636315972, + "lr": 0.0001355156862892944, + "time_sec": 32.40184926986694 + }, + { + "epoch": 77, + "train_loss": 0.0778916252565384, + "train_acc": 0.97266, + "test_loss": 0.8366258358001709, + "test_acc": 0.846, + "lyapunov": null, + "grad_norm": 0.2285631358810043, + "grad_max_sv": 0.15610157009214162, + "grad_min_sv": 2.4703725332031468e-08, + "grad_condition": 6441768.40822393, + "lr": 0.00012494446518477025, + "time_sec": 32.39042067527771 + }, + { + "epoch": 78, + "train_loss": 0.07181410483896733, + "train_acc": 0.97442, + "test_loss": 0.8555541298389435, + "test_acc": 0.8426, + "lyapunov": null, + "grad_norm": 0.21751467049933892, + "grad_max_sv": 0.15433428399264812, + "grad_min_sv": 2.665557081726888e-08, + "grad_condition": 5918219.605492928, + "lr": 0.00011474337861210548, + "time_sec": 32.394978523254395 + }, + { + "epoch": 79, + "train_loss": 0.07194108392477036, + "train_acc": 0.9751, + "test_loss": 0.8495045845985413, + "test_acc": 0.8448, + "lyapunov": null, + "grad_norm": 0.22114745807083974, + "grad_max_sv": 0.1569668130017817, + "grad_min_sv": 2.5639288958601015e-08, + "grad_condition": 6206249.934502038, + "lr": 0.00010492249381215483, + "time_sec": 32.40589165687561 + }, + { + "epoch": 80, + "train_loss": 0.07222781093478203, + "train_acc": 0.97412, + "test_loss": 0.8713514517307281, + "test_acc": 0.8394, + "lyapunov": null, + "grad_norm": 0.22263796587188234, + "grad_max_sv": 0.14711420265957714, + "grad_min_sv": 2.5633022726623266e-08, + "grad_condition": 5761666.097039051, + "lr": 9.549150281252637e-05, + "time_sec": 32.37701368331909 + }, + { + "epoch": 81, + "train_loss": 0.06728733582258224, + "train_acc": 0.97644, + "test_loss": 0.8841948908805847, + "test_acc": 0.8471, + "lyapunov": null, + "grad_norm": 0.2167084382178911, + "grad_max_sv": 0.150007457844913, + "grad_min_sv": 2.4493604877662278e-08, + "grad_condition": 6166534.410663934, + "lr": 8.645971286271918e-05, + "time_sec": 32.398573875427246 + }, + { + "epoch": 82, + "train_loss": 0.06532315739750862, + "train_acc": 0.97664, + "test_loss": 0.8479381636619567, + "test_acc": 0.8476, + "lyapunov": null, + "grad_norm": 0.21360344563146125, + "grad_max_sv": 0.14955835351720453, + "grad_min_sv": 2.5209754284105657e-08, + "grad_condition": 5995150.4945804905, + "lr": 7.78360372489926e-05, + "time_sec": 32.39670705795288 + }, + { + "epoch": 83, + "train_loss": 0.06434115768909454, + "train_acc": 0.97796, + "test_loss": 0.8688706632614136, + "test_acc": 0.8462, + "lyapunov": null, + "grad_norm": 0.208142142739157, + "grad_max_sv": 0.14977061534300445, + "grad_min_sv": 2.4894345518333694e-08, + "grad_condition": 6089831.719725271, + "lr": 6.962898649802815e-05, + "time_sec": 32.399760007858276 + }, + { + "epoch": 84, + "train_loss": 0.06394571399211883, + "train_acc": 0.9776, + "test_loss": 0.8629561246871948, + "test_acc": 0.8473, + "lyapunov": null, + "grad_norm": 0.2090274768795119, + "grad_max_sv": 0.1535501467064023, + "grad_min_sv": 2.6076664383367643e-08, + "grad_condition": 5914212.49570628, + "lr": 6.184665997806824e-05, + "time_sec": 32.38430905342102 + }, + { + "epoch": 85, + "train_loss": 0.062020836523771286, + "train_acc": 0.97872, + "test_loss": 0.875181820678711, + "test_acc": 0.8453, + "lyapunov": null, + "grad_norm": 0.2063308108071089, + "grad_max_sv": 0.14753851415589453, + "grad_min_sv": 2.432188375145472e-08, + "grad_condition": 6144261.18306755, + "lr": 5.449673790581613e-05, + "time_sec": 32.41748404502869 + }, + { + "epoch": 86, + "train_loss": 0.06044566638708115, + "train_acc": 0.9789, + "test_loss": 0.872238347530365, + "test_acc": 0.8476, + "lyapunov": null, + "grad_norm": 0.20133211072179052, + "grad_max_sv": 0.148629211448133, + "grad_min_sv": 2.4942497534041762e-08, + "grad_condition": 6060679.3216307415, + "lr": 4.758647376699034e-05, + "time_sec": 32.391072273254395 + }, + { + "epoch": 87, + "train_loss": 0.061503240056037904, + "train_acc": 0.97832, + "test_loss": 0.8733239276885987, + "test_acc": 0.8431, + "lyapunov": null, + "grad_norm": 0.2056722075536268, + "grad_max_sv": 0.14386752797290683, + "grad_min_sv": 2.4274280185920816e-08, + "grad_condition": 5915342.2569472315, + "lr": 4.112268715800956e-05, + "time_sec": 32.393316984176636 + }, + { + "epoch": 88, + "train_loss": 0.057686230409145355, + "train_acc": 0.98028, + "test_loss": 0.9238866704940796, + "test_acc": 0.8441, + "lyapunov": null, + "grad_norm": 0.19849445098013146, + "grad_max_sv": 0.14159611044451595, + "grad_min_sv": 2.40493778669304e-08, + "grad_condition": 5894624.093493214, + "lr": 3.511175705587434e-05, + "time_sec": 32.38528490066528 + }, + { + "epoch": 89, + "train_loss": 0.05870611476659775, + "train_acc": 0.9798, + "test_loss": 0.8742481526374817, + "test_acc": 0.8481, + "lyapunov": null, + "grad_norm": 0.20012200731407057, + "grad_max_sv": 0.15360670480877162, + "grad_min_sv": 2.5219260857411995e-08, + "grad_condition": 6191506.157967448, + "lr": 2.9559615522887284e-05, + "time_sec": 32.393001079559326 + }, + { + "epoch": 90, + "train_loss": 0.05783582457482815, + "train_acc": 0.9801, + "test_loss": 0.8813467388153076, + "test_acc": 0.8475, + "lyapunov": null, + "grad_norm": 0.19996222144489287, + "grad_max_sv": 0.1403856192715466, + "grad_min_sv": 2.448204212690541e-08, + "grad_condition": 5742298.053374326, + "lr": 2.447174185242324e-05, + "time_sec": 32.38493609428406 + }, + { + "epoch": 91, + "train_loss": 0.05505133232176304, + "train_acc": 0.9811, + "test_loss": 0.8983916495323181, + "test_acc": 0.8462, + "lyapunov": null, + "grad_norm": 0.1922888220223182, + "grad_max_sv": 0.13430234417319298, + "grad_min_sv": 2.4953015476114616e-08, + "grad_condition": 5451203.641164561, + "lr": 1.9853157161528526e-05, + "time_sec": 32.399288177490234 + }, + { + "epoch": 92, + "train_loss": 0.05489971268892288, + "train_acc": 0.98124, + "test_loss": 0.8997103338241577, + "test_acc": 0.843, + "lyapunov": null, + "grad_norm": 0.1914882132186981, + "grad_max_sv": 0.13863548981025814, + "grad_min_sv": 2.579038138605938e-08, + "grad_condition": 5398596.905280545, + "lr": 1.570841943568452e-05, + "time_sec": 32.40613651275635 + }, + { + "epoch": 93, + "train_loss": 0.05393671277284622, + "train_acc": 0.9816, + "test_loss": 0.8570820412635803, + "test_acc": 0.847, + "lyapunov": null, + "grad_norm": 0.19247907609747256, + "grad_max_sv": 0.14507245384156703, + "grad_min_sv": 2.4785522878545406e-08, + "grad_condition": 5879853.769356969, + "lr": 1.204161903062634e-05, + "time_sec": 32.38154458999634 + }, + { + "epoch": 94, + "train_loss": 0.05565428542852402, + "train_acc": 0.98092, + "test_loss": 0.8699159992218017, + "test_acc": 0.8494, + "lyapunov": null, + "grad_norm": 0.1950428660443827, + "grad_max_sv": 0.15786617370322348, + "grad_min_sv": 2.5128920544403855e-08, + "grad_condition": 6342900.039114647, + "lr": 8.85637463565564e-06, + "time_sec": 32.408872842788696 + }, + { + "epoch": 95, + "train_loss": 0.0554716275537014, + "train_acc": 0.98074, + "test_loss": 0.8724354814529419, + "test_acc": 0.848, + "lyapunov": null, + "grad_norm": 0.1953551453056335, + "grad_max_sv": 0.14595830552279948, + "grad_min_sv": 2.4523609010174142e-08, + "grad_condition": 6097998.471070435, + "lr": 6.155829702431171e-06, + "time_sec": 32.37954640388489 + }, + { + "epoch": 96, + "train_loss": 0.055670329051017764, + "train_acc": 0.98156, + "test_loss": 0.8982214247703553, + "test_acc": 0.8452, + "lyapunov": null, + "grad_norm": 0.19496196662820392, + "grad_max_sv": 0.1501585453748703, + "grad_min_sv": 2.5934764646962095e-08, + "grad_condition": 5869735.378663734, + "lr": 3.942649342761118e-06, + "time_sec": 32.4021053314209 + }, + { + "epoch": 97, + "train_loss": 0.05344248455762863, + "train_acc": 0.9813, + "test_loss": 0.9114454601287841, + "test_acc": 0.8468, + "lyapunov": null, + "grad_norm": 0.19018664442063118, + "grad_max_sv": 0.14032225906848908, + "grad_min_sv": 2.502056415387699e-08, + "grad_condition": 5745975.090099884, + "lr": 2.2190176984600023e-06, + "time_sec": 32.38188123703003 + }, + { + "epoch": 98, + "train_loss": 0.053135186285972594, + "train_acc": 0.9819, + "test_loss": 0.869631242275238, + "test_acc": 0.8508, + "lyapunov": null, + "grad_norm": 0.18824134211058935, + "grad_max_sv": 0.13075507152825594, + "grad_min_sv": 2.4252965857840536e-08, + "grad_condition": 5397614.905736231, + "lr": 9.866357858642206e-07, + "time_sec": 32.386441230773926 + }, + { + "epoch": 99, + "train_loss": 0.05097491117954254, + "train_acc": 0.983, + "test_loss": 0.8943203839302063, + "test_acc": 0.8483, + "lyapunov": null, + "grad_norm": 0.18445756568932634, + "grad_max_sv": 0.13804081929847598, + "grad_min_sv": 2.4356519201518267e-08, + "grad_condition": 5702871.134726013, + "lr": 2.467198171342e-07, + "time_sec": 32.405375480651855 + }, + { + "epoch": 100, + "train_loss": 0.05390245022058487, + "train_acc": 0.9809, + "test_loss": 0.871891166973114, + "test_acc": 0.8498, + "lyapunov": null, + "grad_norm": 0.1935152752615153, + "grad_max_sv": 0.14720266554504632, + "grad_min_sv": 2.436729609200938e-08, + "grad_condition": 6104513.732861901, + "lr": 0.0, + "time_sec": 32.40170097351074 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 2.4167917232513427, + "train_acc": 0.21668, + "test_loss": 2.5600556365966796, + "test_acc": 0.1426, + "lyapunov": null, + "grad_norm": 8.183371300480916, + "grad_max_sv": 7.386911773681641, + "grad_min_sv": 2.415331181282454e-07, + "grad_condition": 30373000.643941343, + "lr": 0.0009997532801828658, + "time_sec": 49.45663261413574 + }, + { + "epoch": 2, + "train_loss": 1.9079357604217528, + "train_acc": 0.31534, + "test_loss": 2.481009757232666, + "test_acc": 0.1736, + "lyapunov": null, + "grad_norm": 6.225007320887903, + "grad_max_sv": 6.023341983556747, + "grad_min_sv": 2.0562342122332212e-07, + "grad_condition": 29136429.527644336, + "lr": 0.0009990133642141358, + "time_sec": 49.483285427093506 + }, + { + "epoch": 3, + "train_loss": 1.7475298168945312, + "train_acc": 0.36588, + "test_loss": 2.8285199867248534, + "test_acc": 0.131, + "lyapunov": null, + "grad_norm": 5.1420950067433004, + "grad_max_sv": 4.660892617702484, + "grad_min_sv": 1.8032060928874215e-07, + "grad_condition": 26358047.987367053, + "lr": 0.00099778098230154, + "time_sec": 49.57265663146973 + }, + { + "epoch": 4, + "train_loss": 1.648739521408081, + "train_acc": 0.40166, + "test_loss": 2.3356450172424315, + "test_acc": 0.1751, + "lyapunov": null, + "grad_norm": 4.371713821921025, + "grad_max_sv": 3.9185040295124054, + "grad_min_sv": 1.6463919898512814e-07, + "grad_condition": 23923294.770848013, + "lr": 0.000996057350657239, + "time_sec": 49.45625138282776 + }, + { + "epoch": 5, + "train_loss": 1.5810089331436157, + "train_acc": 0.4251, + "test_loss": 2.673109909439087, + "test_acc": 0.1544, + "lyapunov": null, + "grad_norm": 3.4555186506953595, + "grad_max_sv": 2.900471958518028, + "grad_min_sv": 1.4436529607309013e-07, + "grad_condition": 20173199.710391533, + "lr": 0.0009938441702975688, + "time_sec": 49.46467709541321 + }, + { + "epoch": 6, + "train_loss": 1.5207538050079346, + "train_acc": 0.44858, + "test_loss": 2.5345509658813477, + "test_acc": 0.1699, + "lyapunov": null, + "grad_norm": 2.64949967993879, + "grad_max_sv": 2.2037453174591066, + "grad_min_sv": 1.0903019624919352e-07, + "grad_condition": 20443245.381738927, + "lr": 0.0009911436253643444, + "time_sec": 49.46764326095581 + }, + { + "epoch": 7, + "train_loss": 1.4697360105133057, + "train_acc": 0.46474, + "test_loss": 2.8721789810180662, + "test_acc": 0.1272, + "lyapunov": null, + "grad_norm": 2.07791741270765, + "grad_max_sv": 1.6007355004549026, + "grad_min_sv": 8.760053766820875e-08, + "grad_condition": 18373378.661422264, + "lr": 0.0009879583809693736, + "time_sec": 49.47743082046509 + }, + { + "epoch": 8, + "train_loss": 1.4266535543823242, + "train_acc": 0.48382, + "test_loss": 3.240042792892456, + "test_acc": 0.1388, + "lyapunov": null, + "grad_norm": 1.6671990756280735, + "grad_max_sv": 1.2928156778216362, + "grad_min_sv": 7.22438866951336e-08, + "grad_condition": 18264606.350417227, + "lr": 0.0009842915805643154, + "time_sec": 49.462923526763916 + }, + { + "epoch": 9, + "train_loss": 1.394312504272461, + "train_acc": 0.49708, + "test_loss": 2.92084864654541, + "test_acc": 0.1515, + "lyapunov": null, + "grad_norm": 1.4501900520177538, + "grad_max_sv": 1.0461901366710662, + "grad_min_sv": 6.580800739897086e-08, + "grad_condition": 16086880.216684576, + "lr": 0.0009801468428384714, + "time_sec": 49.47783327102661 + }, + { + "epoch": 10, + "train_loss": 1.3646438373184204, + "train_acc": 0.50782, + "test_loss": 2.4641769153594972, + "test_acc": 0.2432, + "lyapunov": null, + "grad_norm": 1.291271889799819, + "grad_max_sv": 0.9352933883666992, + "grad_min_sv": 6.025941292620019e-08, + "grad_condition": 15737334.845315147, + "lr": 0.0009755282581475767, + "time_sec": 49.47376465797424 + }, + { + "epoch": 11, + "train_loss": 1.3376501561355592, + "train_acc": 0.51558, + "test_loss": 2.9219178497314453, + "test_acc": 0.2438, + "lyapunov": null, + "grad_norm": 1.1555098680383777, + "grad_max_sv": 0.7429820895195007, + "grad_min_sv": 5.2901568192709195e-08, + "grad_condition": 14266011.744750757, + "lr": 0.0009704403844771127, + "time_sec": 49.47013974189758 + }, + { + "epoch": 12, + "train_loss": 1.3112868671417237, + "train_acc": 0.5284, + "test_loss": 2.74031083946228, + "test_acc": 0.2031, + "lyapunov": null, + "grad_norm": 1.0738955371821308, + "grad_max_sv": 0.748549421876669, + "grad_min_sv": 4.978303538294426e-08, + "grad_condition": 15210211.076616298, + "lr": 0.0009648882429441257, + "time_sec": 49.46808075904846 + }, + { + "epoch": 13, + "train_loss": 1.287481568031311, + "train_acc": 0.53728, + "test_loss": 3.040859108734131, + "test_acc": 0.1924, + "lyapunov": null, + "grad_norm": 0.9771624206683323, + "grad_max_sv": 0.64529999345541, + "grad_min_sv": 4.393245678357971e-08, + "grad_condition": 14761475.748675447, + "lr": 0.0009588773128419905, + "time_sec": 49.47308921813965 + }, + { + "epoch": 14, + "train_loss": 1.2648405401992797, + "train_acc": 0.54502, + "test_loss": 2.792311123275757, + "test_acc": 0.1915, + "lyapunov": null, + "grad_norm": 0.9467244901324925, + "grad_max_sv": 0.6184789575636387, + "grad_min_sv": 4.4816473465658643e-08, + "grad_condition": 14165375.345471447, + "lr": 0.0009524135262330098, + "time_sec": 49.483009815216064 + }, + { + "epoch": 15, + "train_loss": 1.241471286087036, + "train_acc": 0.55048, + "test_loss": 2.3441864311218263, + "test_acc": 0.2456, + "lyapunov": null, + "grad_norm": 0.8759338877958681, + "grad_max_sv": 0.5726857863366603, + "grad_min_sv": 3.894658555658736e-08, + "grad_condition": 14972228.263231587, + "lr": 0.0009455032620941839, + "time_sec": 49.48427653312683 + }, + { + "epoch": 16, + "train_loss": 1.2250818849945069, + "train_acc": 0.55916, + "test_loss": 2.4376744468688964, + "test_acc": 0.2811, + "lyapunov": null, + "grad_norm": 0.8280125995789305, + "grad_max_sv": 0.5269983820617199, + "grad_min_sv": 3.957679450827811e-08, + "grad_condition": 13458638.5630938, + "lr": 0.0009381533400219318, + "time_sec": 49.491514921188354 + }, + { + "epoch": 17, + "train_loss": 1.2011407931518554, + "train_acc": 0.5681, + "test_loss": 3.077988208389282, + "test_acc": 0.2372, + "lyapunov": null, + "grad_norm": 0.7903623783049802, + "grad_max_sv": 0.5003585621714592, + "grad_min_sv": 3.7936934749183135e-08, + "grad_condition": 13344237.683557762, + "lr": 0.0009303710135019719, + "time_sec": 49.4895544052124 + }, + { + "epoch": 18, + "train_loss": 1.1899376231193541, + "train_acc": 0.57472, + "test_loss": 2.3918450389862063, + "test_acc": 0.2518, + "lyapunov": null, + "grad_norm": 0.7718039520215193, + "grad_max_sv": 0.47414265275001527, + "grad_min_sv": 3.554989529419572e-08, + "grad_condition": 13438942.364842063, + "lr": 0.0009221639627510076, + "time_sec": 49.456658124923706 + }, + { + "epoch": 19, + "train_loss": 1.168603648300171, + "train_acc": 0.57972, + "test_loss": 2.283582151031494, + "test_acc": 0.2237, + "lyapunov": null, + "grad_norm": 0.7146309518059523, + "grad_max_sv": 0.4340610824525356, + "grad_min_sv": 3.228430212054434e-08, + "grad_condition": 13543039.003440287, + "lr": 0.000913540287137281, + "time_sec": 49.45988321304321 + }, + { + "epoch": 20, + "train_loss": 1.151336190109253, + "train_acc": 0.58574, + "test_loss": 2.2708426193237305, + "test_acc": 0.2755, + "lyapunov": null, + "grad_norm": 0.6983120785552407, + "grad_max_sv": 0.4454373300075531, + "grad_min_sv": 3.350230577403579e-08, + "grad_condition": 13641891.236675229, + "lr": 0.0009045084971874739, + "time_sec": 49.4855215549469 + }, + { + "epoch": 21, + "train_loss": 1.1312933298873902, + "train_acc": 0.5941, + "test_loss": 2.002239217376709, + "test_acc": 0.3398, + "lyapunov": null, + "grad_norm": 0.6668029786621408, + "grad_max_sv": 0.4022377036511898, + "grad_min_sv": 3.0301077691419207e-08, + "grad_condition": 13290330.075167935, + "lr": 0.0008950775061878452, + "time_sec": 49.5133171081543 + }, + { + "epoch": 22, + "train_loss": 1.1186233515167237, + "train_acc": 0.59978, + "test_loss": 3.6749740661621093, + "test_acc": 0.2938, + "lyapunov": null, + "grad_norm": 0.6355160393463501, + "grad_max_sv": 0.3662328697741032, + "grad_min_sv": 2.919807395862506e-08, + "grad_condition": 12676455.229119861, + "lr": 0.0008852566213878947, + "time_sec": 49.47933578491211 + }, + { + "epoch": 23, + "train_loss": 1.0992162245941162, + "train_acc": 0.60538, + "test_loss": 2.2956289947509765, + "test_acc": 0.3419, + "lyapunov": null, + "grad_norm": 0.6289434264719856, + "grad_max_sv": 0.3852032497525215, + "grad_min_sv": 2.838916279834791e-08, + "grad_condition": 13726993.354284357, + "lr": 0.0008750555348152298, + "time_sec": 49.46930289268494 + }, + { + "epoch": 24, + "train_loss": 1.09261875541687, + "train_acc": 0.6078, + "test_loss": 2.194385333251953, + "test_acc": 0.3862, + "lyapunov": null, + "grad_norm": 0.6127565268862699, + "grad_max_sv": 0.3749225478619337, + "grad_min_sv": 2.902605293897409e-08, + "grad_condition": 12941629.392305708, + "lr": 0.0008644843137107057, + "time_sec": 49.45948123931885 + }, + { + "epoch": 25, + "train_loss": 1.0722477124023437, + "train_acc": 0.61656, + "test_loss": 2.4663957664489744, + "test_acc": 0.3925, + "lyapunov": null, + "grad_norm": 0.5897825535844798, + "grad_max_sv": 0.371936571970582, + "grad_min_sv": 2.8421365216857452e-08, + "grad_condition": 13252758.329758141, + "lr": 0.0008535533905932737, + "time_sec": 49.479785442352295 + }, + { + "epoch": 26, + "train_loss": 1.0658014038848878, + "train_acc": 0.62154, + "test_loss": 2.2172969047546385, + "test_acc": 0.3602, + "lyapunov": null, + "grad_norm": 0.5970948959400837, + "grad_max_sv": 0.3504005130380392, + "grad_min_sv": 2.822866052021311e-08, + "grad_condition": 12516728.270259932, + "lr": 0.0008422735529643444, + "time_sec": 49.46492099761963 + }, + { + "epoch": 27, + "train_loss": 1.04928136428833, + "train_acc": 0.62394, + "test_loss": 2.3098046798706053, + "test_acc": 0.3753, + "lyapunov": null, + "grad_norm": 0.5799982623396496, + "grad_max_sv": 0.3511035542935133, + "grad_min_sv": 2.871881275012811e-08, + "grad_condition": 12420577.990074852, + "lr": 0.0008306559326618259, + "time_sec": 49.463754177093506 + }, + { + "epoch": 28, + "train_loss": 1.033934779319763, + "train_acc": 0.6312, + "test_loss": 2.5853637130737304, + "test_acc": 0.3827, + "lyapunov": null, + "grad_norm": 0.5626766992798455, + "grad_max_sv": 0.3680811390280724, + "grad_min_sv": 2.860611223454157e-08, + "grad_condition": 13030738.458713688, + "lr": 0.0008187119948743449, + "time_sec": 49.46650528907776 + }, + { + "epoch": 29, + "train_loss": 1.0245469808578491, + "train_acc": 0.63318, + "test_loss": 2.421029793548584, + "test_acc": 0.3777, + "lyapunov": null, + "grad_norm": 0.540434209171599, + "grad_max_sv": 0.33249553516507147, + "grad_min_sv": 2.5725369168227985e-08, + "grad_condition": 13074923.559065297, + "lr": 0.0008064535268264883, + "time_sec": 49.46920871734619 + }, + { + "epoch": 30, + "train_loss": 1.0157002903938293, + "train_acc": 0.63876, + "test_loss": 2.5748968841552733, + "test_acc": 0.353, + "lyapunov": null, + "grad_norm": 0.5335667641481916, + "grad_max_sv": 0.31497838646173476, + "grad_min_sv": 2.4617009453109516e-08, + "grad_condition": 12878002.467485525, + "lr": 0.0007938926261462367, + "time_sec": 49.47658443450928 + }, + { + "epoch": 31, + "train_loss": 1.0092763556671143, + "train_acc": 0.64072, + "test_loss": 2.575096744155884, + "test_acc": 0.3689, + "lyapunov": null, + "grad_norm": 0.5319602288309537, + "grad_max_sv": 0.33714523129165175, + "grad_min_sv": 2.6278444886784767e-08, + "grad_condition": 12997099.648816537, + "lr": 0.0007810416889260654, + "time_sec": 49.48014044761658 + }, + { + "epoch": 32, + "train_loss": 0.9945861617660523, + "train_acc": 0.64606, + "test_loss": 2.18585274848938, + "test_acc": 0.3591, + "lyapunov": null, + "grad_norm": 0.5207883539385971, + "grad_max_sv": 0.30190461575984956, + "grad_min_sv": 2.498473832268644e-08, + "grad_condition": 12302495.137337226, + "lr": 0.0007679133974894983, + "time_sec": 49.48141527175903 + }, + { + "epoch": 33, + "train_loss": 0.9839789762878418, + "train_acc": 0.65072, + "test_loss": 2.067453681182861, + "test_acc": 0.4015, + "lyapunov": null, + "grad_norm": 0.5202120303096632, + "grad_max_sv": 0.3107115812599659, + "grad_min_sv": 2.559975968985384e-08, + "grad_condition": 12183076.283694824, + "lr": 0.0007545207078751857, + "time_sec": 49.50013208389282 + }, + { + "epoch": 34, + "train_loss": 0.9741807369995117, + "train_acc": 0.6534, + "test_loss": 2.3987243717193603, + "test_acc": 0.3907, + "lyapunov": null, + "grad_norm": 0.5156705695841731, + "grad_max_sv": 0.3042212676256895, + "grad_min_sv": 2.4721938141070156e-08, + "grad_condition": 12439098.422273466, + "lr": 0.0007408768370508577, + "time_sec": 49.4883246421814 + }, + { + "epoch": 35, + "train_loss": 0.960876017742157, + "train_acc": 0.6604, + "test_loss": 2.952223745727539, + "test_acc": 0.3772, + "lyapunov": null, + "grad_norm": 0.49534065997567395, + "grad_max_sv": 0.3189103938639164, + "grad_min_sv": 2.6160001853625657e-08, + "grad_condition": 12245579.759729771, + "lr": 0.0007269952498697734, + "time_sec": 49.49185800552368 + }, + { + "epoch": 36, + "train_loss": 0.9563328867340087, + "train_acc": 0.66094, + "test_loss": 2.5444390853881838, + "test_acc": 0.3748, + "lyapunov": null, + "grad_norm": 0.5015211388674911, + "grad_max_sv": 0.301097634062171, + "grad_min_sv": 2.4840815004978368e-08, + "grad_condition": 12193384.34751702, + "lr": 0.0007128896457825364, + "time_sec": 49.473448038101196 + }, + { + "epoch": 37, + "train_loss": 0.9456947842597961, + "train_acc": 0.66318, + "test_loss": 2.8305119338989257, + "test_acc": 0.3608, + "lyapunov": null, + "grad_norm": 0.5027801927119517, + "grad_max_sv": 0.3191258400678635, + "grad_min_sv": 2.5498967737291876e-08, + "grad_condition": 12721385.179239903, + "lr": 0.0006985739453173903, + "time_sec": 49.47532916069031 + }, + { + "epoch": 38, + "train_loss": 0.9344060453033447, + "train_acc": 0.66828, + "test_loss": 2.3942235221862793, + "test_acc": 0.3846, + "lyapunov": null, + "grad_norm": 0.4893981754322751, + "grad_max_sv": 0.27843328677117823, + "grad_min_sv": 2.3813316207821345e-08, + "grad_condition": 11809731.27063098, + "lr": 0.0006840622763423391, + "time_sec": 49.466092109680176 + }, + { + "epoch": 39, + "train_loss": 0.9299031619262695, + "train_acc": 0.6701, + "test_loss": 2.5896951622009277, + "test_acc": 0.3377, + "lyapunov": null, + "grad_norm": 0.4877056898105668, + "grad_max_sv": 0.2895252756774426, + "grad_min_sv": 2.313919011953658e-08, + "grad_condition": 12624897.370656734, + "lr": 0.0006693689601226458, + "time_sec": 49.47689652442932 + }, + { + "epoch": 40, + "train_loss": 0.9202397887802124, + "train_acc": 0.67222, + "test_loss": 2.3479004539489745, + "test_acc": 0.3652, + "lyapunov": null, + "grad_norm": 0.48378803227864736, + "grad_max_sv": 0.2827453903853893, + "grad_min_sv": 2.3820017647224744e-08, + "grad_condition": 11971929.846932925, + "lr": 0.0006545084971874737, + "time_sec": 49.48384690284729 + }, + { + "epoch": 41, + "train_loss": 0.9035198735237122, + "train_acc": 0.67674, + "test_loss": 2.4544072883605956, + "test_acc": 0.4098, + "lyapunov": null, + "grad_norm": 0.48414477684461676, + "grad_max_sv": 0.2927399341017008, + "grad_min_sv": 2.5373001699691144e-08, + "grad_condition": 11722800.874950778, + "lr": 0.0006394955530196147, + "time_sec": 49.49253749847412 + }, + { + "epoch": 42, + "train_loss": 0.8996260007095337, + "train_acc": 0.67922, + "test_loss": 2.7968482540130615, + "test_acc": 0.3717, + "lyapunov": null, + "grad_norm": 0.47529519443329865, + "grad_max_sv": 0.2862662900239229, + "grad_min_sv": 2.4432264433826845e-08, + "grad_condition": 11830651.602965241, + "lr": 0.0006243449435824273, + "time_sec": 49.472256898880005 + }, + { + "epoch": 43, + "train_loss": 0.8935702981376648, + "train_acc": 0.68226, + "test_loss": 2.7968372314453127, + "test_acc": 0.3814, + "lyapunov": null, + "grad_norm": 0.47246322948696845, + "grad_max_sv": 0.2997207723557949, + "grad_min_sv": 2.4396437803275717e-08, + "grad_condition": 12442839.021676019, + "lr": 0.0006090716206982714, + "time_sec": 49.47343039512634 + }, + { + "epoch": 44, + "train_loss": 0.8839340761566162, + "train_acc": 0.68406, + "test_loss": 2.1332605548858643, + "test_acc": 0.4518, + "lyapunov": null, + "grad_norm": 0.4773353798688752, + "grad_max_sv": 0.287653349712491, + "grad_min_sv": 2.485683419095608e-08, + "grad_condition": 11744954.507169517, + "lr": 0.0005936906572928625, + "time_sec": 49.483134508132935 + }, + { + "epoch": 45, + "train_loss": 0.8809750416755676, + "train_acc": 0.6871, + "test_loss": 2.3744767669677733, + "test_acc": 0.4104, + "lyapunov": null, + "grad_norm": 0.47171575077424854, + "grad_max_sv": 0.2800353281199932, + "grad_min_sv": 2.4150169553038835e-08, + "grad_condition": 11697732.41688976, + "lr": 0.0005782172325201156, + "time_sec": 49.47827482223511 + }, + { + "epoch": 46, + "train_loss": 0.8651049407958984, + "train_acc": 0.69358, + "test_loss": 2.6672937103271486, + "test_acc": 0.4106, + "lyapunov": null, + "grad_norm": 0.46225804490680006, + "grad_max_sv": 0.2764727082103491, + "grad_min_sv": 2.4165243095453092e-08, + "grad_condition": 11539194.901861329, + "lr": 0.0005626666167821523, + "time_sec": 49.482288122177124 + }, + { + "epoch": 47, + "train_loss": 0.855909815826416, + "train_acc": 0.6953, + "test_loss": 2.1082290111541746, + "test_acc": 0.4302, + "lyapunov": null, + "grad_norm": 0.46665587567927413, + "grad_max_sv": 0.2777487523853779, + "grad_min_sv": 2.3157732442768975e-08, + "grad_condition": 12021773.98709596, + "lr": 0.0005470541566592572, + "time_sec": 49.48243308067322 + }, + { + "epoch": 48, + "train_loss": 0.8559737893295288, + "train_acc": 0.69554, + "test_loss": 2.6735187637329103, + "test_acc": 0.3758, + "lyapunov": null, + "grad_norm": 0.4613852081362787, + "grad_max_sv": 0.2753657314926386, + "grad_min_sv": 2.358262860546745e-08, + "grad_condition": 11826265.97781797, + "lr": 0.0005313952597646569, + "time_sec": 49.471890687942505 + }, + { + "epoch": 49, + "train_loss": 0.8440363460159301, + "train_acc": 0.69974, + "test_loss": 2.318854873275757, + "test_acc": 0.4239, + "lyapunov": null, + "grad_norm": 0.46468634824792515, + "grad_max_sv": 0.2798832211643457, + "grad_min_sv": 2.5059412145367333e-08, + "grad_condition": 11328180.182026755, + "lr": 0.0005157053795390643, + "time_sec": 49.46786379814148 + }, + { + "epoch": 50, + "train_loss": 0.8407046744155884, + "train_acc": 0.69938, + "test_loss": 2.2581016651153565, + "test_acc": 0.4586, + "lyapunov": null, + "grad_norm": 0.4552999687027473, + "grad_max_sv": 0.27262482419610023, + "grad_min_sv": 2.3505009449920066e-08, + "grad_condition": 11655869.156098623, + "lr": 0.0005000000000000002, + "time_sec": 49.46631741523743 + }, + { + "epoch": 51, + "train_loss": 0.8328268578910828, + "train_acc": 0.70616, + "test_loss": 2.021052066421509, + "test_acc": 0.4663, + "lyapunov": null, + "grad_norm": 0.45398371093616957, + "grad_max_sv": 0.2551860522478819, + "grad_min_sv": 2.261276339510232e-08, + "grad_condition": 11423398.903523896, + "lr": 0.00048429462046093607, + "time_sec": 49.49492907524109 + }, + { + "epoch": 52, + "train_loss": 0.8242957615280151, + "train_acc": 0.70608, + "test_loss": 2.4299042922973633, + "test_acc": 0.4339, + "lyapunov": null, + "grad_norm": 0.4518491350882313, + "grad_max_sv": 0.2677639227360487, + "grad_min_sv": 2.340493003849531e-08, + "grad_condition": 11498272.982724927, + "lr": 0.0004686047402353435, + "time_sec": 49.47549295425415 + }, + { + "epoch": 53, + "train_loss": 0.8202688133239746, + "train_acc": 0.70788, + "test_loss": 2.0557694828033446, + "test_acc": 0.4729, + "lyapunov": null, + "grad_norm": 0.45155452834894444, + "grad_max_sv": 0.2765634849667549, + "grad_min_sv": 2.294847063488703e-08, + "grad_condition": 12152279.677541133, + "lr": 0.000452945843340743, + "time_sec": 49.47136735916138 + }, + { + "epoch": 54, + "train_loss": 0.8075869009590149, + "train_acc": 0.71144, + "test_loss": 2.2601095848083497, + "test_acc": 0.469, + "lyapunov": null, + "grad_norm": 0.44703257607115265, + "grad_max_sv": 0.28669003024697304, + "grad_min_sv": 2.3961542838790707e-08, + "grad_condition": 11972426.895574057, + "lr": 0.00043733338321784806, + "time_sec": 49.472840785980225 + }, + { + "epoch": 55, + "train_loss": 0.8038845987319946, + "train_acc": 0.71234, + "test_loss": 1.9625594703674316, + "test_acc": 0.4966, + "lyapunov": null, + "grad_norm": 0.45158056349279113, + "grad_max_sv": 0.2616859499365091, + "grad_min_sv": 2.319859899735377e-08, + "grad_condition": 11323136.132990547, + "lr": 0.0004217827674798847, + "time_sec": 49.475728034973145 + }, + { + "epoch": 56, + "train_loss": 0.7961191424942017, + "train_acc": 0.71566, + "test_loss": 2.24710135345459, + "test_acc": 0.4678, + "lyapunov": null, + "grad_norm": 0.45114634744336685, + "grad_max_sv": 0.27140378654003144, + "grad_min_sv": 2.345107636969601e-08, + "grad_condition": 11702309.047382332, + "lr": 0.00040630934270713783, + "time_sec": 49.46745586395264 + }, + { + "epoch": 57, + "train_loss": 0.7886269653129577, + "train_acc": 0.71928, + "test_loss": 2.332701706314087, + "test_acc": 0.4392, + "lyapunov": null, + "grad_norm": 0.44691251964783024, + "grad_max_sv": 0.2512993272393942, + "grad_min_sv": 2.3577591501400263e-08, + "grad_condition": 10797942.504272973, + "lr": 0.000390928379301729, + "time_sec": 49.487914085388184 + }, + { + "epoch": 58, + "train_loss": 0.7809809253120422, + "train_acc": 0.72054, + "test_loss": 2.163261636352539, + "test_acc": 0.4825, + "lyapunov": null, + "grad_norm": 0.44707505885973187, + "grad_max_sv": 0.27487311884760857, + "grad_min_sv": 2.305816853009901e-08, + "grad_condition": 11921937.091947556, + "lr": 0.0003756550564175727, + "time_sec": 49.477548360824585 + }, + { + "epoch": 59, + "train_loss": 0.7728579918098449, + "train_acc": 0.72464, + "test_loss": 2.4211140827178954, + "test_acc": 0.4792, + "lyapunov": null, + "grad_norm": 0.442207932790873, + "grad_max_sv": 0.2551064256578684, + "grad_min_sv": 2.3925818348757842e-08, + "grad_condition": 10733599.660670992, + "lr": 0.00036050444698038553, + "time_sec": 49.47178077697754 + }, + { + "epoch": 60, + "train_loss": 0.7646781494522095, + "train_acc": 0.72672, + "test_loss": 2.02176361579895, + "test_acc": 0.4897, + "lyapunov": null, + "grad_norm": 0.4430698668925349, + "grad_max_sv": 0.26053123250603677, + "grad_min_sv": 2.3670396620545377e-08, + "grad_condition": 11170288.922506649, + "lr": 0.00034549150281252655, + "time_sec": 49.46177387237549 + }, + { + "epoch": 61, + "train_loss": 0.7588282846641541, + "train_acc": 0.7286, + "test_loss": 2.670531511688232, + "test_acc": 0.4198, + "lyapunov": null, + "grad_norm": 0.43898999083578233, + "grad_max_sv": 0.26667738817632197, + "grad_min_sv": 2.325178121154181e-08, + "grad_condition": 11623927.174902633, + "lr": 0.0003306310398773544, + "time_sec": 49.49580407142639 + }, + { + "epoch": 62, + "train_loss": 0.7492313718986511, + "train_acc": 0.73298, + "test_loss": 2.4778705802917482, + "test_acc": 0.449, + "lyapunov": null, + "grad_norm": 0.4417738790617677, + "grad_max_sv": 0.2574993997812271, + "grad_min_sv": 2.3859390374525445e-08, + "grad_condition": 10899105.692467105, + "lr": 0.00031593772365766127, + "time_sec": 49.486817836761475 + }, + { + "epoch": 63, + "train_loss": 0.7480638890266419, + "train_acc": 0.73324, + "test_loss": 2.1940598976135255, + "test_acc": 0.4734, + "lyapunov": null, + "grad_norm": 0.4366591281226868, + "grad_max_sv": 0.2512634038925171, + "grad_min_sv": 2.326989370082799e-08, + "grad_condition": 10851343.919251464, + "lr": 0.0003014260546826097, + "time_sec": 49.494584798812866 + }, + { + "epoch": 64, + "train_loss": 0.7451907014846801, + "train_acc": 0.73538, + "test_loss": 2.3143032501220704, + "test_acc": 0.4762, + "lyapunov": null, + "grad_norm": 0.4362314837898005, + "grad_max_sv": 0.2649652697145939, + "grad_min_sv": 2.3657484859995748e-08, + "grad_condition": 11323682.220760768, + "lr": 0.0002871103542174637, + "time_sec": 49.46461892127991 + }, + { + "epoch": 65, + "train_loss": 0.7316487748908996, + "train_acc": 0.73868, + "test_loss": 2.132633139801025, + "test_acc": 0.4893, + "lyapunov": null, + "grad_norm": 0.43117564557331234, + "grad_max_sv": 0.2554838340729475, + "grad_min_sv": 2.3040169683241628e-08, + "grad_condition": 11170455.423079647, + "lr": 0.0002730047501302267, + "time_sec": 49.4881227016449 + }, + { + "epoch": 66, + "train_loss": 0.7290266520881653, + "train_acc": 0.7408, + "test_loss": 2.396712022781372, + "test_acc": 0.4793, + "lyapunov": null, + "grad_norm": 0.43225303341958693, + "grad_max_sv": 0.2486136831343174, + "grad_min_sv": 2.2949348021938932e-08, + "grad_condition": 10962824.963370848, + "lr": 0.00025912316294914234, + "time_sec": 49.47016882896423 + }, + { + "epoch": 67, + "train_loss": 0.7191537443733216, + "train_acc": 0.74308, + "test_loss": 2.1576420639038085, + "test_acc": 0.4941, + "lyapunov": null, + "grad_norm": 0.42657147393758854, + "grad_max_sv": 0.2438450776040554, + "grad_min_sv": 2.3898531642529975e-08, + "grad_condition": 10287595.631951943, + "lr": 0.0002454792921248144, + "time_sec": 49.49215388298035 + }, + { + "epoch": 68, + "train_loss": 0.7169496524429322, + "train_acc": 0.74418, + "test_loss": 2.4695981254577637, + "test_acc": 0.4807, + "lyapunov": null, + "grad_norm": 0.4234097941028663, + "grad_max_sv": 0.24577417597174644, + "grad_min_sv": 2.2813544342525915e-08, + "grad_condition": 10779009.57251847, + "lr": 0.00023208660251050164, + "time_sec": 49.531681299209595 + }, + { + "epoch": 69, + "train_loss": 0.7072784723091126, + "train_acc": 0.74744, + "test_loss": 2.27939485244751, + "test_acc": 0.4853, + "lyapunov": null, + "grad_norm": 0.4251678846869415, + "grad_max_sv": 0.241105442866683, + "grad_min_sv": 2.3618906030975496e-08, + "grad_condition": 10243169.91188918, + "lr": 0.00021895831107393473, + "time_sec": 49.46745848655701 + }, + { + "epoch": 70, + "train_loss": 0.7093459980392456, + "train_acc": 0.74668, + "test_loss": 2.2168941738128662, + "test_acc": 0.4993, + "lyapunov": null, + "grad_norm": 0.4187232599688298, + "grad_max_sv": 0.2437821462750435, + "grad_min_sv": 2.330924906424059e-08, + "grad_condition": 10529543.438680641, + "lr": 0.00020610737385376356, + "time_sec": 49.46611166000366 + }, + { + "epoch": 71, + "train_loss": 0.7046173419761658, + "train_acc": 0.74866, + "test_loss": 2.6486716678619384, + "test_acc": 0.4604, + "lyapunov": null, + "grad_norm": 0.43152156311922873, + "grad_max_sv": 0.26821285113692284, + "grad_min_sv": 2.3308388552578663e-08, + "grad_condition": 11585490.938807528, + "lr": 0.00019354647317351177, + "time_sec": 49.484049558639526 + }, + { + "epoch": 72, + "train_loss": 0.6916852585601807, + "train_acc": 0.75164, + "test_loss": 2.4044878028869627, + "test_acc": 0.4868, + "lyapunov": null, + "grad_norm": 0.42974614402520106, + "grad_max_sv": 0.2577272642403841, + "grad_min_sv": 2.3734259935181968e-08, + "grad_condition": 10929944.700492647, + "lr": 0.0001812880051256552, + "time_sec": 49.47321033477783 + }, + { + "epoch": 73, + "train_loss": 0.6914860160255432, + "train_acc": 0.75462, + "test_loss": 2.459467795562744, + "test_acc": 0.4755, + "lyapunov": null, + "grad_norm": 0.4235499199054343, + "grad_max_sv": 0.2499073389917612, + "grad_min_sv": 2.312090292555524e-08, + "grad_condition": 10928192.758700397, + "lr": 0.00016934406733817422, + "time_sec": 49.47536325454712 + }, + { + "epoch": 74, + "train_loss": 0.6900841831016541, + "train_acc": 0.75346, + "test_loss": 2.529036985015869, + "test_acc": 0.4694, + "lyapunov": null, + "grad_norm": 0.4200493463432216, + "grad_max_sv": 0.24829606115818023, + "grad_min_sv": 2.3347005217999595e-08, + "grad_condition": 10777473.575533265, + "lr": 0.0001577264470356557, + "time_sec": 49.47671389579773 + }, + { + "epoch": 75, + "train_loss": 0.6844219914627075, + "train_acc": 0.75664, + "test_loss": 2.7192491188049317, + "test_acc": 0.4659, + "lyapunov": null, + "grad_norm": 0.41891725324120427, + "grad_max_sv": 0.2549721471965313, + "grad_min_sv": 2.308645701276646e-08, + "grad_condition": 11178421.697050892, + "lr": 0.00014644660940672634, + "time_sec": 49.475868701934814 + }, + { + "epoch": 76, + "train_loss": 0.6757127567672729, + "train_acc": 0.76002, + "test_loss": 2.228153326416016, + "test_acc": 0.4719, + "lyapunov": null, + "grad_norm": 0.41518783756559813, + "grad_max_sv": 0.24106829576194286, + "grad_min_sv": 2.3467413079458765e-08, + "grad_condition": 10331945.898118276, + "lr": 0.0001355156862892944, + "time_sec": 49.47853899002075 + }, + { + "epoch": 77, + "train_loss": 0.6663033656692505, + "train_acc": 0.7606, + "test_loss": 2.5164624114990235, + "test_acc": 0.4627, + "lyapunov": null, + "grad_norm": 0.41866630242016806, + "grad_max_sv": 0.2701979674398899, + "grad_min_sv": 2.4135091125643272e-08, + "grad_condition": 11260755.273271866, + "lr": 0.00012494446518477025, + "time_sec": 49.47706151008606 + }, + { + "epoch": 78, + "train_loss": 0.6645314185142517, + "train_acc": 0.76252, + "test_loss": 2.8226414447784425, + "test_acc": 0.4614, + "lyapunov": null, + "grad_norm": 0.4173542916715373, + "grad_max_sv": 0.2490392465144396, + "grad_min_sv": 2.3206901200722994e-08, + "grad_condition": 10823280.058633823, + "lr": 0.00011474337861210548, + "time_sec": 49.483954191207886 + }, + { + "epoch": 79, + "train_loss": 0.6665540114593506, + "train_acc": 0.76016, + "test_loss": 2.2122913623809812, + "test_acc": 0.4819, + "lyapunov": null, + "grad_norm": 0.4188547510844498, + "grad_max_sv": 0.25715495869517324, + "grad_min_sv": 2.4195212988686877e-08, + "grad_condition": 10755821.867443344, + "lr": 0.00010492249381215483, + "time_sec": 49.46640372276306 + }, + { + "epoch": 80, + "train_loss": 0.6579594387054444, + "train_acc": 0.76406, + "test_loss": 2.328022619628906, + "test_acc": 0.4922, + "lyapunov": null, + "grad_norm": 0.41446019268915407, + "grad_max_sv": 0.2467421844601631, + "grad_min_sv": 2.3609747978881047e-08, + "grad_condition": 10542743.78062649, + "lr": 9.549150281252637e-05, + "time_sec": 49.47466158866882 + }, + { + "epoch": 81, + "train_loss": 0.6575078699111938, + "train_acc": 0.76504, + "test_loss": 2.435921426773071, + "test_acc": 0.4706, + "lyapunov": null, + "grad_norm": 0.41722587257024396, + "grad_max_sv": 0.2460654556751251, + "grad_min_sv": 2.2818005085412097e-08, + "grad_condition": 10871762.933690486, + "lr": 8.645971286271918e-05, + "time_sec": 49.48575758934021 + }, + { + "epoch": 82, + "train_loss": 0.6540266362380981, + "train_acc": 0.7668, + "test_loss": 2.420010438537598, + "test_acc": 0.4873, + "lyapunov": null, + "grad_norm": 0.4134489054266664, + "grad_max_sv": 0.24872095324099064, + "grad_min_sv": 2.4063159953513492e-08, + "grad_condition": 10418409.724400165, + "lr": 7.78360372489926e-05, + "time_sec": 49.4517502784729 + }, + { + "epoch": 83, + "train_loss": 0.6572029878616333, + "train_acc": 0.76728, + "test_loss": 2.509574550628662, + "test_acc": 0.4741, + "lyapunov": null, + "grad_norm": 0.40888921626022273, + "grad_max_sv": 0.24261515885591506, + "grad_min_sv": 2.325806733871616e-08, + "grad_condition": 10519103.211694924, + "lr": 6.962898649802815e-05, + "time_sec": 49.47699522972107 + }, + { + "epoch": 84, + "train_loss": 0.648239343738556, + "train_acc": 0.76774, + "test_loss": 2.2645148223876954, + "test_acc": 0.485, + "lyapunov": null, + "grad_norm": 0.4120785615672335, + "grad_max_sv": 0.24379208087921142, + "grad_min_sv": 2.272370744904606e-08, + "grad_condition": 10771039.526767144, + "lr": 6.184665997806824e-05, + "time_sec": 49.461183071136475 + }, + { + "epoch": 85, + "train_loss": 0.6412541982460022, + "train_acc": 0.77106, + "test_loss": 2.5437144912719725, + "test_acc": 0.4865, + "lyapunov": null, + "grad_norm": 0.41805406865324773, + "grad_max_sv": 0.2572408441454172, + "grad_min_sv": 2.2814066324983172e-08, + "grad_condition": 11337861.01159941, + "lr": 5.449673790581613e-05, + "time_sec": 49.47793769836426 + }, + { + "epoch": 86, + "train_loss": 0.6463544520187378, + "train_acc": 0.76662, + "test_loss": 2.9264222496032715, + "test_acc": 0.4471, + "lyapunov": null, + "grad_norm": 0.4118969055764605, + "grad_max_sv": 0.2387235414236784, + "grad_min_sv": 2.2642364694291928e-08, + "grad_condition": 10550361.803450387, + "lr": 4.758647376699034e-05, + "time_sec": 49.4726197719574 + }, + { + "epoch": 87, + "train_loss": 0.6428634425735473, + "train_acc": 0.7704, + "test_loss": 2.5568968086242676, + "test_acc": 0.4759, + "lyapunov": null, + "grad_norm": 0.415046593792845, + "grad_max_sv": 0.2535580638796091, + "grad_min_sv": 2.363120126247509e-08, + "grad_condition": 10837761.433894884, + "lr": 4.112268715800956e-05, + "time_sec": 49.48099684715271 + }, + { + "epoch": 88, + "train_loss": 0.6407405834579468, + "train_acc": 0.77184, + "test_loss": 2.4600058319091795, + "test_acc": 0.475, + "lyapunov": null, + "grad_norm": 0.4135582126787873, + "grad_max_sv": 0.25508003048598765, + "grad_min_sv": 2.376858407870941e-08, + "grad_condition": 10837781.081215866, + "lr": 3.511175705587434e-05, + "time_sec": 49.47017812728882 + }, + { + "epoch": 89, + "train_loss": 0.6344939192008973, + "train_acc": 0.77288, + "test_loss": 2.4250204902648926, + "test_acc": 0.4787, + "lyapunov": null, + "grad_norm": 0.4160361292383021, + "grad_max_sv": 0.25198650658130645, + "grad_min_sv": 2.3671872506625392e-08, + "grad_condition": 10764847.245073054, + "lr": 2.9559615522887284e-05, + "time_sec": 49.48287224769592 + }, + { + "epoch": 90, + "train_loss": 0.6344009274482727, + "train_acc": 0.77354, + "test_loss": 2.7001010314941407, + "test_acc": 0.4623, + "lyapunov": null, + "grad_norm": 0.4089648902673904, + "grad_max_sv": 0.24975020438432693, + "grad_min_sv": 2.2971467306120984e-08, + "grad_condition": 10990208.207150657, + "lr": 2.447174185242324e-05, + "time_sec": 49.50636339187622 + }, + { + "epoch": 91, + "train_loss": 0.6388888354110718, + "train_acc": 0.77322, + "test_loss": 2.4007692584991456, + "test_acc": 0.482, + "lyapunov": null, + "grad_norm": 0.41394740295503574, + "grad_max_sv": 0.24785541072487832, + "grad_min_sv": 2.4093225903243366e-08, + "grad_condition": 10380601.978368312, + "lr": 1.9853157161528526e-05, + "time_sec": 49.47446608543396 + }, + { + "epoch": 92, + "train_loss": 0.6364776765632629, + "train_acc": 0.7745, + "test_loss": 2.399016780090332, + "test_acc": 0.4893, + "lyapunov": null, + "grad_norm": 0.4144776850028884, + "grad_max_sv": 0.23398316986858844, + "grad_min_sv": 2.3364770829203963e-08, + "grad_condition": 10152213.637178902, + "lr": 1.570841943568452e-05, + "time_sec": 49.4903450012207 + }, + { + "epoch": 93, + "train_loss": 0.6323039393615723, + "train_acc": 0.7761, + "test_loss": 2.5661166526794434, + "test_acc": 0.4799, + "lyapunov": null, + "grad_norm": 0.4148058440423859, + "grad_max_sv": 0.25038140527904035, + "grad_min_sv": 2.3675201843431638e-08, + "grad_condition": 10621575.74650034, + "lr": 1.204161903062634e-05, + "time_sec": 49.47283339500427 + }, + { + "epoch": 94, + "train_loss": 0.6312036778831482, + "train_acc": 0.77456, + "test_loss": 2.4954245025634765, + "test_acc": 0.4884, + "lyapunov": null, + "grad_norm": 0.41190158928123094, + "grad_max_sv": 0.23922828286886216, + "grad_min_sv": 2.3207600818864195e-08, + "grad_condition": 10426944.434691576, + "lr": 8.85637463565564e-06, + "time_sec": 49.4705286026001 + }, + { + "epoch": 95, + "train_loss": 0.631898609752655, + "train_acc": 0.77374, + "test_loss": 2.496735878753662, + "test_acc": 0.484, + "lyapunov": null, + "grad_norm": 0.4118919272482802, + "grad_max_sv": 0.2545221421867609, + "grad_min_sv": 2.265429692727139e-08, + "grad_condition": 11229071.176658351, + "lr": 6.155829702431171e-06, + "time_sec": 49.45284724235535 + }, + { + "epoch": 96, + "train_loss": 0.6379076655197143, + "train_acc": 0.77178, + "test_loss": 2.6363272483825684, + "test_acc": 0.476, + "lyapunov": null, + "grad_norm": 0.4109637736779776, + "grad_max_sv": 0.23244931511580944, + "grad_min_sv": 2.2822463163763017e-08, + "grad_condition": 10301145.344649881, + "lr": 3.942649342761118e-06, + "time_sec": 49.47940802574158 + }, + { + "epoch": 97, + "train_loss": 0.6325872544288635, + "train_acc": 0.77334, + "test_loss": 2.7118479751586912, + "test_acc": 0.4606, + "lyapunov": null, + "grad_norm": 0.4111072193471729, + "grad_max_sv": 0.23797121047973632, + "grad_min_sv": 2.2607291239040707e-08, + "grad_condition": 10688228.14219837, + "lr": 2.2190176984600023e-06, + "time_sec": 49.482439041137695 + }, + { + "epoch": 98, + "train_loss": 0.6342727423286438, + "train_acc": 0.77484, + "test_loss": 2.50120391998291, + "test_acc": 0.4868, + "lyapunov": null, + "grad_norm": 0.4137394255148928, + "grad_max_sv": 0.24089130759239197, + "grad_min_sv": 2.424639040654597e-08, + "grad_condition": 10056603.153747398, + "lr": 9.866357858642206e-07, + "time_sec": 49.48271298408508 + }, + { + "epoch": 99, + "train_loss": 0.628259766407013, + "train_acc": 0.77486, + "test_loss": 2.447319179916382, + "test_acc": 0.4885, + "lyapunov": null, + "grad_norm": 0.4076037809536703, + "grad_max_sv": 0.25056461431086063, + "grad_min_sv": 2.3701171647516616e-08, + "grad_condition": 10626762.207877642, + "lr": 2.467198171342e-07, + "time_sec": 49.45984363555908 + }, + { + "epoch": 100, + "train_loss": 0.6313758395767212, + "train_acc": 0.77534, + "test_loss": 2.4442952224731447, + "test_acc": 0.4905, + "lyapunov": null, + "grad_norm": 0.40858498927976306, + "grad_max_sv": 0.23060753419995308, + "grad_min_sv": 2.2785150743942496e-08, + "grad_condition": 10116355.973472353, + "lr": 0.0, + "time_sec": 49.46379518508911 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 2.717775194091797, + "train_acc": 0.12228, + "test_loss": 3.3459623817443847, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 7.716699984005914, + "grad_max_sv": 7.287460565567017, + "grad_min_sv": 2.5165389772041635e-07, + "grad_condition": 29456429.211788226, + "lr": 0.0009997532801828658, + "time_sec": 66.53277444839478 + }, + { + "epoch": 2, + "train_loss": 2.2721379792785643, + "train_acc": 0.17654, + "test_loss": 4.04989028930664, + "test_acc": 0.1003, + "lyapunov": null, + "grad_norm": 6.63637414556116, + "grad_max_sv": 6.237935948371887, + "grad_min_sv": 2.2601446723058415e-07, + "grad_condition": 28188789.96425259, + "lr": 0.0009990133642141358, + "time_sec": 66.55316853523254 + }, + { + "epoch": 3, + "train_loss": 2.137921618881226, + "train_acc": 0.2105, + "test_loss": 5.869428012084961, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 5.7520031644476814, + "grad_max_sv": 5.452845233678818, + "grad_min_sv": 1.9201941405810886e-07, + "grad_condition": 28919609.465649594, + "lr": 0.00099778098230154, + "time_sec": 66.56071186065674 + }, + { + "epoch": 4, + "train_loss": 2.0486733519744873, + "train_acc": 0.23394, + "test_loss": 5.161107911682129, + "test_acc": 0.1097, + "lyapunov": null, + "grad_norm": 4.91519980042541, + "grad_max_sv": 4.5814680576324465, + "grad_min_sv": 1.6788343710771868e-07, + "grad_condition": 27707547.33712595, + "lr": 0.000996057350657239, + "time_sec": 66.55148816108704 + }, + { + "epoch": 5, + "train_loss": 1.9897926804351806, + "train_acc": 0.25822, + "test_loss": 4.115356592559815, + "test_acc": 0.1203, + "lyapunov": null, + "grad_norm": 4.476936137063571, + "grad_max_sv": 4.264879077672958, + "grad_min_sv": 1.6287330311115512e-07, + "grad_condition": 27434565.90350554, + "lr": 0.0009938441702975688, + "time_sec": 66.53483939170837 + }, + { + "epoch": 6, + "train_loss": 1.950422788543701, + "train_acc": 0.26598, + "test_loss": 6.161662875366211, + "test_acc": 0.1038, + "lyapunov": null, + "grad_norm": 4.078084494569751, + "grad_max_sv": 3.8316186487674715, + "grad_min_sv": 1.5860823996405315e-07, + "grad_condition": 24946451.178036533, + "lr": 0.0009911436253643444, + "time_sec": 66.544926404953 + }, + { + "epoch": 7, + "train_loss": 1.9193549822998046, + "train_acc": 0.28804, + "test_loss": 6.333303915405273, + "test_acc": 0.1006, + "lyapunov": null, + "grad_norm": 3.9544625089709906, + "grad_max_sv": 3.660486602783203, + "grad_min_sv": 1.3159545346752567e-07, + "grad_condition": 27858533.203216422, + "lr": 0.0009879583809693736, + "time_sec": 66.54343152046204 + }, + { + "epoch": 8, + "train_loss": 1.8974505254364014, + "train_acc": 0.29166, + "test_loss": 6.595959260559082, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 3.7716319720252063, + "grad_max_sv": 3.4488155782222747, + "grad_min_sv": 1.3156188991558792e-07, + "grad_condition": 26979104.149509914, + "lr": 0.0009842915805643154, + "time_sec": 66.53689360618591 + }, + { + "epoch": 9, + "train_loss": 1.8757565868377686, + "train_acc": 0.2988, + "test_loss": 8.294800563049316, + "test_acc": 0.1001, + "lyapunov": null, + "grad_norm": 3.606736816077247, + "grad_max_sv": 3.276396805047989, + "grad_min_sv": 1.2148574111137122e-07, + "grad_condition": 27354129.68622259, + "lr": 0.0009801468428384714, + "time_sec": 66.53859829902649 + }, + { + "epoch": 10, + "train_loss": 1.853810763168335, + "train_acc": 0.30818, + "test_loss": 7.528170121765137, + "test_acc": 0.1002, + "lyapunov": null, + "grad_norm": 3.590286745766664, + "grad_max_sv": 3.3836376488208773, + "grad_min_sv": 1.2300289498057282e-07, + "grad_condition": 28478996.179412544, + "lr": 0.0009755282581475767, + "time_sec": 66.54752492904663 + }, + { + "epoch": 11, + "train_loss": 1.8360865605926513, + "train_acc": 0.31554, + "test_loss": 8.300324632263184, + "test_acc": 0.1004, + "lyapunov": null, + "grad_norm": 3.4184867147228633, + "grad_max_sv": 3.2137346804141997, + "grad_min_sv": 1.2349632871888616e-07, + "grad_condition": 27052165.93028751, + "lr": 0.0009704403844771127, + "time_sec": 66.54567265510559 + }, + { + "epoch": 12, + "train_loss": 1.822631957397461, + "train_acc": 0.32436, + "test_loss": 7.752643719482422, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 3.4268104192911824, + "grad_max_sv": 3.0984551936388014, + "grad_min_sv": 1.1916837276970682e-07, + "grad_condition": 26678795.929163624, + "lr": 0.0009648882429441257, + "time_sec": 66.54143714904785 + }, + { + "epoch": 13, + "train_loss": 1.8042937320327759, + "train_acc": 0.33052, + "test_loss": 6.320642838287354, + "test_acc": 0.1016, + "lyapunov": null, + "grad_norm": 3.26500321242579, + "grad_max_sv": 3.034997683763504, + "grad_min_sv": 1.1198519924704443e-07, + "grad_condition": 27516714.34616376, + "lr": 0.0009588773128419905, + "time_sec": 66.54663801193237 + }, + { + "epoch": 14, + "train_loss": 1.7935633684539796, + "train_acc": 0.33378, + "test_loss": 8.591533955383301, + "test_acc": 0.1001, + "lyapunov": null, + "grad_norm": 3.205935962438017, + "grad_max_sv": 2.9335897117853165, + "grad_min_sv": 1.0952790088225584e-07, + "grad_condition": 27285541.83012454, + "lr": 0.0009524135262330098, + "time_sec": 66.54473447799683 + }, + { + "epoch": 15, + "train_loss": 1.7773359481811524, + "train_acc": 0.34102, + "test_loss": 9.823327029418945, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 3.107803718888726, + "grad_max_sv": 2.8818213611841204, + "grad_min_sv": 1.1047076302617142e-07, + "grad_condition": 26466849.950957365, + "lr": 0.0009455032620941839, + "time_sec": 66.54632878303528 + }, + { + "epoch": 16, + "train_loss": 1.7638415741348266, + "train_acc": 0.3494, + "test_loss": 10.98111782836914, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 2.991047436873543, + "grad_max_sv": 2.6788798362016677, + "grad_min_sv": 9.756340197952796e-08, + "grad_condition": 27546377.57163794, + "lr": 0.0009381533400219318, + "time_sec": 66.5387659072876 + }, + { + "epoch": 17, + "train_loss": 1.7545028717422486, + "train_acc": 0.3524, + "test_loss": 8.496100090026856, + "test_acc": 0.1005, + "lyapunov": null, + "grad_norm": 2.9405206102474817, + "grad_max_sv": 2.7797821670770646, + "grad_min_sv": 1.0545847413112597e-07, + "grad_condition": 26402272.837948732, + "lr": 0.0009303710135019719, + "time_sec": 66.53228521347046 + }, + { + "epoch": 18, + "train_loss": 1.7399513541412353, + "train_acc": 0.35946, + "test_loss": 9.442770735168457, + "test_acc": 0.1002, + "lyapunov": null, + "grad_norm": 2.876673477887061, + "grad_max_sv": 2.652202320098877, + "grad_min_sv": 1.0433013795108081e-07, + "grad_condition": 26098642.755907767, + "lr": 0.0009221639627510076, + "time_sec": 66.52799201011658 + }, + { + "epoch": 19, + "train_loss": 1.7275141513061523, + "train_acc": 0.36564, + "test_loss": 8.60740804901123, + "test_acc": 0.1, + "lyapunov": null, + "grad_norm": 2.820914668477109, + "grad_max_sv": 2.8074967473745347, + "grad_min_sv": 1.0515814725664541e-07, + "grad_condition": 27554948.172257036, + "lr": 0.000913540287137281, + "time_sec": 66.53072094917297 + }, + { + "epoch": 20, + "train_loss": 1.7184981283187866, + "train_acc": 0.36706, + "test_loss": 5.74347527923584, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 2.755999508826315, + "grad_max_sv": 2.4683564633131025, + "grad_min_sv": 9.147877104709323e-08, + "grad_condition": 27108387.83832861, + "lr": 0.0009045084971874739, + "time_sec": 66.53930997848511 + }, + { + "epoch": 21, + "train_loss": 1.7127495180892944, + "train_acc": 0.36988, + "test_loss": 5.374083380126953, + "test_acc": 0.1038, + "lyapunov": null, + "grad_norm": 2.7076782774581156, + "grad_max_sv": 2.415825995802879, + "grad_min_sv": 9.989069553739682e-08, + "grad_condition": 24996642.26521779, + "lr": 0.0008950775061878452, + "time_sec": 66.5274007320404 + }, + { + "epoch": 22, + "train_loss": 1.7080568863677978, + "train_acc": 0.37366, + "test_loss": 5.8365667526245115, + "test_acc": 0.1074, + "lyapunov": null, + "grad_norm": 2.777540200252398, + "grad_max_sv": 2.682383918762207, + "grad_min_sv": 1.0115953053002613e-07, + "grad_condition": 27062321.26943115, + "lr": 0.0008852566213878947, + "time_sec": 66.52736306190491 + }, + { + "epoch": 23, + "train_loss": 1.6937433179473877, + "train_acc": 0.378, + "test_loss": 5.908844201660156, + "test_acc": 0.102, + "lyapunov": null, + "grad_norm": 2.5943120813718052, + "grad_max_sv": 2.4230685472488402, + "grad_min_sv": 9.802377860523848e-08, + "grad_condition": 25663315.966033876, + "lr": 0.0008750555348152298, + "time_sec": 66.55514574050903 + }, + { + "epoch": 24, + "train_loss": 1.685849613647461, + "train_acc": 0.38486, + "test_loss": 6.484691570281982, + "test_acc": 0.1015, + "lyapunov": null, + "grad_norm": 2.470392685402757, + "grad_max_sv": 2.3409340023994445, + "grad_min_sv": 9.386610759776204e-08, + "grad_condition": 25307930.60423732, + "lr": 0.0008644843137107057, + "time_sec": 66.55581784248352 + }, + { + "epoch": 25, + "train_loss": 1.6830421477890014, + "train_acc": 0.38556, + "test_loss": 7.468188558959961, + "test_acc": 0.1022, + "lyapunov": null, + "grad_norm": 2.548563020510745, + "grad_max_sv": 2.1459918454289437, + "grad_min_sv": 8.803468158902205e-08, + "grad_condition": 24944715.33907653, + "lr": 0.0008535533905932737, + "time_sec": 66.53887248039246 + }, + { + "epoch": 26, + "train_loss": 1.6700520505523682, + "train_acc": 0.38856, + "test_loss": 7.895222584533691, + "test_acc": 0.1009, + "lyapunov": null, + "grad_norm": 2.5359070370837204, + "grad_max_sv": 2.4539994060993195, + "grad_min_sv": 9.640742533179037e-08, + "grad_condition": 26335532.748314124, + "lr": 0.0008422735529643444, + "time_sec": 66.54404091835022 + }, + { + "epoch": 27, + "train_loss": 1.6605180406951905, + "train_acc": 0.39334, + "test_loss": 6.994429248046875, + "test_acc": 0.101, + "lyapunov": null, + "grad_norm": 2.4258405770471474, + "grad_max_sv": 2.320448189973831, + "grad_min_sv": 9.107987271050888e-08, + "grad_condition": 26102152.790860306, + "lr": 0.0008306559326618259, + "time_sec": 66.53805947303772 + }, + { + "epoch": 28, + "train_loss": 1.6567610062408447, + "train_acc": 0.395, + "test_loss": 6.368250694274902, + "test_acc": 0.1099, + "lyapunov": null, + "grad_norm": 2.4482138479454654, + "grad_max_sv": 2.1421856224536895, + "grad_min_sv": 8.29846632299791e-08, + "grad_condition": 25968573.760956615, + "lr": 0.0008187119948743449, + "time_sec": 66.56613659858704 + }, + { + "epoch": 29, + "train_loss": 1.643007601623535, + "train_acc": 0.39978, + "test_loss": 5.360125735473633, + "test_acc": 0.1039, + "lyapunov": null, + "grad_norm": 2.4260201472737237, + "grad_max_sv": 2.2909662395715715, + "grad_min_sv": 9.427450295973471e-08, + "grad_condition": 24999199.08130427, + "lr": 0.0008064535268264883, + "time_sec": 66.5019998550415 + }, + { + "epoch": 30, + "train_loss": 1.6426652933120727, + "train_acc": 0.40242, + "test_loss": 5.846046133422852, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 2.4104230560175877, + "grad_max_sv": 2.2003868728876115, + "grad_min_sv": 8.557402386699664e-08, + "grad_condition": 26105024.01238749, + "lr": 0.0007938926261462367, + "time_sec": 66.54244065284729 + }, + { + "epoch": 31, + "train_loss": 1.6377650901031495, + "train_acc": 0.4032, + "test_loss": 5.6720462432861325, + "test_acc": 0.1037, + "lyapunov": null, + "grad_norm": 2.3941082742204367, + "grad_max_sv": 2.1774697691202163, + "grad_min_sv": 8.963231525882521e-08, + "grad_condition": 24809583.231536172, + "lr": 0.0007810416889260654, + "time_sec": 66.54210758209229 + }, + { + "epoch": 32, + "train_loss": 1.6306892547607421, + "train_acc": 0.40602, + "test_loss": 6.530587504577637, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 2.310788163521601, + "grad_max_sv": 2.3168098986148835, + "grad_min_sv": 8.591319300421674e-08, + "grad_condition": 27429040.418645225, + "lr": 0.0007679133974894983, + "time_sec": 66.54988598823547 + }, + { + "epoch": 33, + "train_loss": 1.616210421142578, + "train_acc": 0.41068, + "test_loss": 6.481897874450683, + "test_acc": 0.1047, + "lyapunov": null, + "grad_norm": 2.280822445658443, + "grad_max_sv": 2.0465356022119523, + "grad_min_sv": 8.811248948248363e-08, + "grad_condition": 23945215.471904326, + "lr": 0.0007545207078751857, + "time_sec": 66.54384207725525 + }, + { + "epoch": 34, + "train_loss": 1.6103173712921142, + "train_acc": 0.4129, + "test_loss": 7.558738642883301, + "test_acc": 0.1004, + "lyapunov": null, + "grad_norm": 2.268328370380239, + "grad_max_sv": 1.9925297170877456, + "grad_min_sv": 8.015654646698067e-08, + "grad_condition": 25172747.9746131, + "lr": 0.0007408768370508577, + "time_sec": 66.53899669647217 + }, + { + "epoch": 35, + "train_loss": 1.6033166294860839, + "train_acc": 0.41878, + "test_loss": 7.87334995880127, + "test_acc": 0.1014, + "lyapunov": null, + "grad_norm": 2.1857354046879727, + "grad_max_sv": 1.9975714191794396, + "grad_min_sv": 7.650004620884943e-08, + "grad_condition": 26089987.057969414, + "lr": 0.0007269952498697734, + "time_sec": 66.5277693271637 + }, + { + "epoch": 36, + "train_loss": 1.6046894992446898, + "train_acc": 0.41892, + "test_loss": 8.474886727905274, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 2.192178860403557, + "grad_max_sv": 2.002661418914795, + "grad_min_sv": 8.41961090181087e-08, + "grad_condition": 24123592.75292515, + "lr": 0.0007128896457825364, + "time_sec": 66.54011392593384 + }, + { + "epoch": 37, + "train_loss": 1.5938314058685303, + "train_acc": 0.42164, + "test_loss": 7.729584867858887, + "test_acc": 0.1023, + "lyapunov": null, + "grad_norm": 2.181177891654343, + "grad_max_sv": 2.0365157604217528, + "grad_min_sv": 8.0202053975853e-08, + "grad_condition": 26197254.249608647, + "lr": 0.0006985739453173903, + "time_sec": 66.53632307052612 + }, + { + "epoch": 38, + "train_loss": 1.5886405113220214, + "train_acc": 0.42264, + "test_loss": 5.7885481513977055, + "test_acc": 0.1062, + "lyapunov": null, + "grad_norm": 2.138587269147521, + "grad_max_sv": 1.933423602581024, + "grad_min_sv": 7.520017115680844e-08, + "grad_condition": 25928003.19539905, + "lr": 0.0006840622763423391, + "time_sec": 66.54145908355713 + }, + { + "epoch": 39, + "train_loss": 1.5804911177825929, + "train_acc": 0.42612, + "test_loss": 6.7240009689331055, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 2.146582724428281, + "grad_max_sv": 1.8961839854717255, + "grad_min_sv": 7.674624242781647e-08, + "grad_condition": 24938086.191727363, + "lr": 0.0006693689601226458, + "time_sec": 66.54460453987122 + }, + { + "epoch": 40, + "train_loss": 1.5785979819488525, + "train_acc": 0.42734, + "test_loss": 6.793812344360352, + "test_acc": 0.1033, + "lyapunov": null, + "grad_norm": 2.0524354853565967, + "grad_max_sv": 1.9275713503360747, + "grad_min_sv": 7.654831097880788e-08, + "grad_condition": 25599705.595900334, + "lr": 0.0006545084971874737, + "time_sec": 66.78280329704285 + }, + { + "epoch": 41, + "train_loss": 1.5828138892364503, + "train_acc": 0.42612, + "test_loss": 6.44511951751709, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 2.1085813246105163, + "grad_max_sv": 1.9095334649085998, + "grad_min_sv": 7.941251247700621e-08, + "grad_condition": 24686632.04929278, + "lr": 0.0006394955530196147, + "time_sec": 66.53900074958801 + }, + { + "epoch": 42, + "train_loss": 1.5717257321548461, + "train_acc": 0.42996, + "test_loss": 8.174863388061523, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 2.0568855518830627, + "grad_max_sv": 1.8603438019752503, + "grad_min_sv": 8.168111662598676e-08, + "grad_condition": 23782864.12280636, + "lr": 0.0006243449435824273, + "time_sec": 66.54205513000488 + }, + { + "epoch": 43, + "train_loss": 1.562401286239624, + "train_acc": 0.43392, + "test_loss": 7.7131751495361325, + "test_acc": 0.1014, + "lyapunov": null, + "grad_norm": 2.0119184672620642, + "grad_max_sv": 1.8657386392354964, + "grad_min_sv": 7.582975278808135e-08, + "grad_condition": 24942971.18450144, + "lr": 0.0006090716206982714, + "time_sec": 66.53042316436768 + }, + { + "epoch": 44, + "train_loss": 1.5541102393341064, + "train_acc": 0.43712, + "test_loss": 8.247987678527831, + "test_acc": 0.1011, + "lyapunov": null, + "grad_norm": 1.9482695609274137, + "grad_max_sv": 1.6971077546477318, + "grad_min_sv": 7.249982623136474e-08, + "grad_condition": 23783887.230844818, + "lr": 0.0005936906572928625, + "time_sec": 66.5365047454834 + }, + { + "epoch": 45, + "train_loss": 1.551253000793457, + "train_acc": 0.43906, + "test_loss": 7.164133547973633, + "test_acc": 0.1021, + "lyapunov": null, + "grad_norm": 1.9478309625288126, + "grad_max_sv": 1.7972041130065919, + "grad_min_sv": 7.798710131012853e-08, + "grad_condition": 23697966.26066207, + "lr": 0.0005782172325201156, + "time_sec": 66.54136061668396 + }, + { + "epoch": 46, + "train_loss": 1.541000611190796, + "train_acc": 0.44134, + "test_loss": 6.376314013671875, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 1.8630241109997108, + "grad_max_sv": 1.6913443714380265, + "grad_min_sv": 7.214549819778427e-08, + "grad_condition": 23808757.926116575, + "lr": 0.0005626666167821523, + "time_sec": 66.55902171134949 + }, + { + "epoch": 47, + "train_loss": 1.5372591391754151, + "train_acc": 0.44398, + "test_loss": 6.5030721710205075, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 1.9024590490680153, + "grad_max_sv": 1.814224436879158, + "grad_min_sv": 7.368249033135044e-08, + "grad_condition": 25117471.09981022, + "lr": 0.0005470541566592572, + "time_sec": 66.52199673652649 + }, + { + "epoch": 48, + "train_loss": 1.5375283456802369, + "train_acc": 0.44544, + "test_loss": 7.119714102935791, + "test_acc": 0.1016, + "lyapunov": null, + "grad_norm": 1.8585907694205182, + "grad_max_sv": 1.7394830703735351, + "grad_min_sv": 7.501465217885084e-08, + "grad_condition": 23906344.012628905, + "lr": 0.0005313952597646569, + "time_sec": 66.54580640792847 + }, + { + "epoch": 49, + "train_loss": 1.5338307555770874, + "train_acc": 0.4442, + "test_loss": 5.397337831115722, + "test_acc": 0.1059, + "lyapunov": null, + "grad_norm": 1.7902731589528738, + "grad_max_sv": 1.6494132414460183, + "grad_min_sv": 6.831805556828386e-08, + "grad_condition": 24615282.56582328, + "lr": 0.0005157053795390643, + "time_sec": 66.53534126281738 + }, + { + "epoch": 50, + "train_loss": 1.5284276412963866, + "train_acc": 0.44778, + "test_loss": 5.524033654785156, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 1.7713612838130008, + "grad_max_sv": 1.5726667106151582, + "grad_min_sv": 6.907176626214096e-08, + "grad_condition": 22960902.516891498, + "lr": 0.0005000000000000002, + "time_sec": 66.5325882434845 + }, + { + "epoch": 51, + "train_loss": 1.5330605014801026, + "train_acc": 0.44666, + "test_loss": 6.847183532714844, + "test_acc": 0.1031, + "lyapunov": null, + "grad_norm": 1.7792073911302086, + "grad_max_sv": 1.6382696747779846, + "grad_min_sv": 6.6116589625409e-08, + "grad_condition": 24861349.651776347, + "lr": 0.00048429462046093607, + "time_sec": 66.53938388824463 + }, + { + "epoch": 52, + "train_loss": 1.515211699180603, + "train_acc": 0.45132, + "test_loss": 6.849605633544922, + "test_acc": 0.1046, + "lyapunov": null, + "grad_norm": 1.7110848232260776, + "grad_max_sv": 1.4070507645606996, + "grad_min_sv": 6.268320333902011e-08, + "grad_condition": 22502851.341604523, + "lr": 0.0004686047402353435, + "time_sec": 66.54575228691101 + }, + { + "epoch": 53, + "train_loss": 1.511851570777893, + "train_acc": 0.44984, + "test_loss": 6.742161424255371, + "test_acc": 0.1035, + "lyapunov": null, + "grad_norm": 1.6990701953393579, + "grad_max_sv": 1.5247679650783539, + "grad_min_sv": 6.360552236017725e-08, + "grad_condition": 24187524.31056104, + "lr": 0.000452945843340743, + "time_sec": 66.55630564689636 + }, + { + "epoch": 54, + "train_loss": 1.5134658539581298, + "train_acc": 0.45194, + "test_loss": 6.076722029113769, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 1.67595650149666, + "grad_max_sv": 1.521102523803711, + "grad_min_sv": 6.705203148271721e-08, + "grad_condition": 23102185.373464666, + "lr": 0.00043733338321784806, + "time_sec": 66.54796624183655 + }, + { + "epoch": 55, + "train_loss": 1.5127635479736328, + "train_acc": 0.45416, + "test_loss": 6.099140180969238, + "test_acc": 0.1054, + "lyapunov": null, + "grad_norm": 1.669713615396416, + "grad_max_sv": 1.4162977203726768, + "grad_min_sv": 5.9198181379116475e-08, + "grad_condition": 24265418.333155036, + "lr": 0.0004217827674798847, + "time_sec": 66.56652212142944 + }, + { + "epoch": 56, + "train_loss": 1.5037149493789672, + "train_acc": 0.45674, + "test_loss": 5.881203063964843, + "test_acc": 0.106, + "lyapunov": null, + "grad_norm": 1.6488336383475701, + "grad_max_sv": 1.5071144998073578, + "grad_min_sv": 6.376719170475554e-08, + "grad_condition": 23818554.434521496, + "lr": 0.00040630934270713783, + "time_sec": 66.53574323654175 + }, + { + "epoch": 57, + "train_loss": 1.504850189590454, + "train_acc": 0.459, + "test_loss": 5.68402534790039, + "test_acc": 0.1076, + "lyapunov": null, + "grad_norm": 1.6129911107480968, + "grad_max_sv": 1.4527282550930978, + "grad_min_sv": 6.286840470437483e-08, + "grad_condition": 23483060.334747117, + "lr": 0.000390928379301729, + "time_sec": 66.54559707641602 + }, + { + "epoch": 58, + "train_loss": 1.4977053466033936, + "train_acc": 0.45916, + "test_loss": 5.9823997062683105, + "test_acc": 0.1071, + "lyapunov": null, + "grad_norm": 1.6061924832487942, + "grad_max_sv": 1.3888853162527084, + "grad_min_sv": 6.253125484079192e-08, + "grad_condition": 22608679.418678027, + "lr": 0.0003756550564175727, + "time_sec": 66.55387783050537 + }, + { + "epoch": 59, + "train_loss": 1.4972542272949219, + "train_acc": 0.45872, + "test_loss": 5.0882811370849605, + "test_acc": 0.1151, + "lyapunov": null, + "grad_norm": 1.5591682163016796, + "grad_max_sv": 1.3346713334321976, + "grad_min_sv": 5.8280132453347735e-08, + "grad_condition": 23069467.539254077, + "lr": 0.00036050444698038553, + "time_sec": 66.54211473464966 + }, + { + "epoch": 60, + "train_loss": 1.4907029873657227, + "train_acc": 0.46126, + "test_loss": 7.020564842224121, + "test_acc": 0.1048, + "lyapunov": null, + "grad_norm": 1.5345406038505094, + "grad_max_sv": 1.4284722179174423, + "grad_min_sv": 6.001468877414595e-08, + "grad_condition": 24162295.485593982, + "lr": 0.00034549150281252655, + "time_sec": 66.55491805076599 + }, + { + "epoch": 61, + "train_loss": 1.4877613472366333, + "train_acc": 0.4653, + "test_loss": 4.854167632293701, + "test_acc": 0.1114, + "lyapunov": null, + "grad_norm": 1.5324361061772793, + "grad_max_sv": 1.325933101773262, + "grad_min_sv": 5.964644183009682e-08, + "grad_condition": 22280923.908054985, + "lr": 0.0003306310398773544, + "time_sec": 66.54050326347351 + }, + { + "epoch": 62, + "train_loss": 1.4875999914550782, + "train_acc": 0.4609, + "test_loss": 6.024991397094727, + "test_acc": 0.1045, + "lyapunov": null, + "grad_norm": 1.5157035873578593, + "grad_max_sv": 1.2820105284452439, + "grad_min_sv": 5.6854590901878056e-08, + "grad_condition": 22744392.831777684, + "lr": 0.00031593772365766127, + "time_sec": 66.56322026252747 + }, + { + "epoch": 63, + "train_loss": 1.4804442275238037, + "train_acc": 0.46586, + "test_loss": 6.877338618469238, + "test_acc": 0.1028, + "lyapunov": null, + "grad_norm": 1.5037529747226948, + "grad_max_sv": 1.3301736950874328, + "grad_min_sv": 6.064568385255597e-08, + "grad_condition": 22458783.805724658, + "lr": 0.0003014260546826097, + "time_sec": 66.55420660972595 + }, + { + "epoch": 64, + "train_loss": 1.4785625118637085, + "train_acc": 0.4676, + "test_loss": 5.8289501716613765, + "test_acc": 0.1058, + "lyapunov": null, + "grad_norm": 1.4955609555476688, + "grad_max_sv": 1.2231090664863586, + "grad_min_sv": 5.909942020210224e-08, + "grad_condition": 21200746.17398096, + "lr": 0.0002871103542174637, + "time_sec": 66.55184054374695 + }, + { + "epoch": 65, + "train_loss": 1.474054185218811, + "train_acc": 0.4692, + "test_loss": 6.821263113403321, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 1.4816881050330082, + "grad_max_sv": 1.304422627389431, + "grad_min_sv": 6.126439071607592e-08, + "grad_condition": 22262717.79019341, + "lr": 0.0002730047501302267, + "time_sec": 66.54631876945496 + }, + { + "epoch": 66, + "train_loss": 1.468451905593872, + "train_acc": 0.46872, + "test_loss": 6.21660086593628, + "test_acc": 0.1049, + "lyapunov": null, + "grad_norm": 1.4471343716270808, + "grad_max_sv": 1.2118137910962106, + "grad_min_sv": 5.677175121121536e-08, + "grad_condition": 21833909.31574912, + "lr": 0.00025912316294914234, + "time_sec": 66.54650139808655 + }, + { + "epoch": 67, + "train_loss": 1.473218607635498, + "train_acc": 0.46886, + "test_loss": 5.585741909790039, + "test_acc": 0.1093, + "lyapunov": null, + "grad_norm": 1.4454249735567377, + "grad_max_sv": 1.344612455368042, + "grad_min_sv": 5.805593232821593e-08, + "grad_condition": 23703781.24599778, + "lr": 0.0002454792921248144, + "time_sec": 66.54963803291321 + }, + { + "epoch": 68, + "train_loss": 1.464357560043335, + "train_acc": 0.47134, + "test_loss": 6.43534487915039, + "test_acc": 0.1036, + "lyapunov": null, + "grad_norm": 1.4158825945249984, + "grad_max_sv": 1.216756673157215, + "grad_min_sv": 5.594884520121468e-08, + "grad_condition": 22117575.184218023, + "lr": 0.00023208660251050164, + "time_sec": 66.53380155563354 + }, + { + "epoch": 69, + "train_loss": 1.4605754261016846, + "train_acc": 0.47354, + "test_loss": 6.361464812469483, + "test_acc": 0.1041, + "lyapunov": null, + "grad_norm": 1.4102858398212452, + "grad_max_sv": 1.2650031745433807, + "grad_min_sv": 5.616340708058942e-08, + "grad_condition": 22755240.415779583, + "lr": 0.00021895831107393473, + "time_sec": 66.55379509925842 + }, + { + "epoch": 70, + "train_loss": 1.4566728033065797, + "train_acc": 0.4732, + "test_loss": 7.030058961486817, + "test_acc": 0.1052, + "lyapunov": null, + "grad_norm": 1.4004542368068666, + "grad_max_sv": 1.1733321487903594, + "grad_min_sv": 5.324388059335661e-08, + "grad_condition": 22428640.626706712, + "lr": 0.00020610737385376356, + "time_sec": 66.53196001052856 + }, + { + "epoch": 71, + "train_loss": 1.4595127109909058, + "train_acc": 0.4747, + "test_loss": 6.251192915344238, + "test_acc": 0.1055, + "lyapunov": null, + "grad_norm": 1.4007518176750748, + "grad_max_sv": 1.2036359310150146, + "grad_min_sv": 5.3584219283919765e-08, + "grad_condition": 22661079.860923886, + "lr": 0.00019354647317351177, + "time_sec": 66.53831934928894 + }, + { + "epoch": 72, + "train_loss": 1.4561804718780518, + "train_acc": 0.47592, + "test_loss": 6.078685757446289, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 1.3882159701453969, + "grad_max_sv": 1.1710434511303902, + "grad_min_sv": 5.193670311598453e-08, + "grad_condition": 22617697.621583022, + "lr": 0.0001812880051256552, + "time_sec": 66.53273725509644 + }, + { + "epoch": 73, + "train_loss": 1.456334539833069, + "train_acc": 0.47646, + "test_loss": 6.318551240539551, + "test_acc": 0.1053, + "lyapunov": null, + "grad_norm": 1.3893052276682352, + "grad_max_sv": 1.262186436355114, + "grad_min_sv": 5.998066114898392e-08, + "grad_condition": 21695066.67305842, + "lr": 0.00016934406733817422, + "time_sec": 66.53349781036377 + }, + { + "epoch": 74, + "train_loss": 1.450936794128418, + "train_acc": 0.48046, + "test_loss": 5.979817550659179, + "test_acc": 0.105, + "lyapunov": null, + "grad_norm": 1.3659009379358413, + "grad_max_sv": 1.2089540883898735, + "grad_min_sv": 5.6734091380405974e-08, + "grad_condition": 21453559.245642237, + "lr": 0.0001577264470356557, + "time_sec": 66.5519745349884 + }, + { + "epoch": 75, + "train_loss": 1.4469789163970947, + "train_acc": 0.47906, + "test_loss": 6.295627461242676, + "test_acc": 0.1067, + "lyapunov": null, + "grad_norm": 1.3551347445295552, + "grad_max_sv": 1.1976817324757576, + "grad_min_sv": 5.458875831365617e-08, + "grad_condition": 22252931.086762276, + "lr": 0.00014644660940672634, + "time_sec": 66.55559992790222 + }, + { + "epoch": 76, + "train_loss": 1.4463843099212645, + "train_acc": 0.47934, + "test_loss": 6.197264282226563, + "test_acc": 0.1079, + "lyapunov": null, + "grad_norm": 1.3380208446863917, + "grad_max_sv": 1.2127704448997974, + "grad_min_sv": 5.3017609769057116e-08, + "grad_condition": 23070185.252038278, + "lr": 0.0001355156862892944, + "time_sec": 66.54188418388367 + }, + { + "epoch": 77, + "train_loss": 1.4422340731430054, + "train_acc": 0.47956, + "test_loss": 6.095625473022461, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 1.319834743092097, + "grad_max_sv": 1.0997839123010635, + "grad_min_sv": 5.253857917608684e-08, + "grad_condition": 21034235.602306478, + "lr": 0.00012494446518477025, + "time_sec": 66.54432153701782 + }, + { + "epoch": 78, + "train_loss": 1.4469564128875732, + "train_acc": 0.48036, + "test_loss": 5.388970955657959, + "test_acc": 0.11, + "lyapunov": null, + "grad_norm": 1.3475784983368762, + "grad_max_sv": 1.2046680554747582, + "grad_min_sv": 5.585839417676652e-08, + "grad_condition": 21905924.79288598, + "lr": 0.00011474337861210548, + "time_sec": 66.53302836418152 + }, + { + "epoch": 79, + "train_loss": 1.4366684397125244, + "train_acc": 0.4798, + "test_loss": 6.206115145874024, + "test_acc": 0.1069, + "lyapunov": null, + "grad_norm": 1.3130109628098805, + "grad_max_sv": 1.1744658067822455, + "grad_min_sv": 5.508810989596213e-08, + "grad_condition": 21715398.426144313, + "lr": 0.00010492249381215483, + "time_sec": 66.53135848045349 + }, + { + "epoch": 80, + "train_loss": 1.4392537023544312, + "train_acc": 0.48228, + "test_loss": 6.179986186218262, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 1.3256940413341314, + "grad_max_sv": 1.1846244156360626, + "grad_min_sv": 5.3839901603680576e-08, + "grad_condition": 22125564.09370377, + "lr": 9.549150281252637e-05, + "time_sec": 66.5379912853241 + }, + { + "epoch": 81, + "train_loss": 1.4338660355377197, + "train_acc": 0.48616, + "test_loss": 6.177688023376465, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 1.331304941867422, + "grad_max_sv": 1.2059139341115952, + "grad_min_sv": 5.419374078385886e-08, + "grad_condition": 22342309.054380674, + "lr": 8.645971286271918e-05, + "time_sec": 66.5526373386383 + }, + { + "epoch": 82, + "train_loss": 1.4322706761550903, + "train_acc": 0.48346, + "test_loss": 6.39905592956543, + "test_acc": 0.1049, + "lyapunov": null, + "grad_norm": 1.3160308800060254, + "grad_max_sv": 1.1150345966219901, + "grad_min_sv": 5.504024436220334e-08, + "grad_condition": 20495998.096470684, + "lr": 7.78360372489926e-05, + "time_sec": 66.53385639190674 + }, + { + "epoch": 83, + "train_loss": 1.4299918703460692, + "train_acc": 0.48306, + "test_loss": 6.442905668640137, + "test_acc": 0.1051, + "lyapunov": null, + "grad_norm": 1.3113912638515688, + "grad_max_sv": 1.0838071212172509, + "grad_min_sv": 5.43203230840561e-08, + "grad_condition": 20241235.03989599, + "lr": 6.962898649802815e-05, + "time_sec": 66.52077317237854 + }, + { + "epoch": 84, + "train_loss": 1.4280065909194946, + "train_acc": 0.4822, + "test_loss": 6.0934767837524415, + "test_acc": 0.1077, + "lyapunov": null, + "grad_norm": 1.3219999598887227, + "grad_max_sv": 1.1636987075209617, + "grad_min_sv": 5.4432569296380964e-08, + "grad_condition": 21698960.666762732, + "lr": 6.184665997806824e-05, + "time_sec": 66.54324150085449 + }, + { + "epoch": 85, + "train_loss": 1.426846856918335, + "train_acc": 0.4865, + "test_loss": 5.9188161468505855, + "test_acc": 0.107, + "lyapunov": null, + "grad_norm": 1.2965845421535789, + "grad_max_sv": 1.1792906790971756, + "grad_min_sv": 5.5100021434384416e-08, + "grad_condition": 21690369.73733188, + "lr": 5.449673790581613e-05, + "time_sec": 66.53187370300293 + }, + { + "epoch": 86, + "train_loss": 1.4228094031524658, + "train_acc": 0.48556, + "test_loss": 6.137683601379394, + "test_acc": 0.108, + "lyapunov": null, + "grad_norm": 1.292831856620217, + "grad_max_sv": 1.0124387323856354, + "grad_min_sv": 5.2233392278111523e-08, + "grad_condition": 19602805.79996558, + "lr": 4.758647376699034e-05, + "time_sec": 66.53067183494568 + }, + { + "epoch": 87, + "train_loss": 1.429165520362854, + "train_acc": 0.48332, + "test_loss": 5.927753118133545, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 1.3101745862822605, + "grad_max_sv": 1.1612930461764335, + "grad_min_sv": 5.276717347513227e-08, + "grad_condition": 22472879.957919728, + "lr": 4.112268715800956e-05, + "time_sec": 66.53908562660217 + }, + { + "epoch": 88, + "train_loss": 1.4288117279052734, + "train_acc": 0.48666, + "test_loss": 6.013241593933105, + "test_acc": 0.1075, + "lyapunov": null, + "grad_norm": 1.3007188330408852, + "grad_max_sv": 1.139727284014225, + "grad_min_sv": 5.308784185587001e-08, + "grad_condition": 21649216.459450316, + "lr": 3.511175705587434e-05, + "time_sec": 66.52465963363647 + }, + { + "epoch": 89, + "train_loss": 1.4234879583358764, + "train_acc": 0.48672, + "test_loss": 5.440691387176513, + "test_acc": 0.1132, + "lyapunov": null, + "grad_norm": 1.286797693166196, + "grad_max_sv": 1.1378898680210114, + "grad_min_sv": 5.206395803369901e-08, + "grad_condition": 22299317.66856014, + "lr": 2.9559615522887284e-05, + "time_sec": 66.52217221260071 + }, + { + "epoch": 90, + "train_loss": 1.4255534106445313, + "train_acc": 0.4873, + "test_loss": 5.6889183303833, + "test_acc": 0.1089, + "lyapunov": null, + "grad_norm": 1.2907871997501676, + "grad_max_sv": 1.1832163825631141, + "grad_min_sv": 5.3787662057658284e-08, + "grad_condition": 22287194.786688134, + "lr": 2.447174185242324e-05, + "time_sec": 66.53036832809448 + }, + { + "epoch": 91, + "train_loss": 1.4252548498916626, + "train_acc": 0.48792, + "test_loss": 6.261311422729492, + "test_acc": 0.1064, + "lyapunov": null, + "grad_norm": 1.3031797280361905, + "grad_max_sv": 1.1937354177236557, + "grad_min_sv": 5.396164546311866e-08, + "grad_condition": 22285756.773222417, + "lr": 1.9853157161528526e-05, + "time_sec": 66.53405451774597 + }, + { + "epoch": 92, + "train_loss": 1.4257716689300537, + "train_acc": 0.48484, + "test_loss": 5.9496440505981445, + "test_acc": 0.1083, + "lyapunov": null, + "grad_norm": 1.2963951565864091, + "grad_max_sv": 1.1119507551193237, + "grad_min_sv": 5.530857025703995e-08, + "grad_condition": 20517700.461063318, + "lr": 1.570841943568452e-05, + "time_sec": 66.55413794517517 + }, + { + "epoch": 93, + "train_loss": 1.4217627249526978, + "train_acc": 0.48994, + "test_loss": 5.984926200866699, + "test_acc": 0.1075, + "lyapunov": null, + "grad_norm": 1.264014206865248, + "grad_max_sv": 1.0518594324588775, + "grad_min_sv": 4.926823864437324e-08, + "grad_condition": 21435816.94874554, + "lr": 1.204161903062634e-05, + "time_sec": 66.52945113182068 + }, + { + "epoch": 94, + "train_loss": 1.4220651029205322, + "train_acc": 0.48712, + "test_loss": 5.9274788650512695, + "test_acc": 0.107, + "lyapunov": null, + "grad_norm": 1.2852744864782746, + "grad_max_sv": 1.194958347082138, + "grad_min_sv": 5.49836086882749e-08, + "grad_condition": 21876849.948771022, + "lr": 8.85637463565564e-06, + "time_sec": 66.53060245513916 + }, + { + "epoch": 95, + "train_loss": 1.4127644922637939, + "train_acc": 0.4891, + "test_loss": 6.033211676025391, + "test_acc": 0.1068, + "lyapunov": null, + "grad_norm": 1.2852733904252112, + "grad_max_sv": 1.1103495568037034, + "grad_min_sv": 5.0794950290367066e-08, + "grad_condition": 21903481.59645809, + "lr": 6.155829702431171e-06, + "time_sec": 66.54151201248169 + }, + { + "epoch": 96, + "train_loss": 1.42291917427063, + "train_acc": 0.48754, + "test_loss": 5.946468173217774, + "test_acc": 0.1078, + "lyapunov": null, + "grad_norm": 1.296502082808029, + "grad_max_sv": 1.1921778261661529, + "grad_min_sv": 5.59618015927299e-08, + "grad_condition": 21704630.944007598, + "lr": 3.942649342761118e-06, + "time_sec": 66.53685402870178 + }, + { + "epoch": 97, + "train_loss": 1.4221784051132202, + "train_acc": 0.48922, + "test_loss": 5.77611974029541, + "test_acc": 0.1107, + "lyapunov": null, + "grad_norm": 1.283101201721102, + "grad_max_sv": 1.1582708179950714, + "grad_min_sv": 5.3498822172315384e-08, + "grad_condition": 21893400.606446274, + "lr": 2.2190176984600023e-06, + "time_sec": 66.51551508903503 + }, + { + "epoch": 98, + "train_loss": 1.4199727509307862, + "train_acc": 0.48888, + "test_loss": 5.947603340148926, + "test_acc": 0.1072, + "lyapunov": null, + "grad_norm": 1.2852084329880165, + "grad_max_sv": 1.12471182346344, + "grad_min_sv": 5.5720254987789984e-08, + "grad_condition": 20744598.237500653, + "lr": 9.866357858642206e-07, + "time_sec": 66.54128313064575 + }, + { + "epoch": 99, + "train_loss": 1.4189085994720458, + "train_acc": 0.49036, + "test_loss": 6.019410075378418, + "test_acc": 0.1088, + "lyapunov": null, + "grad_norm": 1.2671570273045278, + "grad_max_sv": 1.044458197057247, + "grad_min_sv": 5.2453829901821794e-08, + "grad_condition": 20122144.845569003, + "lr": 2.467198171342e-07, + "time_sec": 66.5876886844635 + }, + { + "epoch": 100, + "train_loss": 1.4237549599456787, + "train_acc": 0.48696, + "test_loss": 6.123869666290283, + "test_acc": 0.1056, + "lyapunov": null, + "grad_norm": 1.2842958901976373, + "grad_max_sv": 1.0893320694565773, + "grad_min_sv": 5.240736280498481e-08, + "grad_condition": 20983923.24178537, + "lr": 0.0, + "time_sec": 66.52526140213013 + } + ] + }, + "lyapunov": { + "4": [ + { + "epoch": 1, + "train_loss": 5.9559499659729, + "train_acc": 0.1816, + "test_loss": 2.127836145401001, + "test_acc": 0.2458, + "lyapunov": 3.1805403927707916, + "grad_norm": 7.669457973262479, + "grad_max_sv": 5.918661725521088, + "grad_min_sv": 2.931642846704108e-07, + "grad_condition": 20422744.62807854, + "lr": 0.0009997532801828658, + "time_sec": 38.74378061294556 + }, + { + "epoch": 2, + "train_loss": 4.402947195281983, + "train_acc": 0.19622, + "test_loss": 2.0710217851638792, + "test_acc": 0.2599, + "lyapunov": 2.5604425824206807, + "grad_norm": 5.322089969338386, + "grad_max_sv": 4.252373713254928, + "grad_min_sv": 1.9552239614029076e-07, + "grad_condition": 22174922.12126705, + "lr": 0.0009990133642141358, + "time_sec": 38.64048624038696 + }, + { + "epoch": 3, + "train_loss": 4.045168105316162, + "train_acc": 0.22284, + "test_loss": 2.047537351036072, + "test_acc": 0.275, + "lyapunov": 2.4094676093372236, + "grad_norm": 3.329135536451279, + "grad_max_sv": 2.700692330300808, + "grad_min_sv": 1.3114565362570828e-07, + "grad_condition": 21120674.055912692, + "lr": 0.00099778098230154, + "time_sec": 38.632225036621094 + }, + { + "epoch": 4, + "train_loss": 3.8760036846923827, + "train_acc": 0.23552, + "test_loss": 2.0494147090911867, + "test_acc": 0.2624, + "lyapunov": 2.323524356803016, + "grad_norm": 1.6169046791962502, + "grad_max_sv": 1.2880224913358689, + "grad_min_sv": 5.374016822656813e-08, + "grad_condition": 24107383.024291664, + "lr": 0.000996057350657239, + "time_sec": 38.643821477890015 + }, + { + "epoch": 5, + "train_loss": 3.7066750312805175, + "train_acc": 0.23364, + "test_loss": 2.073809361457825, + "test_acc": 0.2559, + "lyapunov": 2.2068090539454195, + "grad_norm": 0.6888041501699484, + "grad_max_sv": 0.4505885936319828, + "grad_min_sv": 2.5095627176341396e-08, + "grad_condition": 18224356.70160868, + "lr": 0.0009938441702975688, + "time_sec": 38.63996958732605 + }, + { + "epoch": 6, + "train_loss": 3.5870462338256837, + "train_acc": 0.22278, + "test_loss": 2.0948594261169435, + "test_acc": 0.2419, + "lyapunov": 2.1068829035819947, + "grad_norm": 0.4525297557038159, + "grad_max_sv": 0.2912705983966589, + "grad_min_sv": 1.4355599531334918e-08, + "grad_condition": 20443883.38963156, + "lr": 0.0009911436253643444, + "time_sec": 38.64875626564026 + }, + { + "epoch": 7, + "train_loss": 3.516497625274658, + "train_acc": 0.20518, + "test_loss": 2.122341016769409, + "test_acc": 0.2149, + "lyapunov": 2.031583094535886, + "grad_norm": 0.4192338818357315, + "grad_max_sv": 0.2666142761707306, + "grad_min_sv": 1.244383397436266e-08, + "grad_condition": 21524577.239365414, + "lr": 0.0009879583809693736, + "time_sec": 38.65327429771423 + }, + { + "epoch": 8, + "train_loss": 3.500787953567505, + "train_acc": 0.15934, + "test_loss": 2.30495919342041, + "test_acc": 0.1, + "lyapunov": 1.9705595735393826, + "grad_norm": 0.364806685633591, + "grad_max_sv": 0.19433156847953797, + "grad_min_sv": 7.78323775238877e-09, + "grad_condition": 1400511997.1550007, + "lr": 0.0009842915805643154, + "time_sec": 38.633607625961304 + }, + { + "epoch": 9, + "train_loss": 3.5612770445251463, + "train_acc": 0.0995, + "test_loss": 2.309052435684204, + "test_acc": 0.1, + "lyapunov": 1.9462372851188836, + "grad_norm": 0.1961322565486487, + "grad_max_sv": 0.08832639907486736, + "grad_min_sv": 7.733921171735724e-10, + "grad_condition": 10141008570.944132, + "lr": 0.0009801468428384714, + "time_sec": 38.646180152893066 + }, + { + "epoch": 10, + "train_loss": 3.538458889770508, + "train_acc": 0.09824, + "test_loss": 2.3040579429626464, + "test_acc": 0.1, + "lyapunov": 1.9283022353106447, + "grad_norm": 0.21318046705690488, + "grad_max_sv": 0.0782687779981643, + "grad_min_sv": 8.435315090236436e-10, + "grad_condition": 12098584585.465805, + "lr": 0.0009755282581475767, + "time_sec": 38.63904404640198 + }, + { + "epoch": 11, + "train_loss": 3.529650466461182, + "train_acc": 0.10062, + "test_loss": 2.302797904205322, + "test_acc": 0.1, + "lyapunov": 1.9214661554302401, + "grad_norm": 0.14436104663435, + "grad_max_sv": 0.07406298876740039, + "grad_min_sv": 1.8938792208460978e-10, + "grad_condition": 16582547419.599035, + "lr": 0.0009704403844771127, + "time_sec": 38.65141201019287 + }, + { + "epoch": 12, + "train_loss": 3.527643050994873, + "train_acc": 0.09804, + "test_loss": 2.3026904548645017, + "test_acc": 0.1, + "lyapunov": 1.9200294935489859, + "grad_norm": 0.13153432020985192, + "grad_max_sv": 0.05873946417123079, + "grad_min_sv": 2.2213949011783955e-10, + "grad_condition": 29679782911.168915, + "lr": 0.0009648882429441257, + "time_sec": 38.637062311172485 + }, + { + "epoch": 13, + "train_loss": 3.525748397216797, + "train_acc": 0.09986, + "test_loss": 2.3026839447021485, + "test_acc": 0.1, + "lyapunov": 1.9183377143367173, + "grad_norm": 0.1253530383790545, + "grad_max_sv": 0.054947068355977534, + "grad_min_sv": 2.484597018350735e-10, + "grad_condition": 32728296691.529114, + "lr": 0.0009588773128419905, + "time_sec": 38.639862060546875 + }, + { + "epoch": 14, + "train_loss": 3.5267535670471193, + "train_acc": 0.09928, + "test_loss": 2.303218070602417, + "test_acc": 0.1, + "lyapunov": 1.9196420743337372, + "grad_norm": 0.1092532269273596, + "grad_max_sv": 0.04395028324797749, + "grad_min_sv": 9.613613581557888e-11, + "grad_condition": 21168413985.92494, + "lr": 0.0009524135262330098, + "time_sec": 38.639400243759155 + }, + { + "epoch": 15, + "train_loss": 3.5285498448181154, + "train_acc": 0.0982, + "test_loss": 2.3035209484100343, + "test_acc": 0.1, + "lyapunov": 1.920996154055876, + "grad_norm": 0.10604045531455125, + "grad_max_sv": 0.030423881998285652, + "grad_min_sv": 8.947113291620313e-11, + "grad_condition": 14692894250.958597, + "lr": 0.0009455032620941839, + "time_sec": 38.645652770996094 + }, + { + "epoch": 16, + "train_loss": 3.5281584407806394, + "train_acc": 0.09964, + "test_loss": 2.3028687210083008, + "test_acc": 0.1, + "lyapunov": 1.9207957717768676, + "grad_norm": 0.09543807455983376, + "grad_max_sv": 0.006560872681438923, + "grad_min_sv": 4.056405124991419e-12, + "grad_condition": 3706750979.9989243, + "lr": 0.0009381533400219318, + "time_sec": 38.63558006286621 + }, + { + "epoch": 17, + "train_loss": 3.5265050379943848, + "train_acc": 0.09798, + "test_loss": 2.302896424102783, + "test_acc": 0.1, + "lyapunov": 1.9195188765635576, + "grad_norm": 0.09404328433417611, + "grad_max_sv": 0.005626836745068431, + "grad_min_sv": 8.896868440940896e-13, + "grad_condition": 3600570896.7918577, + "lr": 0.0009303710135019719, + "time_sec": 38.63581418991089 + }, + { + "epoch": 18, + "train_loss": 3.5274914381408693, + "train_acc": 0.09708, + "test_loss": 2.3026503776550293, + "test_acc": 0.1, + "lyapunov": 1.9202668194270804, + "grad_norm": 0.09620880376142034, + "grad_max_sv": 0.003721812926232815, + "grad_min_sv": 3.080583531323011e-13, + "grad_condition": 2605476049.955305, + "lr": 0.0009221639627510076, + "time_sec": 38.637654304504395 + }, + { + "epoch": 19, + "train_loss": 3.5240187657165527, + "train_acc": 0.09788, + "test_loss": 2.3026472286224364, + "test_acc": 0.1, + "lyapunov": 1.917564369833378, + "grad_norm": 0.08696272623748423, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000913540287137281, + "time_sec": 38.64585041999817 + }, + { + "epoch": 20, + "train_loss": 3.526093559265137, + "train_acc": 0.09698, + "test_loss": 2.302675205993652, + "test_acc": 0.1, + "lyapunov": 1.9192343212454521, + "grad_norm": 0.08759130668154863, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009045084971874739, + "time_sec": 38.63778305053711 + }, + { + "epoch": 21, + "train_loss": 3.5268382842254637, + "train_acc": 0.0963, + "test_loss": 2.302619518661499, + "test_acc": 0.1, + "lyapunov": 1.9198827185594212, + "grad_norm": 0.09131899089817433, + "grad_max_sv": 0.0007137967739254236, + "grad_min_sv": 1.2143662959650498e-34, + "grad_condition": 713796773.9254236, + "lr": 0.0008950775061878452, + "time_sec": 38.63694953918457 + }, + { + "epoch": 22, + "train_loss": 3.5266487127685546, + "train_acc": 0.09736, + "test_loss": 2.302595558166504, + "test_acc": 0.1, + "lyapunov": 1.919754564914557, + "grad_norm": 0.08451797479839518, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878947, + "time_sec": 38.62629771232605 + }, + { + "epoch": 23, + "train_loss": 3.526773832244873, + "train_acc": 0.09764, + "test_loss": 2.3026504470825193, + "test_acc": 0.1, + "lyapunov": 1.919811970132696, + "grad_norm": 0.0880141883169143, + "grad_max_sv": 0.003215626534074545, + "grad_min_sv": 6.757893669575438e-13, + "grad_condition": 421691349.6171393, + "lr": 0.0008750555348152298, + "time_sec": 38.627503395080566 + }, + { + "epoch": 24, + "train_loss": 3.5253559977722166, + "train_acc": 0.09686, + "test_loss": 2.302592763519287, + "test_acc": 0.1, + "lyapunov": 1.9186803285423142, + "grad_norm": 0.08625519727104183, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107057, + "time_sec": 38.62110924720764 + }, + { + "epoch": 25, + "train_loss": 3.5271505029296875, + "train_acc": 0.09882, + "test_loss": 2.3026457008361816, + "test_acc": 0.1, + "lyapunov": 1.9201455759575299, + "grad_norm": 0.08664315655618471, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008535533905932737, + "time_sec": 38.663304567337036 + }, + { + "epoch": 26, + "train_loss": 3.52567841835022, + "train_acc": 0.09848, + "test_loss": 2.302622730255127, + "test_acc": 0.1, + "lyapunov": 1.918919243775975, + "grad_norm": 0.08931714213407926, + "grad_max_sv": 0.0026560820173472167, + "grad_min_sv": 7.80326428931121e-27, + "grad_condition": 2656082017.346831, + "lr": 0.0008422735529643444, + "time_sec": 38.642497539520264 + }, + { + "epoch": 27, + "train_loss": 3.5247526208496094, + "train_acc": 0.09662, + "test_loss": 2.3026296226501466, + "test_acc": 0.1, + "lyapunov": 1.9182322189935943, + "grad_norm": 0.08339910325165188, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008306559326618259, + "time_sec": 38.63079476356506 + }, + { + "epoch": 28, + "train_loss": 3.5269400009155274, + "train_acc": 0.09728, + "test_loss": 2.3025920150756836, + "test_acc": 0.1, + "lyapunov": 1.9199587207316133, + "grad_norm": 0.08394537087665149, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 38.61244583129883 + }, + { + "epoch": 29, + "train_loss": 3.5242063328552247, + "train_acc": 0.09546, + "test_loss": 2.3025877166748048, + "test_acc": 0.1, + "lyapunov": 1.9176992738948149, + "grad_norm": 0.08393484553605075, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008064535268264883, + "time_sec": 38.62086057662964 + }, + { + "epoch": 30, + "train_loss": 3.524652021865845, + "train_acc": 0.09846, + "test_loss": 2.3025890396118163, + "test_acc": 0.1, + "lyapunov": 1.9180299269268886, + "grad_norm": 0.08604739858068552, + "grad_max_sv": 0.0037235306110233067, + "grad_min_sv": 2.2816656604449788e-14, + "grad_condition": 2522915018.0120707, + "lr": 0.0007938926261462367, + "time_sec": 38.63639521598816 + }, + { + "epoch": 31, + "train_loss": 3.5269307495117186, + "train_acc": 0.09852, + "test_loss": 2.302594734954834, + "test_acc": 0.1, + "lyapunov": 1.9199556487295635, + "grad_norm": 0.08308332919661195, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 38.632620334625244 + }, + { + "epoch": 32, + "train_loss": 3.526603982696533, + "train_acc": 0.0987, + "test_loss": 2.3026425048828125, + "test_acc": 0.1, + "lyapunov": 1.9197655053394835, + "grad_norm": 0.08373608851321027, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 38.6338005065918 + }, + { + "epoch": 33, + "train_loss": 3.5402134245300294, + "train_acc": 0.09648, + "test_loss": 2.3025889293670656, + "test_acc": 0.1, + "lyapunov": 1.926927990010937, + "grad_norm": 0.09981834537565924, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 38.6455602645874 + }, + { + "epoch": 34, + "train_loss": 3.5265413635253906, + "train_acc": 0.09788, + "test_loss": 2.302589825439453, + "test_acc": 0.1, + "lyapunov": 1.9196307095115448, + "grad_norm": 0.08459800727870437, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 38.652732133865356 + }, + { + "epoch": 35, + "train_loss": 3.526457656402588, + "train_acc": 0.09848, + "test_loss": 2.3025897277832033, + "test_acc": 0.1, + "lyapunov": 1.91963635930015, + "grad_norm": 0.08392830107993868, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 38.618977308273315 + }, + { + "epoch": 36, + "train_loss": 3.5264506495666503, + "train_acc": 0.09836, + "test_loss": 2.302591544342041, + "test_acc": 0.1, + "lyapunov": 1.919547389840226, + "grad_norm": 0.0844841992615646, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 38.635788917541504 + }, + { + "epoch": 37, + "train_loss": 3.525513755493164, + "train_acc": 0.09824, + "test_loss": 2.302587795257568, + "test_acc": 0.1, + "lyapunov": 1.9188998626626057, + "grad_norm": 0.08511865281250128, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 38.63599181175232 + }, + { + "epoch": 38, + "train_loss": 3.5258794207763673, + "train_acc": 0.09634, + "test_loss": 2.302587114715576, + "test_acc": 0.1, + "lyapunov": 1.9190363072983139, + "grad_norm": 0.08976844520779069, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 38.631999015808105 + }, + { + "epoch": 39, + "train_loss": 3.526812607116699, + "train_acc": 0.09782, + "test_loss": 2.3025868911743164, + "test_acc": 0.1, + "lyapunov": 1.9198928242144377, + "grad_norm": 0.08338895706252505, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 38.62815856933594 + }, + { + "epoch": 40, + "train_loss": 3.5299447924041747, + "train_acc": 0.09834, + "test_loss": 2.302587143325806, + "test_acc": 0.1, + "lyapunov": 1.9223552085554507, + "grad_norm": 0.09522270183573409, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 38.62764048576355 + }, + { + "epoch": 41, + "train_loss": 3.529573831253052, + "train_acc": 0.0978, + "test_loss": 2.3025870990753172, + "test_acc": 0.1, + "lyapunov": 1.922197810829143, + "grad_norm": 0.08338290015497958, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 38.63026428222656 + }, + { + "epoch": 42, + "train_loss": 3.5254642880249025, + "train_acc": 0.09878, + "test_loss": 2.302588144683838, + "test_acc": 0.1, + "lyapunov": 1.9188408784549256, + "grad_norm": 0.08333708848875665, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 38.63510298728943 + }, + { + "epoch": 43, + "train_loss": 3.527522850036621, + "train_acc": 0.09724, + "test_loss": 2.302586852264404, + "test_acc": 0.1, + "lyapunov": 1.920439124717127, + "grad_norm": 0.08392990999765709, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 38.61439347267151 + }, + { + "epoch": 44, + "train_loss": 3.5268155879211425, + "train_acc": 0.09854, + "test_loss": 2.302588026046753, + "test_acc": 0.1, + "lyapunov": 1.919859874583876, + "grad_norm": 0.08808142140863674, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 38.63164472579956 + }, + { + "epoch": 45, + "train_loss": 3.528644903793335, + "train_acc": 0.09726, + "test_loss": 2.302586632156372, + "test_acc": 0.1, + "lyapunov": 1.9213885017063306, + "grad_norm": 0.08163685266757659, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 38.63089060783386 + }, + { + "epoch": 46, + "train_loss": 3.5269173733520507, + "train_acc": 0.09548, + "test_loss": 2.302586455535889, + "test_acc": 0.1, + "lyapunov": 1.9199798500446408, + "grad_norm": 0.08000528496736534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 38.636719703674316 + }, + { + "epoch": 47, + "train_loss": 3.525616721343994, + "train_acc": 0.0969, + "test_loss": 2.3025855419158936, + "test_acc": 0.1, + "lyapunov": 1.918914921753242, + "grad_norm": 0.0847797082901155, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 38.63527321815491 + }, + { + "epoch": 48, + "train_loss": 3.527122305908203, + "train_acc": 0.09908, + "test_loss": 2.302587979507446, + "test_acc": 0.1, + "lyapunov": 1.9201535523090216, + "grad_norm": 0.08334551671941194, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 38.6254460811615 + }, + { + "epoch": 49, + "train_loss": 3.529289007568359, + "train_acc": 0.09836, + "test_loss": 2.3025873039245606, + "test_acc": 0.1, + "lyapunov": 1.9219778029205243, + "grad_norm": 0.08239563380139257, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 38.63705110549927 + }, + { + "epoch": 50, + "train_loss": 3.5303411560821534, + "train_acc": 0.0977, + "test_loss": 2.3025870582580565, + "test_acc": 0.1, + "lyapunov": 1.9227478766380368, + "grad_norm": 0.08162963599167514, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 38.626914262771606 + }, + { + "epoch": 51, + "train_loss": 3.5286489057922363, + "train_acc": 0.09604, + "test_loss": 2.302586822128296, + "test_acc": 0.1, + "lyapunov": 1.9214349052180415, + "grad_norm": 0.08139452605749796, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 38.64423418045044 + }, + { + "epoch": 52, + "train_loss": 3.525787140045166, + "train_acc": 0.09778, + "test_loss": 2.3025859855651856, + "test_acc": 0.1, + "lyapunov": 1.9190660763884444, + "grad_norm": 0.08146521230474718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 38.6294162273407 + }, + { + "epoch": 53, + "train_loss": 3.5288507063293455, + "train_acc": 0.09546, + "test_loss": 2.3025855419158936, + "test_acc": 0.1, + "lyapunov": 1.9215699824530754, + "grad_norm": 0.08218605919682316, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 38.62653970718384 + }, + { + "epoch": 54, + "train_loss": 3.5271841695404054, + "train_acc": 0.09872, + "test_loss": 2.3025858070373535, + "test_acc": 0.1, + "lyapunov": 1.9201822860161666, + "grad_norm": 0.08216715344839949, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 38.638410806655884 + }, + { + "epoch": 55, + "train_loss": 3.526853522644043, + "train_acc": 0.09744, + "test_loss": 2.3025860900878907, + "test_acc": 0.1, + "lyapunov": 1.919959136897036, + "grad_norm": 0.0817176354250303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 38.630091190338135 + }, + { + "epoch": 56, + "train_loss": 3.5288575717926025, + "train_acc": 0.09954, + "test_loss": 2.302586184310913, + "test_acc": 0.1, + "lyapunov": 1.921623296444983, + "grad_norm": 0.08257148205256129, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 38.64346218109131 + }, + { + "epoch": 57, + "train_loss": 3.5272767601776125, + "train_acc": 0.09642, + "test_loss": 2.302586555480957, + "test_acc": 0.1, + "lyapunov": 1.9202661358791848, + "grad_norm": 0.08293348649238423, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 38.64233660697937 + }, + { + "epoch": 58, + "train_loss": 3.526464948577881, + "train_acc": 0.09672, + "test_loss": 2.3025856628417967, + "test_acc": 0.1, + "lyapunov": 1.9196561523105786, + "grad_norm": 0.08164186959675705, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 38.63249588012695 + }, + { + "epoch": 59, + "train_loss": 3.5295531370544433, + "train_acc": 0.09774, + "test_loss": 2.302585400390625, + "test_acc": 0.1, + "lyapunov": 1.9221740268990206, + "grad_norm": 0.08246273738852085, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 38.646018266677856 + }, + { + "epoch": 60, + "train_loss": 3.5271629650115965, + "train_acc": 0.0971, + "test_loss": 2.3025858444213867, + "test_acc": 0.1, + "lyapunov": 1.9201987954356787, + "grad_norm": 0.08208001883222767, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 38.6309814453125 + }, + { + "epoch": 61, + "train_loss": 3.5265548262023927, + "train_acc": 0.0977, + "test_loss": 2.302585780715942, + "test_acc": 0.1, + "lyapunov": 1.9197500297785415, + "grad_norm": 0.08189736323511718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 38.638221740722656 + }, + { + "epoch": 62, + "train_loss": 3.52600441986084, + "train_acc": 0.09678, + "test_loss": 2.302585761642456, + "test_acc": 0.1, + "lyapunov": 1.9192463177854142, + "grad_norm": 0.08137598978711448, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 38.63043713569641 + }, + { + "epoch": 63, + "train_loss": 3.5271013943481444, + "train_acc": 0.09814, + "test_loss": 2.302585670852661, + "test_acc": 0.1, + "lyapunov": 1.920157666096602, + "grad_norm": 0.0823619758981674, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 38.63147497177124 + }, + { + "epoch": 64, + "train_loss": 3.526780191192627, + "train_acc": 0.09852, + "test_loss": 2.302585818862915, + "test_acc": 0.1, + "lyapunov": 1.919904801546765, + "grad_norm": 0.08022492391600272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 38.62516927719116 + }, + { + "epoch": 65, + "train_loss": 3.5343781797790528, + "train_acc": 0.09912, + "test_loss": 2.3025853904724123, + "test_acc": 0.1, + "lyapunov": 1.9257748550771143, + "grad_norm": 0.10073329729823817, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 38.634148836135864 + }, + { + "epoch": 66, + "train_loss": 3.5349793888092043, + "train_acc": 0.09842, + "test_loss": 2.3025853446960447, + "test_acc": 0.1, + "lyapunov": 1.9264679845336758, + "grad_norm": 0.11920770311136344, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 38.61845135688782 + }, + { + "epoch": 67, + "train_loss": 3.526273007965088, + "train_acc": 0.09544, + "test_loss": 2.3025852378845215, + "test_acc": 0.1, + "lyapunov": 1.9194827823687697, + "grad_norm": 0.08304121043671493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 38.626497983932495 + }, + { + "epoch": 68, + "train_loss": 3.5271414315795897, + "train_acc": 0.0966, + "test_loss": 2.3025850952148437, + "test_acc": 0.1, + "lyapunov": 1.9202514917344389, + "grad_norm": 0.08574615477087318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 38.627126693725586 + }, + { + "epoch": 69, + "train_loss": 3.529951874008179, + "train_acc": 0.0986, + "test_loss": 2.30258518447876, + "test_acc": 0.1, + "lyapunov": 1.9225430412365652, + "grad_norm": 0.08082947961897828, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 38.630186319351196 + }, + { + "epoch": 70, + "train_loss": 3.526535584869385, + "train_acc": 0.09668, + "test_loss": 2.3025852592468263, + "test_acc": 0.1, + "lyapunov": 1.919725867183617, + "grad_norm": 0.08274796493939703, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 38.6431679725647 + }, + { + "epoch": 71, + "train_loss": 3.5277945655822753, + "train_acc": 0.09836, + "test_loss": 2.3025853775024414, + "test_acc": 0.1, + "lyapunov": 1.920768865843868, + "grad_norm": 0.08235441909099428, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 38.63748812675476 + }, + { + "epoch": 72, + "train_loss": 3.5274662791442872, + "train_acc": 0.0948, + "test_loss": 2.3025851234436034, + "test_acc": 0.1, + "lyapunov": 1.9204377185963, + "grad_norm": 0.08364637794680509, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 38.6381402015686 + }, + { + "epoch": 73, + "train_loss": 3.526118115386963, + "train_acc": 0.09886, + "test_loss": 2.302585259628296, + "test_acc": 0.1, + "lyapunov": 1.9193554836160995, + "grad_norm": 0.0826562338509352, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 38.65567326545715 + }, + { + "epoch": 74, + "train_loss": 3.527300643615723, + "train_acc": 0.09764, + "test_loss": 2.302585151672363, + "test_acc": 0.1, + "lyapunov": 1.9203089323190168, + "grad_norm": 0.08128595818241462, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 38.65558409690857 + }, + { + "epoch": 75, + "train_loss": 3.52685251663208, + "train_acc": 0.09664, + "test_loss": 2.3025852661132813, + "test_acc": 0.1, + "lyapunov": 1.9200191327068201, + "grad_norm": 0.08404244166329763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 38.63766312599182 + }, + { + "epoch": 76, + "train_loss": 3.5262623787689207, + "train_acc": 0.09722, + "test_loss": 2.3025850158691408, + "test_acc": 0.1, + "lyapunov": 1.919482776271108, + "grad_norm": 0.08232879952859255, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 38.633180379867554 + }, + { + "epoch": 77, + "train_loss": 3.528319863128662, + "train_acc": 0.09596, + "test_loss": 2.3025850936889647, + "test_acc": 0.1, + "lyapunov": 1.9211895322555776, + "grad_norm": 0.08358594679641423, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 38.6444034576416 + }, + { + "epoch": 78, + "train_loss": 3.526455977935791, + "train_acc": 0.09646, + "test_loss": 2.3025851753234865, + "test_acc": 0.1, + "lyapunov": 1.919646045740913, + "grad_norm": 0.0800944099425941, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 38.63438820838928 + }, + { + "epoch": 79, + "train_loss": 3.528594108276367, + "train_acc": 0.09844, + "test_loss": 2.302585315704346, + "test_acc": 0.1, + "lyapunov": 1.9213674385529345, + "grad_norm": 0.0823521435571041, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 38.63344979286194 + }, + { + "epoch": 80, + "train_loss": 3.5273741276550292, + "train_acc": 0.09784, + "test_loss": 2.3025850051879884, + "test_acc": 0.1, + "lyapunov": 1.9203915013681592, + "grad_norm": 0.0830759912493753, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 38.62626814842224 + }, + { + "epoch": 81, + "train_loss": 3.5291355400848388, + "train_acc": 0.09736, + "test_loss": 2.3025851634979246, + "test_acc": 0.1, + "lyapunov": 1.921823484818344, + "grad_norm": 0.08275874029214267, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 38.62844204902649 + }, + { + "epoch": 82, + "train_loss": 3.525912507019043, + "train_acc": 0.09748, + "test_loss": 2.3025852321624756, + "test_acc": 0.1, + "lyapunov": 1.91920463874212, + "grad_norm": 0.08153852660653182, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 38.653265714645386 + }, + { + "epoch": 83, + "train_loss": 3.5292207734680177, + "train_acc": 0.0958, + "test_loss": 2.3025851135253905, + "test_acc": 0.1, + "lyapunov": 1.9219502158786939, + "grad_norm": 0.08350888633092267, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 38.634111642837524 + }, + { + "epoch": 84, + "train_loss": 3.5284012381744385, + "train_acc": 0.09624, + "test_loss": 2.30258512878418, + "test_acc": 0.1, + "lyapunov": 1.9212511674217556, + "grad_norm": 0.08116909186786311, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 38.64353036880493 + }, + { + "epoch": 85, + "train_loss": 3.5251765769195558, + "train_acc": 0.09792, + "test_loss": 2.30258514251709, + "test_acc": 0.1, + "lyapunov": 1.918617296401802, + "grad_norm": 0.07954191314548852, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 38.62560677528381 + }, + { + "epoch": 86, + "train_loss": 3.5287663554382322, + "train_acc": 0.09838, + "test_loss": 2.302585173034668, + "test_acc": 0.1, + "lyapunov": 1.9215295982482794, + "grad_norm": 0.08355699198177892, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 38.65434241294861 + }, + { + "epoch": 87, + "train_loss": 3.5260034490966796, + "train_acc": 0.09604, + "test_loss": 2.3025851554870607, + "test_acc": 0.1, + "lyapunov": 1.9192945807791122, + "grad_norm": 0.08149215014053633, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 38.63465094566345 + }, + { + "epoch": 88, + "train_loss": 3.5243265664672854, + "train_acc": 0.09828, + "test_loss": 2.302585033416748, + "test_acc": 0.1, + "lyapunov": 1.9179029281791824, + "grad_norm": 0.08154521467921626, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 38.6289963722229 + }, + { + "epoch": 89, + "train_loss": 3.5287904942321777, + "train_acc": 0.09666, + "test_loss": 2.302585191345215, + "test_acc": 0.1, + "lyapunov": 1.9215726117648737, + "grad_norm": 0.084132595254172, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 38.642388105392456 + }, + { + "epoch": 90, + "train_loss": 3.526969603881836, + "train_acc": 0.09754, + "test_loss": 2.302585014343262, + "test_acc": 0.1, + "lyapunov": 1.920039845549542, + "grad_norm": 0.0821271686806539, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 38.63814377784729 + }, + { + "epoch": 91, + "train_loss": 3.527617153930664, + "train_acc": 0.09638, + "test_loss": 2.302585041809082, + "test_acc": 0.1, + "lyapunov": 1.9205815706716474, + "grad_norm": 0.08312510555513332, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 38.61940360069275 + }, + { + "epoch": 92, + "train_loss": 3.5268433947753905, + "train_acc": 0.09684, + "test_loss": 2.3025852138519287, + "test_acc": 0.1, + "lyapunov": 1.9199492108181615, + "grad_norm": 0.0823876986166593, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 38.627458810806274 + }, + { + "epoch": 93, + "train_loss": 3.53038783744812, + "train_acc": 0.0982, + "test_loss": 2.3025850196838378, + "test_acc": 0.1, + "lyapunov": 1.9228984605320885, + "grad_norm": 0.08263085862758328, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 38.63483691215515 + }, + { + "epoch": 94, + "train_loss": 3.5289703980255127, + "train_acc": 0.09816, + "test_loss": 2.3025850566864015, + "test_acc": 0.1, + "lyapunov": 1.9216854218631754, + "grad_norm": 0.08327210271669083, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 38.63469362258911 + }, + { + "epoch": 95, + "train_loss": 3.5277647956848144, + "train_acc": 0.0995, + "test_loss": 2.3025852081298828, + "test_acc": 0.1, + "lyapunov": 1.9207559202028357, + "grad_norm": 0.08352486265414892, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 38.64616012573242 + }, + { + "epoch": 96, + "train_loss": 3.526619141845703, + "train_acc": 0.09938, + "test_loss": 2.3025851345062254, + "test_acc": 0.1, + "lyapunov": 1.9198539360709812, + "grad_norm": 0.08098182122024891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 38.62220072746277 + }, + { + "epoch": 97, + "train_loss": 3.5280892516326903, + "train_acc": 0.1, + "test_loss": 2.3025852352142335, + "test_acc": 0.1, + "lyapunov": 1.921060741100165, + "grad_norm": 0.08211810367594433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 38.645119190216064 + }, + { + "epoch": 98, + "train_loss": 3.5287079336547853, + "train_acc": 0.1, + "test_loss": 2.3025850273132322, + "test_acc": 0.1, + "lyapunov": 1.9215380800959398, + "grad_norm": 0.08325515946558669, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 38.63027763366699 + }, + { + "epoch": 99, + "train_loss": 3.5253015606689453, + "train_acc": 0.1, + "test_loss": 2.30258511428833, + "test_acc": 0.1, + "lyapunov": 1.9187132022569857, + "grad_norm": 0.08193671483030009, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 38.63921046257019 + }, + { + "epoch": 100, + "train_loss": 3.5272140621948243, + "train_acc": 0.1, + "test_loss": 2.302585135269165, + "test_acc": 0.1, + "lyapunov": 1.9202767503840843, + "grad_norm": 0.08222655054617872, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 38.6323139667511 + } + ], + "8": [ + { + "epoch": 1, + "train_loss": 8.479881681365967, + "train_acc": 0.15672, + "test_loss": 2.162619204711914, + "test_acc": 0.2125, + "lyapunov": 4.108346384199684, + "grad_norm": 7.697098833505723, + "grad_max_sv": 6.178906440734863, + "grad_min_sv": 2.761631513692464e-07, + "grad_condition": 23140136.221944965, + "lr": 0.0009997532801828658, + "time_sec": 81.47396469116211 + }, + { + "epoch": 2, + "train_loss": 5.665244631958008, + "train_acc": 0.18, + "test_loss": 2.1842808677673338, + "test_acc": 0.1923, + "lyapunov": 3.230283256686862, + "grad_norm": 5.392009012742897, + "grad_max_sv": 4.110089653730393, + "grad_min_sv": 1.9321651976156317e-07, + "grad_condition": 21420475.323837068, + "lr": 0.0009990133642141358, + "time_sec": 81.45991396903992 + }, + { + "epoch": 3, + "train_loss": 5.333162035522461, + "train_acc": 0.1952, + "test_loss": 2.225303956604004, + "test_acc": 0.167, + "lyapunov": 3.1082111679379594, + "grad_norm": 3.851771920219555, + "grad_max_sv": 3.176962560415268, + "grad_min_sv": 1.3438213457561688e-07, + "grad_condition": 23879291.498504233, + "lr": 0.00099778098230154, + "time_sec": 81.46788787841797 + }, + { + "epoch": 4, + "train_loss": 5.171234805908203, + "train_acc": 0.20002, + "test_loss": 2.235258939361572, + "test_acc": 0.159, + "lyapunov": 3.0473744570446746, + "grad_norm": 2.481126294013876, + "grad_max_sv": 2.0792742133140565, + "grad_min_sv": 8.9392968050106e-08, + "grad_condition": 24637829.84704242, + "lr": 0.000996057350657239, + "time_sec": 81.47967004776001 + }, + { + "epoch": 5, + "train_loss": 5.166805406799316, + "train_acc": 0.19452, + "test_loss": 2.237046794128418, + "test_acc": 0.1327, + "lyapunov": 3.0511742223559133, + "grad_norm": 1.3615579983642885, + "grad_max_sv": 1.0548206314444541, + "grad_min_sv": 4.5490313116403056e-08, + "grad_condition": 23987300.59429905, + "lr": 0.0009938441702975688, + "time_sec": 81.459157705307 + }, + { + "epoch": 6, + "train_loss": 4.8697237976074215, + "train_acc": 0.1737, + "test_loss": 2.2830872146606445, + "test_acc": 0.1253, + "lyapunov": 2.8754516471072535, + "grad_norm": 0.6903867745940513, + "grad_max_sv": 0.41943032629787924, + "grad_min_sv": 1.919375629544362e-08, + "grad_condition": 22192013.87340497, + "lr": 0.0009911436253643444, + "time_sec": 81.48192954063416 + }, + { + "epoch": 7, + "train_loss": 4.493588522949219, + "train_acc": 0.15938, + "test_loss": 2.3302653469085692, + "test_acc": 0.1, + "lyapunov": 2.653091859939458, + "grad_norm": 0.7557218960403191, + "grad_max_sv": 0.26077940948307515, + "grad_min_sv": 1.0986899512399616e-08, + "grad_condition": 25117189.859535195, + "lr": 0.0009879583809693736, + "time_sec": 81.4841628074646 + }, + { + "epoch": 8, + "train_loss": 4.350341845397949, + "train_acc": 0.15252, + "test_loss": 2.3086660652160647, + "test_acc": 0.1, + "lyapunov": 2.5555299291830234, + "grad_norm": 0.6250628446482196, + "grad_max_sv": 0.20942260958254338, + "grad_min_sv": 7.251302003297155e-09, + "grad_condition": 30522570.970140863, + "lr": 0.0009842915805643154, + "time_sec": 81.46237683296204 + }, + { + "epoch": 9, + "train_loss": 4.145118522186279, + "train_acc": 0.13274, + "test_loss": 2.315164138031006, + "test_acc": 0.1, + "lyapunov": 2.40533269762688, + "grad_norm": 0.6205908073118289, + "grad_max_sv": 0.14447018823120744, + "grad_min_sv": 4.4057232563565755e-09, + "grad_condition": 34238562.93985257, + "lr": 0.0009801468428384714, + "time_sec": 81.4730293750763 + }, + { + "epoch": 10, + "train_loss": 4.078840268859863, + "train_acc": 0.1284, + "test_loss": 2.3138900623321534, + "test_acc": 0.1, + "lyapunov": 2.363016066343888, + "grad_norm": 0.7930843872612708, + "grad_max_sv": 0.10398251404985785, + "grad_min_sv": 3.7019540950061767e-09, + "grad_condition": 60913515.913623154, + "lr": 0.0009755282581475767, + "time_sec": 81.45200657844543 + }, + { + "epoch": 11, + "train_loss": 4.092224692230225, + "train_acc": 0.1466, + "test_loss": 2.312975662994385, + "test_acc": 0.1, + "lyapunov": 2.3754844513085795, + "grad_norm": 1.1984655112922225, + "grad_max_sv": 0.17450910471379757, + "grad_min_sv": 5.5799074860640734e-09, + "grad_condition": 13168082812.37189, + "lr": 0.0009704403844771127, + "time_sec": 81.45421433448792 + }, + { + "epoch": 12, + "train_loss": 4.142614550323486, + "train_acc": 0.10048, + "test_loss": 2.3073625778198243, + "test_acc": 0.1, + "lyapunov": 2.36521298623146, + "grad_norm": 0.8201455961321854, + "grad_max_sv": 0.06452706009149552, + "grad_min_sv": 1.4042129118228878e-12, + "grad_condition": 50885083514.90724, + "lr": 0.0009648882429441257, + "time_sec": 81.46072387695312 + }, + { + "epoch": 13, + "train_loss": 3.979385091934204, + "train_acc": 0.10066, + "test_loss": 2.3081630187988282, + "test_acc": 0.1, + "lyapunov": 2.26381984696059, + "grad_norm": 0.16210184952823345, + "grad_max_sv": 0.04905642978847027, + "grad_min_sv": 2.7241308859756593e-12, + "grad_condition": 39268609789.13625, + "lr": 0.0009588773128419905, + "time_sec": 81.4600670337677 + }, + { + "epoch": 14, + "train_loss": 4.013840252990723, + "train_acc": 0.09774, + "test_loss": 2.3071225547790526, + "test_acc": 0.1, + "lyapunov": 2.2779995590219717, + "grad_norm": 0.2350799590612887, + "grad_max_sv": 0.03584399004466832, + "grad_min_sv": 2.4371194341884142e-11, + "grad_condition": 24256890299.017464, + "lr": 0.0009524135262330098, + "time_sec": 81.45963406562805 + }, + { + "epoch": 15, + "train_loss": 3.9913157040405274, + "train_acc": 0.09784, + "test_loss": 2.319146055984497, + "test_acc": 0.1, + "lyapunov": 2.268958825894329, + "grad_norm": 0.15763925383129676, + "grad_max_sv": 0.009183965646661818, + "grad_min_sv": 1.97946225383161e-12, + "grad_condition": 8163098832.376617, + "lr": 0.0009455032620941839, + "time_sec": 81.44594478607178 + }, + { + "epoch": 16, + "train_loss": 3.9718331854248046, + "train_acc": 0.0996, + "test_loss": 2.3092525833129884, + "test_acc": 0.1, + "lyapunov": 2.2586230457286396, + "grad_norm": 0.11766352456542575, + "grad_max_sv": 0.006989215174689889, + "grad_min_sv": 2.4024430389645366e-14, + "grad_condition": 6504081924.260536, + "lr": 0.0009381533400219318, + "time_sec": 81.44390797615051 + }, + { + "epoch": 17, + "train_loss": 3.9787883277130125, + "train_acc": 0.09702, + "test_loss": 2.3043574817657473, + "test_acc": 0.1, + "lyapunov": 2.2631307922665727, + "grad_norm": 0.1527010207412437, + "grad_max_sv": 0.009803948854096235, + "grad_min_sv": 1.4435005241224427e-33, + "grad_condition": 9803948854.096233, + "lr": 0.0009303710135019719, + "time_sec": 81.43403100967407 + }, + { + "epoch": 18, + "train_loss": 3.9913615090942383, + "train_acc": 0.09744, + "test_loss": 2.3033508323669434, + "test_acc": 0.1, + "lyapunov": 2.269262256524752, + "grad_norm": 0.11184179273021279, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009221639627510076, + "time_sec": 81.42399740219116 + }, + { + "epoch": 19, + "train_loss": 3.9763801429748535, + "train_acc": 0.0977, + "test_loss": 2.3026752422332764, + "test_acc": 0.1, + "lyapunov": 2.2619051079615913, + "grad_norm": 0.11713248666386221, + "grad_max_sv": 0.000484072370454669, + "grad_min_sv": 0.0, + "grad_condition": 484072370.454669, + "lr": 0.000913540287137281, + "time_sec": 81.4525249004364 + }, + { + "epoch": 20, + "train_loss": 3.976750040283203, + "train_acc": 0.09734, + "test_loss": 2.302591667175293, + "test_acc": 0.1, + "lyapunov": 2.262148560770332, + "grad_norm": 0.11345857984491753, + "grad_max_sv": 0.004815328773111105, + "grad_min_sv": 7.298523316195025e-36, + "grad_condition": 4815328773.111105, + "lr": 0.0009045084971874739, + "time_sec": 81.51628756523132 + }, + { + "epoch": 21, + "train_loss": 3.980269993438721, + "train_acc": 0.09802, + "test_loss": 2.302587752532959, + "test_acc": 0.1, + "lyapunov": 2.264334798164075, + "grad_norm": 0.13684662833237576, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008950775061878452, + "time_sec": 81.45560097694397 + }, + { + "epoch": 22, + "train_loss": 3.9804648877716065, + "train_acc": 0.0979, + "test_loss": 2.302587752532959, + "test_acc": 0.1, + "lyapunov": 2.2635294013011182, + "grad_norm": 0.13344079799844585, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878947, + "time_sec": 81.44366526603699 + }, + { + "epoch": 23, + "train_loss": 3.9813251597595216, + "train_acc": 0.09872, + "test_loss": 2.302596923828125, + "test_acc": 0.1, + "lyapunov": 2.264318755825462, + "grad_norm": 0.11240815342914404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008750555348152298, + "time_sec": 81.4700722694397 + }, + { + "epoch": 24, + "train_loss": 3.9829969465637207, + "train_acc": 0.09762, + "test_loss": 2.302590003967285, + "test_acc": 0.1, + "lyapunov": 2.2655306484388267, + "grad_norm": 0.13657445352154945, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107057, + "time_sec": 81.44092345237732 + }, + { + "epoch": 25, + "train_loss": 3.9867445934295653, + "train_acc": 0.09768, + "test_loss": 2.3025884731292723, + "test_acc": 0.1, + "lyapunov": 2.2683042187215117, + "grad_norm": 0.13504220620651136, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008535533905932737, + "time_sec": 81.44885325431824 + }, + { + "epoch": 26, + "train_loss": 4.011947896575927, + "train_acc": 0.09772, + "test_loss": 2.302588147735596, + "test_acc": 0.1, + "lyapunov": 2.2796514083052535, + "grad_norm": 0.16320303411181733, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643444, + "time_sec": 81.45354628562927 + }, + { + "epoch": 27, + "train_loss": 3.9786824931335447, + "train_acc": 0.09896, + "test_loss": 2.302594832611084, + "test_acc": 0.1, + "lyapunov": 2.26323458300832, + "grad_norm": 0.10988564477689002, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008306559326618259, + "time_sec": 81.44628882408142 + }, + { + "epoch": 28, + "train_loss": 3.977536257247925, + "train_acc": 0.098, + "test_loss": 2.302598391723633, + "test_acc": 0.1, + "lyapunov": 2.262441022926584, + "grad_norm": 0.12595116922261335, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 81.4543764591217 + }, + { + "epoch": 29, + "train_loss": 3.976567816162109, + "train_acc": 0.09876, + "test_loss": 2.302590633010864, + "test_acc": 0.1, + "lyapunov": 2.2617232262935785, + "grad_norm": 0.11663224483129596, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008064535268264883, + "time_sec": 81.45405316352844 + }, + { + "epoch": 30, + "train_loss": 3.98611599609375, + "train_acc": 0.09902, + "test_loss": 2.302588882827759, + "test_acc": 0.1, + "lyapunov": 2.268034580723404, + "grad_norm": 0.12156603788402341, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462367, + "time_sec": 81.43305087089539 + }, + { + "epoch": 31, + "train_loss": 3.973400810546875, + "train_acc": 0.09778, + "test_loss": 2.3025912315368653, + "test_acc": 0.1, + "lyapunov": 2.259550383633665, + "grad_norm": 0.11416147448139306, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 81.45837593078613 + }, + { + "epoch": 32, + "train_loss": 3.988133301086426, + "train_acc": 0.0974, + "test_loss": 2.3025894966125486, + "test_acc": 0.1, + "lyapunov": 2.2669999562870817, + "grad_norm": 0.11056723038790034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 81.44456076622009 + }, + { + "epoch": 33, + "train_loss": 4.005648225860596, + "train_acc": 0.09582, + "test_loss": 2.302590217590332, + "test_acc": 0.1, + "lyapunov": 2.2759649180390342, + "grad_norm": 0.15627582965327647, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 81.45507860183716 + }, + { + "epoch": 34, + "train_loss": 3.979487621154785, + "train_acc": 0.09842, + "test_loss": 2.3025886589050293, + "test_acc": 0.1, + "lyapunov": 2.2636950528225324, + "grad_norm": 0.11766964677730013, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 81.40873432159424 + }, + { + "epoch": 35, + "train_loss": 3.9761420146942137, + "train_acc": 0.09734, + "test_loss": 2.3025886192321776, + "test_acc": 0.1, + "lyapunov": 2.2615554509565348, + "grad_norm": 0.13516175590778773, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 81.41994976997375 + }, + { + "epoch": 36, + "train_loss": 3.982365760269165, + "train_acc": 0.09772, + "test_loss": 2.302588511276245, + "test_acc": 0.1, + "lyapunov": 2.2654811189607584, + "grad_norm": 0.11681074828605718, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 81.44073605537415 + }, + { + "epoch": 37, + "train_loss": 4.0145159342956545, + "train_acc": 0.09844, + "test_loss": 2.3025877605438234, + "test_acc": 0.1, + "lyapunov": 2.279959214617834, + "grad_norm": 0.16927419652036743, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 81.44942951202393 + }, + { + "epoch": 38, + "train_loss": 3.9834751657104492, + "train_acc": 0.0988, + "test_loss": 2.3025879089355468, + "test_acc": 0.1, + "lyapunov": 2.26584634939423, + "grad_norm": 0.14984272020285577, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 81.45499515533447 + }, + { + "epoch": 39, + "train_loss": 4.02413849609375, + "train_acc": 0.09734, + "test_loss": 2.30258787689209, + "test_acc": 0.1, + "lyapunov": 2.286009701316619, + "grad_norm": 0.22145868959770007, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 81.45317363739014 + }, + { + "epoch": 40, + "train_loss": 3.9736411520385744, + "train_acc": 0.09894, + "test_loss": 2.3025887702941894, + "test_acc": 0.1, + "lyapunov": 2.259992800710146, + "grad_norm": 0.08893647577966153, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 81.45592546463013 + }, + { + "epoch": 41, + "train_loss": 3.976674521484375, + "train_acc": 0.09844, + "test_loss": 2.302586205673218, + "test_acc": 0.1, + "lyapunov": 2.262093958647355, + "grad_norm": 0.09526075366227103, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 81.4629635810852 + }, + { + "epoch": 42, + "train_loss": 3.9767224240112307, + "train_acc": 0.09934, + "test_loss": 2.3025863662719726, + "test_acc": 0.1, + "lyapunov": 2.2621575853098994, + "grad_norm": 0.0889728077319319, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 81.4452486038208 + }, + { + "epoch": 43, + "train_loss": 3.9843084770202637, + "train_acc": 0.0983, + "test_loss": 2.302587857055664, + "test_acc": 0.1, + "lyapunov": 2.266823678980093, + "grad_norm": 0.14286833201945623, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 81.46053290367126 + }, + { + "epoch": 44, + "train_loss": 3.978666923828125, + "train_acc": 0.09862, + "test_loss": 2.302588472366333, + "test_acc": 0.1, + "lyapunov": 2.262758489764865, + "grad_norm": 0.10285858309556797, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 81.4441590309143 + }, + { + "epoch": 45, + "train_loss": 3.984368924102783, + "train_acc": 0.09714, + "test_loss": 2.3025872661590574, + "test_acc": 0.1, + "lyapunov": 2.2663481009890662, + "grad_norm": 0.11152947980914625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 81.43797850608826 + }, + { + "epoch": 46, + "train_loss": 3.9835290453338623, + "train_acc": 0.09794, + "test_loss": 2.302588889694214, + "test_acc": 0.1, + "lyapunov": 2.2661942069792684, + "grad_norm": 0.12155880302110986, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 81.4439845085144 + }, + { + "epoch": 47, + "train_loss": 3.976571675872803, + "train_acc": 0.09746, + "test_loss": 2.302587047958374, + "test_acc": 0.1, + "lyapunov": 2.262034943646482, + "grad_norm": 0.09434388559512244, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 81.44648504257202 + }, + { + "epoch": 48, + "train_loss": 3.978961787414551, + "train_acc": 0.09674, + "test_loss": 2.302586452484131, + "test_acc": 0.1, + "lyapunov": 2.2636160929794507, + "grad_norm": 0.09388300184277713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 81.50625872612 + }, + { + "epoch": 49, + "train_loss": 3.9766515798950195, + "train_acc": 0.09856, + "test_loss": 2.302586361694336, + "test_acc": 0.1, + "lyapunov": 2.2621047679725512, + "grad_norm": 0.08611192583269686, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 81.42919588088989 + }, + { + "epoch": 50, + "train_loss": 3.9754750718688965, + "train_acc": 0.09614, + "test_loss": 2.302587022018433, + "test_acc": 0.1, + "lyapunov": 2.261166003049182, + "grad_norm": 0.09585057441328976, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 81.43738746643066 + }, + { + "epoch": 51, + "train_loss": 3.9752406224823, + "train_acc": 0.09726, + "test_loss": 2.302586801147461, + "test_acc": 0.1, + "lyapunov": 2.2611102423704494, + "grad_norm": 0.09095072097377155, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 81.45784163475037 + }, + { + "epoch": 52, + "train_loss": 3.98188600982666, + "train_acc": 0.0951, + "test_loss": 2.302586806488037, + "test_acc": 0.1, + "lyapunov": 2.265076126893768, + "grad_norm": 0.1123738428492386, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 81.47153091430664 + }, + { + "epoch": 53, + "train_loss": 3.980596968536377, + "train_acc": 0.0976, + "test_loss": 2.3025859146118166, + "test_acc": 0.1, + "lyapunov": 2.2645553932775315, + "grad_norm": 0.1076773200596488, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 81.44375872612 + }, + { + "epoch": 54, + "train_loss": 3.9776349996948244, + "train_acc": 0.09706, + "test_loss": 2.3025868438720702, + "test_acc": 0.1, + "lyapunov": 2.2628720568878875, + "grad_norm": 0.08828239082049001, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 81.42411518096924 + }, + { + "epoch": 55, + "train_loss": 3.9808822979736327, + "train_acc": 0.09588, + "test_loss": 2.302585488128662, + "test_acc": 0.1, + "lyapunov": 2.2643827629821076, + "grad_norm": 0.11262628002715089, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 81.4528546333313 + }, + { + "epoch": 56, + "train_loss": 3.974801806488037, + "train_acc": 0.09592, + "test_loss": 2.3025861625671387, + "test_acc": 0.1, + "lyapunov": 2.2608287944208327, + "grad_norm": 0.09195483599034024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 81.44676446914673 + }, + { + "epoch": 57, + "train_loss": 3.976495365371704, + "train_acc": 0.09736, + "test_loss": 2.3025858879089354, + "test_acc": 0.1, + "lyapunov": 2.262001718096721, + "grad_norm": 0.08361845913085657, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 81.45348882675171 + }, + { + "epoch": 58, + "train_loss": 3.980894155731201, + "train_acc": 0.09842, + "test_loss": 2.3025855281829832, + "test_acc": 0.1, + "lyapunov": 2.2647068646862683, + "grad_norm": 0.11991605921354555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 81.47408199310303 + }, + { + "epoch": 59, + "train_loss": 3.994586195449829, + "train_acc": 0.0973, + "test_loss": 2.3025854663848877, + "test_acc": 0.1, + "lyapunov": 2.27294464672313, + "grad_norm": 0.18222829815312913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 81.44711089134216 + }, + { + "epoch": 60, + "train_loss": 3.9781198291015625, + "train_acc": 0.09658, + "test_loss": 2.3025856033325196, + "test_acc": 0.1, + "lyapunov": 2.263154449365328, + "grad_norm": 0.08448254246697348, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 81.44161295890808 + }, + { + "epoch": 61, + "train_loss": 4.02450031616211, + "train_acc": 0.0976, + "test_loss": 2.302585502624512, + "test_acc": 0.1, + "lyapunov": 2.286170544831649, + "grad_norm": 0.23432897685131301, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 81.45745611190796 + }, + { + "epoch": 62, + "train_loss": 3.988269701385498, + "train_acc": 0.09688, + "test_loss": 2.3025854175567626, + "test_acc": 0.1, + "lyapunov": 2.267505117084669, + "grad_norm": 0.10764931064603923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 81.45787954330444 + }, + { + "epoch": 63, + "train_loss": 3.9736854934692385, + "train_acc": 0.09646, + "test_loss": 2.3025857013702393, + "test_acc": 0.1, + "lyapunov": 2.2600014398774833, + "grad_norm": 0.08382317206831051, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 81.44196057319641 + }, + { + "epoch": 64, + "train_loss": 3.9797292990875244, + "train_acc": 0.0969, + "test_loss": 2.3025853332519532, + "test_acc": 0.1, + "lyapunov": 2.264177340680681, + "grad_norm": 0.11933485737211565, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 81.45828652381897 + }, + { + "epoch": 65, + "train_loss": 3.9763733405303956, + "train_acc": 0.097, + "test_loss": 2.3025854026794432, + "test_acc": 0.1, + "lyapunov": 2.2618614468733065, + "grad_norm": 0.08601466707594763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 81.44515085220337 + }, + { + "epoch": 66, + "train_loss": 4.001672252197266, + "train_acc": 0.09836, + "test_loss": 2.302585359954834, + "test_acc": 0.1, + "lyapunov": 2.276178054492492, + "grad_norm": 0.19097066416551475, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 81.44997453689575 + }, + { + "epoch": 67, + "train_loss": 3.983064818649292, + "train_acc": 0.09848, + "test_loss": 2.302585221862793, + "test_acc": 0.1, + "lyapunov": 2.2660030678410052, + "grad_norm": 0.11726894505680324, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 81.45755219459534 + }, + { + "epoch": 68, + "train_loss": 3.9874353774261473, + "train_acc": 0.09726, + "test_loss": 2.302585542297363, + "test_acc": 0.1, + "lyapunov": 2.26753244497587, + "grad_norm": 0.1096052061821724, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 81.45092463493347 + }, + { + "epoch": 69, + "train_loss": 3.984990802612305, + "train_acc": 0.09842, + "test_loss": 2.3025853466033936, + "test_acc": 0.1, + "lyapunov": 2.2674437922894803, + "grad_norm": 0.08538883278176537, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 81.44036960601807 + }, + { + "epoch": 70, + "train_loss": 3.9768560768127443, + "train_acc": 0.09864, + "test_loss": 2.3025853176116944, + "test_acc": 0.1, + "lyapunov": 2.262266612113894, + "grad_norm": 0.0826759570118499, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 81.44237995147705 + }, + { + "epoch": 71, + "train_loss": 3.97729412109375, + "train_acc": 0.09838, + "test_loss": 2.3025852783203127, + "test_acc": 0.1, + "lyapunov": 2.262566337195199, + "grad_norm": 0.08149339121565821, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 81.46553111076355 + }, + { + "epoch": 72, + "train_loss": 3.999013508300781, + "train_acc": 0.09792, + "test_loss": 2.3025853332519532, + "test_acc": 0.1, + "lyapunov": 2.2738718602358534, + "grad_norm": 0.15690481475260892, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 81.440505027771 + }, + { + "epoch": 73, + "train_loss": 3.9769914697265625, + "train_acc": 0.09758, + "test_loss": 2.302585132598877, + "test_acc": 0.1, + "lyapunov": 2.262345004264656, + "grad_norm": 0.08468511131490652, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 81.45508050918579 + }, + { + "epoch": 74, + "train_loss": 3.9735559133148195, + "train_acc": 0.09684, + "test_loss": 2.302585078430176, + "test_acc": 0.1, + "lyapunov": 2.2599204360981426, + "grad_norm": 0.08407853053475459, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 81.43686723709106 + }, + { + "epoch": 75, + "train_loss": 3.975616183166504, + "train_acc": 0.09758, + "test_loss": 2.302585101699829, + "test_acc": 0.1, + "lyapunov": 2.2613788644980897, + "grad_norm": 0.08410718060667108, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 81.46202492713928 + }, + { + "epoch": 76, + "train_loss": 3.9777969396972654, + "train_acc": 0.09642, + "test_loss": 2.302585230255127, + "test_acc": 0.1, + "lyapunov": 2.262849387000589, + "grad_norm": 0.08412741392957411, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 81.69426202774048 + }, + { + "epoch": 77, + "train_loss": 3.997583436126709, + "train_acc": 0.09804, + "test_loss": 2.3025851612091066, + "test_acc": 0.1, + "lyapunov": 2.272977476534636, + "grad_norm": 0.19693507091470583, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 81.47962164878845 + }, + { + "epoch": 78, + "train_loss": 3.981567749633789, + "train_acc": 0.0972, + "test_loss": 2.302585176086426, + "test_acc": 0.1, + "lyapunov": 2.2653762513719253, + "grad_norm": 0.08819478927352292, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 81.44144415855408 + }, + { + "epoch": 79, + "train_loss": 3.979712967529297, + "train_acc": 0.09928, + "test_loss": 2.3025852310180666, + "test_acc": 0.1, + "lyapunov": 2.2640710157506607, + "grad_norm": 0.10900387268878003, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 81.44691228866577 + }, + { + "epoch": 80, + "train_loss": 3.9752784634399414, + "train_acc": 0.09612, + "test_loss": 2.3025851806640625, + "test_acc": 0.1, + "lyapunov": 2.2611999310495907, + "grad_norm": 0.08485114515050625, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 81.44573497772217 + }, + { + "epoch": 81, + "train_loss": 3.973998136444092, + "train_acc": 0.09674, + "test_loss": 2.302585205078125, + "test_acc": 0.1, + "lyapunov": 2.2602438634009006, + "grad_norm": 0.08193297107495977, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 81.44051194190979 + }, + { + "epoch": 82, + "train_loss": 3.9795581608581543, + "train_acc": 0.0974, + "test_loss": 2.3025851707458496, + "test_acc": 0.1, + "lyapunov": 2.2642151602088947, + "grad_norm": 0.08382214616673372, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 81.44579362869263 + }, + { + "epoch": 83, + "train_loss": 3.97544639793396, + "train_acc": 0.0975, + "test_loss": 2.3025851676940916, + "test_acc": 0.1, + "lyapunov": 2.261258240550985, + "grad_norm": 0.0830598190151241, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 81.46574568748474 + }, + { + "epoch": 84, + "train_loss": 3.9764262825775147, + "train_acc": 0.09818, + "test_loss": 2.302585060119629, + "test_acc": 0.1, + "lyapunov": 2.2619712322264376, + "grad_norm": 0.08369246247456191, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 81.45664143562317 + }, + { + "epoch": 85, + "train_loss": 3.9776910205078124, + "train_acc": 0.0955, + "test_loss": 2.3025851593017577, + "test_acc": 0.1, + "lyapunov": 2.2629058550080985, + "grad_norm": 0.08247891269837844, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 81.461270570755 + }, + { + "epoch": 86, + "train_loss": 3.9771215029907228, + "train_acc": 0.09536, + "test_loss": 2.3025850746154783, + "test_acc": 0.1, + "lyapunov": 2.2625219870711226, + "grad_norm": 0.08304329059000737, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 81.45261931419373 + }, + { + "epoch": 87, + "train_loss": 3.9780111279296877, + "train_acc": 0.09718, + "test_loss": 2.3025850124359133, + "test_acc": 0.1, + "lyapunov": 2.263096221572603, + "grad_norm": 0.08168556680409891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 81.47083902359009 + }, + { + "epoch": 88, + "train_loss": 3.975586996154785, + "train_acc": 0.09506, + "test_loss": 2.3025851093292236, + "test_acc": 0.1, + "lyapunov": 2.261420638360026, + "grad_norm": 0.08585199329222436, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 81.46594524383545 + }, + { + "epoch": 89, + "train_loss": 3.9770257449340822, + "train_acc": 0.0982, + "test_loss": 2.3025851146698, + "test_acc": 0.1, + "lyapunov": 2.262422331153889, + "grad_norm": 0.08469063518506169, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 81.46577405929565 + }, + { + "epoch": 90, + "train_loss": 3.973931856689453, + "train_acc": 0.09746, + "test_loss": 2.3025850677490234, + "test_acc": 0.1, + "lyapunov": 2.2602365346210997, + "grad_norm": 0.08267580569635262, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 81.45771622657776 + }, + { + "epoch": 91, + "train_loss": 3.9777387670898436, + "train_acc": 0.09732, + "test_loss": 2.3025851654052736, + "test_acc": 0.1, + "lyapunov": 2.262757078765908, + "grad_norm": 0.10473963211370652, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 81.46830105781555 + }, + { + "epoch": 92, + "train_loss": 3.973895709075928, + "train_acc": 0.09754, + "test_loss": 2.302585176086426, + "test_acc": 0.1, + "lyapunov": 2.2601819568887698, + "grad_norm": 0.08524438116449506, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 81.45872473716736 + }, + { + "epoch": 93, + "train_loss": 3.975780742340088, + "train_acc": 0.09832, + "test_loss": 2.302585258483887, + "test_acc": 0.1, + "lyapunov": 2.261494060916364, + "grad_norm": 0.08296746372602809, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 81.44344329833984 + }, + { + "epoch": 94, + "train_loss": 3.9749393853759765, + "train_acc": 0.099, + "test_loss": 2.3025851181030275, + "test_acc": 0.1, + "lyapunov": 2.2609141049787516, + "grad_norm": 0.081703214219651, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 81.47197723388672 + }, + { + "epoch": 95, + "train_loss": 3.977360173110962, + "train_acc": 0.09844, + "test_loss": 2.3025852035522463, + "test_acc": 0.1, + "lyapunov": 2.2626446403200973, + "grad_norm": 0.08370580659845218, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 81.4649875164032 + }, + { + "epoch": 96, + "train_loss": 3.9748195641326904, + "train_acc": 0.09918, + "test_loss": 2.3025851348876953, + "test_acc": 0.1, + "lyapunov": 2.2608655974688125, + "grad_norm": 0.08506351899121649, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 81.45548796653748 + }, + { + "epoch": 97, + "train_loss": 3.977184408874512, + "train_acc": 0.09888, + "test_loss": 2.3025851238250734, + "test_acc": 0.1, + "lyapunov": 2.262512852163876, + "grad_norm": 0.08383579924614167, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 81.4503653049469 + }, + { + "epoch": 98, + "train_loss": 3.979651080627441, + "train_acc": 0.1, + "test_loss": 2.3025852249145506, + "test_acc": 0.1, + "lyapunov": 2.264271725778994, + "grad_norm": 0.08181479722385572, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 81.46501636505127 + }, + { + "epoch": 99, + "train_loss": 3.9744724880981446, + "train_acc": 0.1, + "test_loss": 2.302585131072998, + "test_acc": 0.1, + "lyapunov": 2.260578519547992, + "grad_norm": 0.08286890329554125, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 81.44538688659668 + }, + { + "epoch": 100, + "train_loss": 3.9755064764404295, + "train_acc": 0.1, + "test_loss": 2.302585161590576, + "test_acc": 0.1, + "lyapunov": 2.2613274374276475, + "grad_norm": 0.08253103448725845, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 81.44115138053894 + } + ], + "12": [ + { + "epoch": 1, + "train_loss": 11.514268187866211, + "train_acc": 0.12322, + "test_loss": 2.335220721435547, + "test_acc": 0.1082, + "lyapunov": 5.094494405609872, + "grad_norm": 6.68472372840091, + "grad_max_sv": 5.768041110038757, + "grad_min_sv": 2.425695402763495e-07, + "grad_condition": 23767971.115653183, + "lr": 0.0009997532801828658, + "time_sec": 124.28109288215637 + }, + { + "epoch": 2, + "train_loss": 6.767582432556153, + "train_acc": 0.13338, + "test_loss": 2.3135711360931395, + "test_acc": 0.1058, + "lyapunov": 3.703414491375389, + "grad_norm": 4.437490608687784, + "grad_max_sv": 3.688317948579788, + "grad_min_sv": 1.6068337682639822e-07, + "grad_condition": 23679624.47851156, + "lr": 0.0009990133642141358, + "time_sec": 124.28083038330078 + }, + { + "epoch": 3, + "train_loss": 6.359151521911621, + "train_acc": 0.1371, + "test_loss": 2.3046204761505127, + "test_acc": 0.1017, + "lyapunov": 3.53740519087028, + "grad_norm": 3.3992685611612004, + "grad_max_sv": 3.1906665176153184, + "grad_min_sv": 1.0806052515022202e-07, + "grad_condition": 30020073.39935509, + "lr": 0.00099778098230154, + "time_sec": 124.26130867004395 + }, + { + "epoch": 4, + "train_loss": 5.680015151367187, + "train_acc": 0.12346, + "test_loss": 2.4307143615722655, + "test_acc": 0.0946, + "lyapunov": 3.2194143725783015, + "grad_norm": 3.6284679983008856, + "grad_max_sv": 2.3083297662011844, + "grad_min_sv": 7.267783242878633e-08, + "grad_condition": 28802302.157710887, + "lr": 0.000996057350657239, + "time_sec": 124.2893226146698 + }, + { + "epoch": 5, + "train_loss": 5.515282614440918, + "train_acc": 0.11878, + "test_loss": 2.3333636627197265, + "test_acc": 0.0806, + "lyapunov": 3.1298821100493526, + "grad_norm": 2.1440857096164527, + "grad_max_sv": 1.8293321043252946, + "grad_min_sv": 6.11613814704981e-08, + "grad_condition": 30298382.919277746, + "lr": 0.0009938441702975688, + "time_sec": 124.24556708335876 + }, + { + "epoch": 6, + "train_loss": 4.830215334472657, + "train_acc": 0.10662, + "test_loss": 2.3030837219238283, + "test_acc": 0.1, + "lyapunov": 2.7727705700623106, + "grad_norm": 2.350059460657985, + "grad_max_sv": 1.5110829517245292, + "grad_min_sv": 2.7742502849842366e-08, + "grad_condition": 415971679.7996719, + "lr": 0.0009911436253643444, + "time_sec": 124.2670316696167 + }, + { + "epoch": 7, + "train_loss": 5.0002188845825195, + "train_acc": 0.1014, + "test_loss": 2.306517247772217, + "test_acc": 0.1, + "lyapunov": 2.8697540314910968, + "grad_norm": 4.791639177202153, + "grad_max_sv": 0.7900435705131315, + "grad_min_sv": 1.012708673176853e-08, + "grad_condition": 1185811132.9619708, + "lr": 0.0009879583809693736, + "time_sec": 124.2431480884552 + }, + { + "epoch": 8, + "train_loss": 5.872336234741211, + "train_acc": 0.10816, + "test_loss": 2.3033512046813964, + "test_acc": 0.1, + "lyapunov": 3.2996887185079666, + "grad_norm": 4.562165296743471, + "grad_max_sv": 0.4824362076822354, + "grad_min_sv": 1.352856967967285e-08, + "grad_condition": 33563973.110157445, + "lr": 0.0009842915805643154, + "time_sec": 124.24206638336182 + }, + { + "epoch": 9, + "train_loss": 5.207491922912598, + "train_acc": 0.1015, + "test_loss": 2.302657497024536, + "test_acc": 0.1, + "lyapunov": 2.982921624732444, + "grad_norm": 1.2857988530859297, + "grad_max_sv": 0.4782970450818539, + "grad_min_sv": 6.14909029240993e-09, + "grad_condition": 17001336844.82257, + "lr": 0.0009801468428384714, + "time_sec": 124.2599868774414 + }, + { + "epoch": 10, + "train_loss": 5.278977078552246, + "train_acc": 0.11042, + "test_loss": 2.303682248687744, + "test_acc": 0.1, + "lyapunov": 3.0210835842220374, + "grad_norm": 2.219210747930246, + "grad_max_sv": 0.26804067082703115, + "grad_min_sv": 5.793725242549423e-09, + "grad_condition": 7080161076.764597, + "lr": 0.0009755282581475767, + "time_sec": 124.2449324131012 + }, + { + "epoch": 11, + "train_loss": 4.803467753601074, + "train_acc": 0.1012, + "test_loss": 4.169252464294433, + "test_acc": 0.1, + "lyapunov": 2.77325821654571, + "grad_norm": 2.127622649938152, + "grad_max_sv": 0.1682983461767435, + "grad_min_sv": 5.603680153853458e-10, + "grad_condition": 68373983123.414894, + "lr": 0.0009704403844771127, + "time_sec": 124.30126142501831 + }, + { + "epoch": 12, + "train_loss": 4.544517149658203, + "train_acc": 0.09926, + "test_loss": 4.290980886840821, + "test_acc": 0.1, + "lyapunov": 2.62944141068422, + "grad_norm": 1.638854096476257, + "grad_max_sv": 0.07512564162607305, + "grad_min_sv": 2.6490731026315825e-12, + "grad_condition": 54196459261.33328, + "lr": 0.0009648882429441257, + "time_sec": 124.24927043914795 + }, + { + "epoch": 13, + "train_loss": 4.369602390441894, + "train_acc": 0.09752, + "test_loss": 4.109600519561767, + "test_acc": 0.1, + "lyapunov": 2.5177556279370243, + "grad_norm": 2.133122078616872, + "grad_max_sv": 0.09587469333782792, + "grad_min_sv": 2.093604774056981e-12, + "grad_condition": 86094204980.57991, + "lr": 0.0009588773128419905, + "time_sec": 124.26178216934204 + }, + { + "epoch": 14, + "train_loss": 4.34119681640625, + "train_acc": 0.09926, + "test_loss": 4.199708403778076, + "test_acc": 0.1, + "lyapunov": 2.495693293373908, + "grad_norm": 2.708849611541162, + "grad_max_sv": 0.09101940747350454, + "grad_min_sv": 8.368649587364072e-14, + "grad_condition": 87173383288.77208, + "lr": 0.0009524135262330098, + "time_sec": 124.24493861198425 + }, + { + "epoch": 15, + "train_loss": 5.13457500289917, + "train_acc": 0.10424, + "test_loss": 2.308458815765381, + "test_acc": 0.1, + "lyapunov": 2.9219820334783297, + "grad_norm": 3.354402938679459, + "grad_max_sv": 0.09543408825993538, + "grad_min_sv": 1.3719995468877692e-10, + "grad_condition": 59504120268.59434, + "lr": 0.0009455032620941839, + "time_sec": 124.29389190673828 + }, + { + "epoch": 16, + "train_loss": 5.3248897048950194, + "train_acc": 0.10296, + "test_loss": 2.302912854766846, + "test_acc": 0.1, + "lyapunov": 2.9764596306149613, + "grad_norm": 0.6322085012676749, + "grad_max_sv": 0.053145987424068154, + "grad_min_sv": 3.2089368939156336e-11, + "grad_condition": 21592510035.150898, + "lr": 0.0009381533400219318, + "time_sec": 124.22647547721863 + }, + { + "epoch": 17, + "train_loss": 4.330915478057861, + "train_acc": 0.09936, + "test_loss": 2.3026626167297364, + "test_acc": 0.1, + "lyapunov": 2.493599863613353, + "grad_norm": 0.20813626461361764, + "grad_max_sv": 0.0220638582482934, + "grad_min_sv": 5.079951297939575e-13, + "grad_condition": 7528215997.404785, + "lr": 0.0009303710135019719, + "time_sec": 124.25075626373291 + }, + { + "epoch": 18, + "train_loss": 4.329695655975342, + "train_acc": 0.09802, + "test_loss": 2.3026026527404784, + "test_acc": 0.1, + "lyapunov": 2.4943465003577034, + "grad_norm": 0.28764831256555634, + "grad_max_sv": 0.00430559329688549, + "grad_min_sv": 1.0630859058082507e-17, + "grad_condition": 4303763188.890272, + "lr": 0.0009221639627510076, + "time_sec": 124.26908159255981 + }, + { + "epoch": 19, + "train_loss": 4.449291636352539, + "train_acc": 0.09546, + "test_loss": 2.3025916465759275, + "test_acc": 0.1, + "lyapunov": 2.5493475122524956, + "grad_norm": 0.286977076303005, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000913540287137281, + "time_sec": 124.22392654418945 + }, + { + "epoch": 20, + "train_loss": 4.275282980957031, + "train_acc": 0.09758, + "test_loss": 2.3025943778991698, + "test_acc": 0.1, + "lyapunov": 2.4641005602639043, + "grad_norm": 0.11226214403634883, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0009045084971874739, + "time_sec": 124.30651044845581 + }, + { + "epoch": 21, + "train_loss": 4.299091949005127, + "train_acc": 0.09792, + "test_loss": 2.30259245262146, + "test_acc": 0.1, + "lyapunov": 2.477661563917194, + "grad_norm": 0.12888554972749486, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008950775061878452, + "time_sec": 124.23446798324585 + }, + { + "epoch": 22, + "train_loss": 4.315002240905762, + "train_acc": 0.0975, + "test_loss": 2.3025940551757813, + "test_acc": 0.1, + "lyapunov": 2.4848342008907776, + "grad_norm": 0.13926908971905202, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008852566213878947, + "time_sec": 124.30266809463501 + }, + { + "epoch": 23, + "train_loss": 4.362473590087891, + "train_acc": 0.09968, + "test_loss": 2.3025879684448243, + "test_acc": 0.1, + "lyapunov": 2.508172784619929, + "grad_norm": 0.25147158848993745, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008750555348152298, + "time_sec": 124.24051856994629 + }, + { + "epoch": 24, + "train_loss": 4.361022654266358, + "train_acc": 0.09674, + "test_loss": 2.3025897010803225, + "test_acc": 0.1, + "lyapunov": 2.5060998808087596, + "grad_norm": 0.25289701667178555, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008644843137107057, + "time_sec": 124.22614932060242 + }, + { + "epoch": 25, + "train_loss": 4.292231715545654, + "train_acc": 0.098, + "test_loss": 2.3025892387390137, + "test_acc": 0.1, + "lyapunov": 2.4726591543163483, + "grad_norm": 0.15846202884892668, + "grad_max_sv": 0.007139207795262337, + "grad_min_sv": 1.1884213096035809e-14, + "grad_condition": 5768863374.104107, + "lr": 0.0008535533905932737, + "time_sec": 124.29175138473511 + }, + { + "epoch": 26, + "train_loss": 4.278334856414795, + "train_acc": 0.09952, + "test_loss": 2.302597050857544, + "test_acc": 0.1, + "lyapunov": 2.46608062229498, + "grad_norm": 0.09871518957397614, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008422735529643444, + "time_sec": 124.22811436653137 + }, + { + "epoch": 27, + "train_loss": 4.279530144348144, + "train_acc": 0.09882, + "test_loss": 2.3025887565612795, + "test_acc": 0.1, + "lyapunov": 2.466456468757766, + "grad_norm": 0.09728576577451334, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008306559326618259, + "time_sec": 124.25813937187195 + }, + { + "epoch": 28, + "train_loss": 4.276873157348633, + "train_acc": 0.0965, + "test_loss": 2.302586852264404, + "test_acc": 0.1, + "lyapunov": 2.4651820092554897, + "grad_norm": 0.09336828927700111, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 124.22499465942383 + }, + { + "epoch": 29, + "train_loss": 4.274294167022705, + "train_acc": 0.09674, + "test_loss": 2.302587184906006, + "test_acc": 0.1, + "lyapunov": 2.4635079608244053, + "grad_norm": 0.08132883703681491, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008064535268264883, + "time_sec": 124.26223015785217 + }, + { + "epoch": 30, + "train_loss": 4.3161706869506835, + "train_acc": 0.09742, + "test_loss": 2.302589612197876, + "test_acc": 0.1, + "lyapunov": 2.4838878163291365, + "grad_norm": 0.1244076499240839, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007938926261462367, + "time_sec": 124.22068643569946 + }, + { + "epoch": 31, + "train_loss": 4.2865172996520995, + "train_acc": 0.09864, + "test_loss": 2.3025933723449707, + "test_acc": 0.1, + "lyapunov": 2.4704265179841416, + "grad_norm": 0.11325710428703713, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 124.27307343482971 + }, + { + "epoch": 32, + "train_loss": 4.276113499755859, + "train_acc": 0.09876, + "test_loss": 2.302595587158203, + "test_acc": 0.1, + "lyapunov": 2.464605447276474, + "grad_norm": 0.11188150655123451, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 124.21617436408997 + }, + { + "epoch": 33, + "train_loss": 4.390245020904541, + "train_acc": 0.09734, + "test_loss": 2.302589817047119, + "test_acc": 0.1, + "lyapunov": 2.5185477038478608, + "grad_norm": 0.2703519117597579, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 124.22293186187744 + }, + { + "epoch": 34, + "train_loss": 4.350401836242676, + "train_acc": 0.09758, + "test_loss": 2.302588123321533, + "test_acc": 0.1, + "lyapunov": 2.4999206596628176, + "grad_norm": 0.21853702579717843, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 124.26609373092651 + }, + { + "epoch": 35, + "train_loss": 4.305715147399902, + "train_acc": 0.09856, + "test_loss": 2.302589534378052, + "test_acc": 0.1, + "lyapunov": 2.4810556158080432, + "grad_norm": 0.17605927419881373, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 124.22794723510742 + }, + { + "epoch": 36, + "train_loss": 4.305906265258789, + "train_acc": 0.09718, + "test_loss": 2.302591007232666, + "test_acc": 0.1, + "lyapunov": 2.477643119709571, + "grad_norm": 0.1236420897514881, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 124.26314496994019 + }, + { + "epoch": 37, + "train_loss": 4.27584158996582, + "train_acc": 0.0968, + "test_loss": 2.302587622451782, + "test_acc": 0.1, + "lyapunov": 2.464479011038075, + "grad_norm": 0.09532844351778941, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 124.25255799293518 + }, + { + "epoch": 38, + "train_loss": 4.283268468475342, + "train_acc": 0.097, + "test_loss": 2.302587129211426, + "test_acc": 0.1, + "lyapunov": 2.4685643030249556, + "grad_norm": 0.12053745808537034, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 124.26603984832764 + }, + { + "epoch": 39, + "train_loss": 4.340071802978516, + "train_acc": 0.09756, + "test_loss": 2.302587187576294, + "test_acc": 0.1, + "lyapunov": 2.496372491807279, + "grad_norm": 0.2265015040889252, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 124.26093554496765 + }, + { + "epoch": 40, + "train_loss": 4.285524172973632, + "train_acc": 0.0976, + "test_loss": 2.302589253234863, + "test_acc": 0.1, + "lyapunov": 2.4703913722806576, + "grad_norm": 0.12837922155849044, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 124.23279547691345 + }, + { + "epoch": 41, + "train_loss": 4.353975823822021, + "train_acc": 0.0984, + "test_loss": 2.3025891468048094, + "test_acc": 0.1, + "lyapunov": 2.502122705854723, + "grad_norm": 0.31834434179235455, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 124.27406620979309 + }, + { + "epoch": 42, + "train_loss": 4.285235863494873, + "train_acc": 0.0975, + "test_loss": 2.3025873653411866, + "test_acc": 0.1, + "lyapunov": 2.4699011251444705, + "grad_norm": 0.16460675806479913, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 124.23745155334473 + }, + { + "epoch": 43, + "train_loss": 4.273813045043945, + "train_acc": 0.09694, + "test_loss": 2.3025889190673827, + "test_acc": 0.1, + "lyapunov": 2.463189967148139, + "grad_norm": 0.09609475828794435, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 124.27437806129456 + }, + { + "epoch": 44, + "train_loss": 4.297922962646484, + "train_acc": 0.09686, + "test_loss": 2.3025868633270266, + "test_acc": 0.1, + "lyapunov": 2.474009756541923, + "grad_norm": 0.14502465560049782, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 124.22268414497375 + }, + { + "epoch": 45, + "train_loss": 4.279574555053711, + "train_acc": 0.09652, + "test_loss": 2.3025878047943116, + "test_acc": 0.1, + "lyapunov": 2.4667322599064665, + "grad_norm": 0.12003136414158579, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 124.28323554992676 + }, + { + "epoch": 46, + "train_loss": 4.273971158905029, + "train_acc": 0.0966, + "test_loss": 2.302587424468994, + "test_acc": 0.1, + "lyapunov": 2.463305209908644, + "grad_norm": 0.09172584937965118, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 124.20362710952759 + }, + { + "epoch": 47, + "train_loss": 4.313593041381836, + "train_acc": 0.09574, + "test_loss": 2.302586856460571, + "test_acc": 0.1, + "lyapunov": 2.4801262095761114, + "grad_norm": 0.15167690922053198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 124.29144883155823 + }, + { + "epoch": 48, + "train_loss": 4.295382699737549, + "train_acc": 0.09748, + "test_loss": 2.302586772155762, + "test_acc": 0.1, + "lyapunov": 2.4740971671345897, + "grad_norm": 0.10879569327624422, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 124.23017454147339 + }, + { + "epoch": 49, + "train_loss": 4.2751529647827144, + "train_acc": 0.09936, + "test_loss": 2.3025859580993653, + "test_acc": 0.1, + "lyapunov": 2.4640432062661253, + "grad_norm": 0.10568439425734225, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 124.25622701644897 + }, + { + "epoch": 50, + "train_loss": 4.273743729553223, + "train_acc": 0.0957, + "test_loss": 2.3025863090515135, + "test_acc": 0.1, + "lyapunov": 2.4630955387564266, + "grad_norm": 0.11615112587060138, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 124.27268052101135 + }, + { + "epoch": 51, + "train_loss": 4.280425806427002, + "train_acc": 0.09628, + "test_loss": 2.302586248397827, + "test_acc": 0.1, + "lyapunov": 2.466461474938161, + "grad_norm": 0.10654878565362114, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 124.24109268188477 + }, + { + "epoch": 52, + "train_loss": 4.279801727294922, + "train_acc": 0.09702, + "test_loss": 2.3025866828918455, + "test_acc": 0.1, + "lyapunov": 2.4669952484043054, + "grad_norm": 0.130514829251149, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 124.26980781555176 + }, + { + "epoch": 53, + "train_loss": 4.315970222320557, + "train_acc": 0.09704, + "test_loss": 2.3025870681762695, + "test_acc": 0.1, + "lyapunov": 2.484521316445392, + "grad_norm": 0.1939414239261272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 124.22718167304993 + }, + { + "epoch": 54, + "train_loss": 4.311761430969239, + "train_acc": 0.09862, + "test_loss": 2.3025857872009277, + "test_acc": 0.1, + "lyapunov": 2.482763496506245, + "grad_norm": 0.18263667447361673, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 124.2686333656311 + }, + { + "epoch": 55, + "train_loss": 4.277025068054199, + "train_acc": 0.09778, + "test_loss": 2.3025857639312743, + "test_acc": 0.1, + "lyapunov": 2.465040735576464, + "grad_norm": 0.09424723224869033, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 124.23272252082825 + }, + { + "epoch": 56, + "train_loss": 4.308205063934326, + "train_acc": 0.0989, + "test_loss": 2.3025861671447756, + "test_acc": 0.1, + "lyapunov": 2.4804823679082535, + "grad_norm": 0.20788469844558666, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 124.45265817642212 + }, + { + "epoch": 57, + "train_loss": 4.282971714477539, + "train_acc": 0.09876, + "test_loss": 2.3025856742858886, + "test_acc": 0.1, + "lyapunov": 2.4687917086169544, + "grad_norm": 0.1374470775631024, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 124.2466242313385 + }, + { + "epoch": 58, + "train_loss": 4.311033409729004, + "train_acc": 0.09662, + "test_loss": 2.302585438156128, + "test_acc": 0.1, + "lyapunov": 2.4805221582007837, + "grad_norm": 0.15017627742331574, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 124.22827982902527 + }, + { + "epoch": 59, + "train_loss": 4.29637522354126, + "train_acc": 0.09756, + "test_loss": 2.302585637664795, + "test_acc": 0.1, + "lyapunov": 2.4749210880845403, + "grad_norm": 0.1570135955415664, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 124.30038142204285 + }, + { + "epoch": 60, + "train_loss": 4.307900915527344, + "train_acc": 0.09804, + "test_loss": 2.302586008834839, + "test_acc": 0.1, + "lyapunov": 2.4804043434465024, + "grad_norm": 0.21537262268091628, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 124.21648406982422 + }, + { + "epoch": 61, + "train_loss": 4.294828899230957, + "train_acc": 0.09696, + "test_loss": 2.302585659408569, + "test_acc": 0.1, + "lyapunov": 2.474180576441538, + "grad_norm": 0.15175328138376964, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 124.26800394058228 + }, + { + "epoch": 62, + "train_loss": 4.27745719039917, + "train_acc": 0.09794, + "test_loss": 2.302585639190674, + "test_acc": 0.1, + "lyapunov": 2.465500669406198, + "grad_norm": 0.10570315629890674, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 124.23925018310547 + }, + { + "epoch": 63, + "train_loss": 4.2727640603637695, + "train_acc": 0.09586, + "test_loss": 2.3025855934143067, + "test_acc": 0.1, + "lyapunov": 2.4626387360760624, + "grad_norm": 0.0890330369346984, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 124.27016854286194 + }, + { + "epoch": 64, + "train_loss": 4.272457419738769, + "train_acc": 0.09604, + "test_loss": 2.3025855697631834, + "test_acc": 0.1, + "lyapunov": 2.4623735072972526, + "grad_norm": 0.0847950891199477, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 124.20920252799988 + }, + { + "epoch": 65, + "train_loss": 4.273480668334961, + "train_acc": 0.09808, + "test_loss": 2.302585276031494, + "test_acc": 0.1, + "lyapunov": 2.4630366255865073, + "grad_norm": 0.08372012214032937, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 124.22656655311584 + }, + { + "epoch": 66, + "train_loss": 4.307428127746582, + "train_acc": 0.09712, + "test_loss": 2.302585486602783, + "test_acc": 0.1, + "lyapunov": 2.4764473944368874, + "grad_norm": 0.12238051774317063, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 124.28961944580078 + }, + { + "epoch": 67, + "train_loss": 4.310281341094971, + "train_acc": 0.09792, + "test_loss": 2.3025853305816653, + "test_acc": 0.1, + "lyapunov": 2.480989251295319, + "grad_norm": 0.27019424894200594, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 124.25288558006287 + }, + { + "epoch": 68, + "train_loss": 4.282535659484863, + "train_acc": 0.09756, + "test_loss": 2.3025853900909423, + "test_acc": 0.1, + "lyapunov": 2.4676397261412246, + "grad_norm": 0.1281762106524609, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 124.26717019081116 + }, + { + "epoch": 69, + "train_loss": 4.276787458190918, + "train_acc": 0.09688, + "test_loss": 2.3025852905273436, + "test_acc": 0.1, + "lyapunov": 2.4651669858361753, + "grad_norm": 0.08124252440804115, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 124.23096060752869 + }, + { + "epoch": 70, + "train_loss": 4.28195741897583, + "train_acc": 0.09668, + "test_loss": 2.302585355377197, + "test_acc": 0.1, + "lyapunov": 2.468135183729479, + "grad_norm": 0.11112746909721634, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 124.27119207382202 + }, + { + "epoch": 71, + "train_loss": 4.284729679412842, + "train_acc": 0.09706, + "test_loss": 2.302585294342041, + "test_acc": 0.1, + "lyapunov": 2.469655635716665, + "grad_norm": 0.12307199730963861, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 124.23093914985657 + }, + { + "epoch": 72, + "train_loss": 4.276600415039063, + "train_acc": 0.09806, + "test_loss": 2.3025852252960206, + "test_acc": 0.1, + "lyapunov": 2.464849721440269, + "grad_norm": 0.12908363321506647, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 124.25842094421387 + }, + { + "epoch": 73, + "train_loss": 4.3069706353759765, + "train_acc": 0.09654, + "test_loss": 2.3025852447509765, + "test_acc": 0.1, + "lyapunov": 2.479751230810609, + "grad_norm": 0.183601868909449, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 124.21842932701111 + }, + { + "epoch": 74, + "train_loss": 4.287112475280762, + "train_acc": 0.09722, + "test_loss": 2.302585179901123, + "test_acc": 0.1, + "lyapunov": 2.4702408582048343, + "grad_norm": 0.1331148526919891, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 124.22039604187012 + }, + { + "epoch": 75, + "train_loss": 4.271034491882324, + "train_acc": 0.09664, + "test_loss": 2.3025851165771485, + "test_acc": 0.1, + "lyapunov": 2.461448823704439, + "grad_norm": 0.08255701875769623, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 124.30420184135437 + }, + { + "epoch": 76, + "train_loss": 4.272865072021484, + "train_acc": 0.09542, + "test_loss": 2.302585235977173, + "test_acc": 0.1, + "lyapunov": 2.462638800101512, + "grad_norm": 0.08790859271963604, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 124.23553800582886 + }, + { + "epoch": 77, + "train_loss": 4.271533363189698, + "train_acc": 0.09712, + "test_loss": 2.3025852149963377, + "test_acc": 0.1, + "lyapunov": 2.4617462914313197, + "grad_norm": 0.08471091537010327, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 124.25954508781433 + }, + { + "epoch": 78, + "train_loss": 4.290692696685791, + "train_acc": 0.09754, + "test_loss": 2.302585163116455, + "test_acc": 0.1, + "lyapunov": 2.470475591357102, + "grad_norm": 0.10652401748252295, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 124.22494149208069 + }, + { + "epoch": 79, + "train_loss": 4.274790961608887, + "train_acc": 0.09758, + "test_loss": 2.302585228347778, + "test_acc": 0.1, + "lyapunov": 2.4638520756645885, + "grad_norm": 0.08078835262733591, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 124.29019331932068 + }, + { + "epoch": 80, + "train_loss": 4.272836723175049, + "train_acc": 0.09616, + "test_loss": 2.3025851444244383, + "test_acc": 0.1, + "lyapunov": 2.462624883407827, + "grad_norm": 0.08161990901444113, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 124.22851657867432 + }, + { + "epoch": 81, + "train_loss": 4.39987655090332, + "train_acc": 0.0985, + "test_loss": 2.302585282897949, + "test_acc": 0.1, + "lyapunov": 2.5367127757548067, + "grad_norm": 0.6635822194594717, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 124.23617506027222 + }, + { + "epoch": 82, + "train_loss": 4.297471022949218, + "train_acc": 0.0953, + "test_loss": 2.3025852149963377, + "test_acc": 0.1, + "lyapunov": 2.475090144540343, + "grad_norm": 0.729945935366233, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 124.25805640220642 + }, + { + "epoch": 83, + "train_loss": 4.269278663024902, + "train_acc": 0.09916, + "test_loss": 2.3025850776672363, + "test_acc": 0.1, + "lyapunov": 2.4603407303695484, + "grad_norm": 0.09631779246548546, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 124.23541116714478 + }, + { + "epoch": 84, + "train_loss": 4.2767918655395505, + "train_acc": 0.09902, + "test_loss": 2.3025851837158204, + "test_acc": 0.1, + "lyapunov": 2.464642455815659, + "grad_norm": 0.15914456443799777, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 124.2600998878479 + }, + { + "epoch": 85, + "train_loss": 4.275007407989502, + "train_acc": 0.09774, + "test_loss": 2.302585231781006, + "test_acc": 0.1, + "lyapunov": 2.4639958829221213, + "grad_norm": 0.08948000358835351, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 124.19096970558167 + }, + { + "epoch": 86, + "train_loss": 4.282883452606201, + "train_acc": 0.0984, + "test_loss": 2.3025849563598633, + "test_acc": 0.1, + "lyapunov": 2.46685717294893, + "grad_norm": 0.20955582940776452, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 124.28308463096619 + }, + { + "epoch": 87, + "train_loss": 4.273255398712158, + "train_acc": 0.09732, + "test_loss": 2.3025850818634033, + "test_acc": 0.1, + "lyapunov": 2.4628877334887416, + "grad_norm": 0.08251896757547691, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 124.24707794189453 + }, + { + "epoch": 88, + "train_loss": 4.27318275390625, + "train_acc": 0.09818, + "test_loss": 2.3025852210998536, + "test_acc": 0.1, + "lyapunov": 2.462852593273153, + "grad_norm": 0.08488796189115587, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 124.27159857749939 + }, + { + "epoch": 89, + "train_loss": 4.274446720886231, + "train_acc": 0.0964, + "test_loss": 2.3025852279663086, + "test_acc": 0.1, + "lyapunov": 2.463662301792818, + "grad_norm": 0.08254333748035417, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 124.20991706848145 + }, + { + "epoch": 90, + "train_loss": 4.282081894989013, + "train_acc": 0.09898, + "test_loss": 2.302585124206543, + "test_acc": 0.1, + "lyapunov": 2.4669584868204257, + "grad_norm": 0.11057422059552115, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 124.23175573348999 + }, + { + "epoch": 91, + "train_loss": 4.270762037200928, + "train_acc": 0.09742, + "test_loss": 2.302585070037842, + "test_acc": 0.1, + "lyapunov": 2.4613021468872303, + "grad_norm": 0.08094752788352252, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 124.28751397132874 + }, + { + "epoch": 92, + "train_loss": 4.2731778295898435, + "train_acc": 0.0967, + "test_loss": 2.3025849838256836, + "test_acc": 0.1, + "lyapunov": 2.4628693057448054, + "grad_norm": 0.08218150011851272, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 124.20022916793823 + }, + { + "epoch": 93, + "train_loss": 4.271317660827637, + "train_acc": 0.09598, + "test_loss": 2.302585059738159, + "test_acc": 0.1, + "lyapunov": 2.461685863602192, + "grad_norm": 0.09351987385512874, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 124.32517552375793 + }, + { + "epoch": 94, + "train_loss": 4.271005298614502, + "train_acc": 0.09678, + "test_loss": 2.3025850238800047, + "test_acc": 0.1, + "lyapunov": 2.461446201100069, + "grad_norm": 0.08051510852574385, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 124.25493431091309 + }, + { + "epoch": 95, + "train_loss": 4.272550579528809, + "train_acc": 0.0975, + "test_loss": 2.302585118865967, + "test_acc": 0.1, + "lyapunov": 2.462437502258574, + "grad_norm": 0.08133134154526532, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 124.2907202243805 + }, + { + "epoch": 96, + "train_loss": 4.27599407836914, + "train_acc": 0.09808, + "test_loss": 2.302585164642334, + "test_acc": 0.1, + "lyapunov": 2.464714573472357, + "grad_norm": 0.08129994421530186, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 124.2441520690918 + }, + { + "epoch": 97, + "train_loss": 4.27250137512207, + "train_acc": 0.1, + "test_loss": 2.3025850723266603, + "test_acc": 0.1, + "lyapunov": 2.462406137105449, + "grad_norm": 0.08085760651650271, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 124.25383496284485 + }, + { + "epoch": 98, + "train_loss": 4.272909243469238, + "train_acc": 0.1, + "test_loss": 2.30258510017395, + "test_acc": 0.1, + "lyapunov": 2.462700468195064, + "grad_norm": 0.08430371763203995, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 124.2897834777832 + }, + { + "epoch": 99, + "train_loss": 4.27265819152832, + "train_acc": 0.1, + "test_loss": 2.302585132598877, + "test_acc": 0.1, + "lyapunov": 2.462563226290066, + "grad_norm": 0.08009730488173318, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 124.25932240486145 + }, + { + "epoch": 100, + "train_loss": 4.272679078521729, + "train_acc": 0.1, + "test_loss": 2.302585071182251, + "test_acc": 0.1, + "lyapunov": 2.462542835708774, + "grad_norm": 0.08019670403901732, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 124.30135154724121 + } + ], + "16": [ + { + "epoch": 1, + "train_loss": 11.842812671203614, + "train_acc": 0.14506, + "test_loss": 2.34111376953125, + "test_acc": 0.1088, + "lyapunov": 5.111980842507404, + "grad_norm": 6.803328171635302, + "grad_max_sv": 5.664273583889008, + "grad_min_sv": 2.45656453401466e-07, + "grad_condition": 23556170.622745253, + "lr": 0.0009997532801828658, + "time_sec": 167.03577542304993 + }, + { + "epoch": 2, + "train_loss": 6.864391835327148, + "train_acc": 0.1532, + "test_loss": 2.3584522315979, + "test_acc": 0.1126, + "lyapunov": 3.7626322760911246, + "grad_norm": 5.449127371208671, + "grad_max_sv": 4.509619396924973, + "grad_min_sv": 1.816841066926145e-07, + "grad_condition": 25473679.781934455, + "lr": 0.0009990133642141358, + "time_sec": 167.0620617866516 + }, + { + "epoch": 3, + "train_loss": 6.632632642822266, + "train_acc": 0.16122, + "test_loss": 2.358525146102905, + "test_acc": 0.1, + "lyapunov": 3.702555048496217, + "grad_norm": 3.996691628576675, + "grad_max_sv": 3.4047091096639632, + "grad_min_sv": 1.1248512699069124e-07, + "grad_condition": 30963953.097301744, + "lr": 0.00099778098230154, + "time_sec": 167.01362991333008 + }, + { + "epoch": 4, + "train_loss": 6.508619455108643, + "train_acc": 0.15906, + "test_loss": 2.3301877449035646, + "test_acc": 0.1, + "lyapunov": 3.647035371312095, + "grad_norm": 3.2655343849407332, + "grad_max_sv": 3.0296140223741532, + "grad_min_sv": 9.594998209294659e-08, + "grad_condition": 32002571.000903092, + "lr": 0.000996057350657239, + "time_sec": 166.97752714157104 + }, + { + "epoch": 5, + "train_loss": 5.912459800109863, + "train_acc": 0.13794, + "test_loss": 2.3143163734436034, + "test_acc": 0.1, + "lyapunov": 3.364570482917454, + "grad_norm": 2.882730301769821, + "grad_max_sv": 2.836460363864899, + "grad_min_sv": 8.620691849259288e-08, + "grad_condition": 34084982.42197102, + "lr": 0.0009938441702975688, + "time_sec": 167.01780152320862 + }, + { + "epoch": 6, + "train_loss": 5.365990347290039, + "train_acc": 0.12352, + "test_loss": 2.307030549240112, + "test_acc": 0.1, + "lyapunov": 3.0800778951181473, + "grad_norm": 2.6661229845796357, + "grad_max_sv": 1.9664998756031884, + "grad_min_sv": 4.7012965353151585e-08, + "grad_condition": 714227055.0495954, + "lr": 0.0009911436253643444, + "time_sec": 166.95626974105835 + }, + { + "epoch": 7, + "train_loss": 5.098499784545899, + "train_acc": 0.11974, + "test_loss": 2.306401748275757, + "test_acc": 0.1, + "lyapunov": 2.9394846096672973, + "grad_norm": 2.0425554711132987, + "grad_max_sv": 1.3562358289975485, + "grad_min_sv": 3.416944161021407e-08, + "grad_condition": 430074872.43269414, + "lr": 0.0009879583809693736, + "time_sec": 167.02987694740295 + }, + { + "epoch": 8, + "train_loss": 4.836283032226563, + "train_acc": 0.1193, + "test_loss": 2.3056865058898928, + "test_acc": 0.1, + "lyapunov": 2.8134650903589584, + "grad_norm": 1.9015682902174655, + "grad_max_sv": 1.3965314358472825, + "grad_min_sv": 2.998794566512128e-08, + "grad_condition": 984527791.9432541, + "lr": 0.0009842915805643154, + "time_sec": 166.99379587173462 + }, + { + "epoch": 9, + "train_loss": 4.799866871795654, + "train_acc": 0.11898, + "test_loss": 2.3078849700927733, + "test_acc": 0.1, + "lyapunov": 2.7906805755537185, + "grad_norm": 1.830247256824178, + "grad_max_sv": 1.0446476072072983, + "grad_min_sv": 2.2101311034875437e-08, + "grad_condition": 6442199712.909399, + "lr": 0.0009801468428384714, + "time_sec": 167.04091095924377 + }, + { + "epoch": 10, + "train_loss": 4.8418486264038085, + "train_acc": 0.1198, + "test_loss": 2.306636996841431, + "test_acc": 0.1, + "lyapunov": 2.8099952402627073, + "grad_norm": 2.137959073318514, + "grad_max_sv": 0.7742668629978022, + "grad_min_sv": 1.0732185378244782e-08, + "grad_condition": 12825727231.027037, + "lr": 0.0009755282581475767, + "time_sec": 167.01724100112915 + }, + { + "epoch": 11, + "train_loss": 4.899544752502441, + "train_acc": 0.11034, + "test_loss": 2.303115463256836, + "test_acc": 0.1, + "lyapunov": 2.8371418083415314, + "grad_norm": 1.6003418244695304, + "grad_max_sv": 0.6158522295280715, + "grad_min_sv": 3.796369944507449e-09, + "grad_condition": 6480545635.210354, + "lr": 0.0009704403844771127, + "time_sec": 167.04382944107056 + }, + { + "epoch": 12, + "train_loss": 4.951635014648438, + "train_acc": 0.10792, + "test_loss": 2.3031677284240724, + "test_acc": 0.1, + "lyapunov": 2.866735147393268, + "grad_norm": 2.666838044816494, + "grad_max_sv": 0.5319730836898089, + "grad_min_sv": 3.372458990007535e-10, + "grad_condition": 39511669967.92405, + "lr": 0.0009648882429441257, + "time_sec": 166.9957308769226 + }, + { + "epoch": 13, + "train_loss": 6.152256243286133, + "train_acc": 0.10692, + "test_loss": 2.303246379852295, + "test_acc": 0.1, + "lyapunov": 3.4366153896312275, + "grad_norm": 6.342546880123247, + "grad_max_sv": 0.2403870326364995, + "grad_min_sv": 2.6050612198124816e-10, + "grad_condition": 34925794452.094666, + "lr": 0.0009588773128419905, + "time_sec": 167.01189947128296 + }, + { + "epoch": 14, + "train_loss": 6.052201841888428, + "train_acc": 0.10886, + "test_loss": 2.3029991958618163, + "test_acc": 0.1, + "lyapunov": 3.407372230154169, + "grad_norm": 3.751884478526656, + "grad_max_sv": 0.3085380573000293, + "grad_min_sv": 1.7481779514657177e-10, + "grad_condition": 69456467004.02864, + "lr": 0.0009524135262330098, + "time_sec": 166.99195837974548 + }, + { + "epoch": 15, + "train_loss": 6.174399379577637, + "train_acc": 0.10784, + "test_loss": 2.3030965816497804, + "test_acc": 0.1, + "lyapunov": 3.468341021891445, + "grad_norm": 2.2149403643105514, + "grad_max_sv": 0.2665206765946223, + "grad_min_sv": 7.174466620587407e-11, + "grad_condition": 25279718153.525455, + "lr": 0.0009455032620941839, + "time_sec": 167.02302026748657 + }, + { + "epoch": 16, + "train_loss": 5.8687522245788575, + "train_acc": 0.10852, + "test_loss": 2.302928673553467, + "test_acc": 0.1, + "lyapunov": 3.3205134075925784, + "grad_norm": 2.1727798236859517, + "grad_max_sv": 0.1694878804436172, + "grad_min_sv": 5.284483110394732e-11, + "grad_condition": 29825093550.928566, + "lr": 0.0009381533400219318, + "time_sec": 166.98851919174194 + }, + { + "epoch": 17, + "train_loss": 5.00506268585205, + "train_acc": 0.10292, + "test_loss": 2.3029050621032714, + "test_acc": 0.1, + "lyapunov": 2.8923883834458373, + "grad_norm": 1.1450970364565718, + "grad_max_sv": 0.12666865187754867, + "grad_min_sv": 2.4102328364569327e-11, + "grad_condition": 25147403549.501667, + "lr": 0.0009303710135019719, + "time_sec": 167.02036666870117 + }, + { + "epoch": 18, + "train_loss": 4.855449399719238, + "train_acc": 0.104, + "test_loss": 2.3028139762878417, + "test_acc": 0.1, + "lyapunov": 2.8120573298705507, + "grad_norm": 0.7305556308720836, + "grad_max_sv": 0.09714378891512751, + "grad_min_sv": 8.150729035001414e-12, + "grad_condition": 58264297783.12268, + "lr": 0.0009221639627510076, + "time_sec": 167.08689284324646 + }, + { + "epoch": 19, + "train_loss": 4.96336449584961, + "train_acc": 0.1041, + "test_loss": 2.3027950325012205, + "test_acc": 0.1, + "lyapunov": 2.8725837020922804, + "grad_norm": 1.182474133176391, + "grad_max_sv": 0.07083241189830006, + "grad_min_sv": 7.22405413796021e-12, + "grad_condition": 38280733847.458176, + "lr": 0.000913540287137281, + "time_sec": 167.00970244407654 + }, + { + "epoch": 20, + "train_loss": 4.743826732025147, + "train_acc": 0.10382, + "test_loss": 2.3027557773590086, + "test_acc": 0.1, + "lyapunov": 2.7483980515423942, + "grad_norm": 0.6554501104680703, + "grad_max_sv": 0.05732933725230396, + "grad_min_sv": 5.653544739145854e-12, + "grad_condition": 35503198727.48572, + "lr": 0.0009045084971874739, + "time_sec": 167.09380722045898 + }, + { + "epoch": 21, + "train_loss": 4.678205784606933, + "train_acc": 0.10294, + "test_loss": 3.7050921539306643, + "test_acc": 0.1, + "lyapunov": 2.712228787219738, + "grad_norm": 0.9024618566776086, + "grad_max_sv": 0.03976228955434635, + "grad_min_sv": 5.291108131013551e-11, + "grad_condition": 16349739158.901342, + "lr": 0.0008950775061878452, + "time_sec": 167.0224826335907 + }, + { + "epoch": 22, + "train_loss": 4.63441824432373, + "train_acc": 0.09868, + "test_loss": 2.678515822601318, + "test_acc": 0.1, + "lyapunov": 2.6848394797586113, + "grad_norm": 0.9464113383195869, + "grad_max_sv": 0.03219134085811674, + "grad_min_sv": 3.575371656772674e-11, + "grad_condition": 22552839587.69338, + "lr": 0.0008852566213878947, + "time_sec": 167.0608777999878 + }, + { + "epoch": 23, + "train_loss": 4.728675323486328, + "train_acc": 0.09932, + "test_loss": 3.68248123626709, + "test_acc": 0.1, + "lyapunov": 2.732565569450788, + "grad_norm": 1.1845032429393016, + "grad_max_sv": 0.009998515527695418, + "grad_min_sv": 1.095997224005267e-20, + "grad_condition": 9998514820.705112, + "lr": 0.0008750555348152298, + "time_sec": 167.0682075023651 + }, + { + "epoch": 24, + "train_loss": 4.65850959197998, + "train_acc": 0.09912, + "test_loss": 3.6423350326538086, + "test_acc": 0.1, + "lyapunov": 2.6980338791752105, + "grad_norm": 1.5417542431510867, + "grad_max_sv": 0.008353105513378978, + "grad_min_sv": 1.9907194983962853e-18, + "grad_condition": 8352993676.098096, + "lr": 0.0008644843137107057, + "time_sec": 167.08017802238464 + }, + { + "epoch": 25, + "train_loss": 4.584089448547363, + "train_acc": 0.09784, + "test_loss": 2.3033696189880373, + "test_acc": 0.1, + "lyapunov": 2.653346909891309, + "grad_norm": 0.9625814425500707, + "grad_max_sv": 0.0027962074615061282, + "grad_min_sv": 1.8178542286825737e-15, + "grad_condition": 2726213455.6624613, + "lr": 0.0008535533905932737, + "time_sec": 167.05963444709778 + }, + { + "epoch": 26, + "train_loss": 4.562473741149902, + "train_acc": 0.0972, + "test_loss": 2.5531665412902833, + "test_acc": 0.1, + "lyapunov": 2.6440261763989774, + "grad_norm": 1.0966601277478685, + "grad_max_sv": 0.0009299686178565025, + "grad_min_sv": 7.864982908802376e-35, + "grad_condition": 929968617.8565025, + "lr": 0.0008422735529643444, + "time_sec": 167.0820574760437 + }, + { + "epoch": 27, + "train_loss": 4.557928927612305, + "train_acc": 0.10072, + "test_loss": 2.3032149608612063, + "test_acc": 0.1, + "lyapunov": 2.640467453490743, + "grad_norm": 1.5990578945087282, + "grad_max_sv": 0.001147926412522793, + "grad_min_sv": 2.0663573730241894e-15, + "grad_condition": 1060288974.8907245, + "lr": 0.0008306559326618259, + "time_sec": 167.0413818359375 + }, + { + "epoch": 28, + "train_loss": 4.533458753051757, + "train_acc": 0.09686, + "test_loss": 2.303218946838379, + "test_acc": 0.1, + "lyapunov": 2.6252909279845253, + "grad_norm": 0.6753306901464893, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0008187119948743449, + "time_sec": 167.0830535888672 + }, + { + "epoch": 29, + "train_loss": 4.496531313171387, + "train_acc": 0.09852, + "test_loss": 2.3032687267303467, + "test_acc": 0.1, + "lyapunov": 2.6040675938891633, + "grad_norm": 0.18386399798172356, + "grad_max_sv": 0.00110331317409873, + "grad_min_sv": 7.969612926285099e-35, + "grad_condition": 1103313174.09873, + "lr": 0.0008064535268264883, + "time_sec": 167.04623770713806 + }, + { + "epoch": 30, + "train_loss": 4.504303005065918, + "train_acc": 0.0976, + "test_loss": 2.303500841522217, + "test_acc": 0.1, + "lyapunov": 2.6081804003556974, + "grad_norm": 0.15236154258308318, + "grad_max_sv": 0.0028056097216904163, + "grad_min_sv": 0.0, + "grad_condition": 2805609721.6904163, + "lr": 0.0007938926261462367, + "time_sec": 167.02854776382446 + }, + { + "epoch": 31, + "train_loss": 4.50321345703125, + "train_acc": 0.09666, + "test_loss": 2.3035490158081053, + "test_acc": 0.1, + "lyapunov": 2.607592426602493, + "grad_norm": 0.10039091720588617, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007810416889260654, + "time_sec": 167.07999300956726 + }, + { + "epoch": 32, + "train_loss": 4.501663753662109, + "train_acc": 0.09806, + "test_loss": 2.3034838943481444, + "test_acc": 0.1, + "lyapunov": 2.607143198437703, + "grad_norm": 0.1048906506411198, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007679133974894983, + "time_sec": 167.00407528877258 + }, + { + "epoch": 33, + "train_loss": 4.5019655114746095, + "train_acc": 0.09498, + "test_loss": 2.30348473739624, + "test_acc": 0.1, + "lyapunov": 2.607365154549289, + "grad_norm": 0.09466991605122166, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007545207078751857, + "time_sec": 167.04430413246155 + }, + { + "epoch": 34, + "train_loss": 4.4972885162353515, + "train_acc": 0.09806, + "test_loss": 2.3035587966918945, + "test_acc": 0.1, + "lyapunov": 2.6045894854513887, + "grad_norm": 0.094802640603578, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007408768370508577, + "time_sec": 167.01064467430115 + }, + { + "epoch": 35, + "train_loss": 4.496900313110352, + "train_acc": 0.09916, + "test_loss": 2.3035878532409666, + "test_acc": 0.1, + "lyapunov": 2.6043496991667294, + "grad_norm": 0.08505627865784493, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007269952498697734, + "time_sec": 167.04931592941284 + }, + { + "epoch": 36, + "train_loss": 4.498045174407959, + "train_acc": 0.09896, + "test_loss": 2.303556993865967, + "test_acc": 0.1, + "lyapunov": 2.6051284626621722, + "grad_norm": 0.08865673943824036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0007128896457825364, + "time_sec": 166.99707579612732 + }, + { + "epoch": 37, + "train_loss": 4.494941578521728, + "train_acc": 0.09764, + "test_loss": 2.3035079292297365, + "test_acc": 0.1, + "lyapunov": 2.6031092463247, + "grad_norm": 0.09732931123675816, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006985739453173903, + "time_sec": 167.02038192749023 + }, + { + "epoch": 38, + "train_loss": 4.496269936523437, + "train_acc": 0.09764, + "test_loss": 2.3035408573150633, + "test_acc": 0.1, + "lyapunov": 2.604000445217123, + "grad_norm": 0.08852073271727623, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006840622763423391, + "time_sec": 167.02108144760132 + }, + { + "epoch": 39, + "train_loss": 4.493522086791992, + "train_acc": 0.09734, + "test_loss": 2.303493659210205, + "test_acc": 0.1, + "lyapunov": 2.6023181265272446, + "grad_norm": 0.08748337786673831, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006693689601226458, + "time_sec": 167.05211973190308 + }, + { + "epoch": 40, + "train_loss": 4.498229814758301, + "train_acc": 0.09844, + "test_loss": 2.3034747520446777, + "test_acc": 0.1, + "lyapunov": 2.6050954608966017, + "grad_norm": 0.10483613599174303, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006545084971874737, + "time_sec": 167.01571893692017 + }, + { + "epoch": 41, + "train_loss": 4.498432325286865, + "train_acc": 0.09692, + "test_loss": 2.3034770004272462, + "test_acc": 0.1, + "lyapunov": 2.6052994520767876, + "grad_norm": 0.09650951998583779, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006394955530196147, + "time_sec": 167.06526255607605 + }, + { + "epoch": 42, + "train_loss": 4.496120017395019, + "train_acc": 0.09806, + "test_loss": 2.303461635971069, + "test_acc": 0.1, + "lyapunov": 2.6038818706941727, + "grad_norm": 0.08793824539769711, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006243449435824273, + "time_sec": 167.0240659713745 + }, + { + "epoch": 43, + "train_loss": 4.50342136932373, + "train_acc": 0.0968, + "test_loss": 3.123962462234497, + "test_acc": 0.1, + "lyapunov": 2.6082677432643178, + "grad_norm": 0.10763460634241757, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0006090716206982714, + "time_sec": 167.04283785820007 + }, + { + "epoch": 44, + "train_loss": 4.497545390930176, + "train_acc": 0.0993, + "test_loss": 2.30349365196228, + "test_acc": 0.1, + "lyapunov": 2.6048193215714086, + "grad_norm": 0.0914051250208073, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005936906572928625, + "time_sec": 167.00522899627686 + }, + { + "epoch": 45, + "train_loss": 4.497059263458252, + "train_acc": 0.0983, + "test_loss": 2.303560007476807, + "test_acc": 0.1, + "lyapunov": 2.604434971919145, + "grad_norm": 0.09665268401606698, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005782172325201156, + "time_sec": 166.98798084259033 + }, + { + "epoch": 46, + "train_loss": 4.496945586547851, + "train_acc": 0.09766, + "test_loss": 2.303540351486206, + "test_acc": 0.1, + "lyapunov": 2.6044252626121502, + "grad_norm": 0.08182959271154387, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005626666167821523, + "time_sec": 167.05580401420593 + }, + { + "epoch": 47, + "train_loss": 4.5494916119384765, + "train_acc": 0.0975, + "test_loss": 2.3035491088867186, + "test_acc": 0.1, + "lyapunov": 2.6250632187289655, + "grad_norm": 0.16118104591565238, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005470541566592572, + "time_sec": 167.02027297019958 + }, + { + "epoch": 48, + "train_loss": 4.527786728515625, + "train_acc": 0.09808, + "test_loss": 2.303548764038086, + "test_acc": 0.1, + "lyapunov": 2.6161820851933317, + "grad_norm": 0.1522047852768872, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005313952597646569, + "time_sec": 167.08899068832397 + }, + { + "epoch": 49, + "train_loss": 4.49808083328247, + "train_acc": 0.0977, + "test_loss": 2.3034967575073244, + "test_acc": 0.1, + "lyapunov": 2.6051423244769008, + "grad_norm": 0.09227111356756569, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005157053795390643, + "time_sec": 167.04247641563416 + }, + { + "epoch": 50, + "train_loss": 4.506656402282715, + "train_acc": 0.09788, + "test_loss": 2.3035506187438965, + "test_acc": 0.1, + "lyapunov": 2.6092079515042514, + "grad_norm": 0.0989012749171036, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0005000000000000002, + "time_sec": 167.06817507743835 + }, + { + "epoch": 51, + "train_loss": 4.518285944213867, + "train_acc": 0.09874, + "test_loss": 2.303562999343872, + "test_acc": 0.1, + "lyapunov": 2.6132117506793087, + "grad_norm": 0.14702247022618603, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00048429462046093607, + "time_sec": 167.00237131118774 + }, + { + "epoch": 52, + "train_loss": 4.510767389526367, + "train_acc": 0.0985, + "test_loss": 2.303548727416992, + "test_acc": 0.1, + "lyapunov": 2.611425805884554, + "grad_norm": 0.12770796891288963, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004686047402353435, + "time_sec": 167.03129529953003 + }, + { + "epoch": 53, + "train_loss": 4.524528532714844, + "train_acc": 0.09758, + "test_loss": 2.3034987804412843, + "test_acc": 0.1, + "lyapunov": 2.6168906950889648, + "grad_norm": 0.16221922023587404, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000452945843340743, + "time_sec": 167.0302333831787 + }, + { + "epoch": 54, + "train_loss": 4.514558558197021, + "train_acc": 0.09898, + "test_loss": 2.3035224128723146, + "test_acc": 0.1, + "lyapunov": 2.6116219816915214, + "grad_norm": 0.11874932612009399, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00043733338321784806, + "time_sec": 167.03262758255005 + }, + { + "epoch": 55, + "train_loss": 4.500117692108154, + "train_acc": 0.0969, + "test_loss": 2.303501333999634, + "test_acc": 0.1, + "lyapunov": 2.6062854854652033, + "grad_norm": 0.10674428233360923, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0004217827674798847, + "time_sec": 166.98121881484985 + }, + { + "epoch": 56, + "train_loss": 4.51960044921875, + "train_acc": 0.09628, + "test_loss": 2.30349303855896, + "test_acc": 0.1, + "lyapunov": 2.616247482616883, + "grad_norm": 0.14277503967283073, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00040630934270713783, + "time_sec": 167.03360319137573 + }, + { + "epoch": 57, + "train_loss": 4.538308909759522, + "train_acc": 0.0975, + "test_loss": 2.303505461502075, + "test_acc": 0.1, + "lyapunov": 2.624653117431094, + "grad_norm": 0.17354441507562746, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.000390928379301729, + "time_sec": 167.00332236289978 + }, + { + "epoch": 58, + "train_loss": 4.5402243867492675, + "train_acc": 0.09768, + "test_loss": 2.3034944499969483, + "test_acc": 0.1, + "lyapunov": 2.6235652969926213, + "grad_norm": 0.18590049129605235, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003756550564175727, + "time_sec": 166.94713830947876 + }, + { + "epoch": 59, + "train_loss": 4.497288510131836, + "train_acc": 0.09656, + "test_loss": 2.303503835296631, + "test_acc": 0.1, + "lyapunov": 2.60465430237753, + "grad_norm": 0.08925667815477244, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00036050444698038553, + "time_sec": 166.97111773490906 + }, + { + "epoch": 60, + "train_loss": 4.520837378082275, + "train_acc": 0.09746, + "test_loss": 2.3035025501251223, + "test_acc": 0.1, + "lyapunov": 2.6177086183787, + "grad_norm": 0.14390327015753798, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00034549150281252655, + "time_sec": 166.95851969718933 + }, + { + "epoch": 61, + "train_loss": 4.503204351348877, + "train_acc": 0.09616, + "test_loss": 2.3035063259124757, + "test_acc": 0.1, + "lyapunov": 2.6079881752238556, + "grad_norm": 0.11060100204296372, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003306310398773544, + "time_sec": 167.04684805870056 + }, + { + "epoch": 62, + "train_loss": 4.529549421844482, + "train_acc": 0.0966, + "test_loss": 2.303504373550415, + "test_acc": 0.1, + "lyapunov": 2.620155497889994, + "grad_norm": 0.25260476730678916, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00031593772365766127, + "time_sec": 166.9670557975769 + }, + { + "epoch": 63, + "train_loss": 4.504642747955322, + "train_acc": 0.09824, + "test_loss": 2.302585437011719, + "test_acc": 0.1, + "lyapunov": 2.6090027182303426, + "grad_norm": 0.14482467729355822, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0003014260546826097, + "time_sec": 167.07136464118958 + }, + { + "epoch": 64, + "train_loss": 4.5207818331909175, + "train_acc": 0.09658, + "test_loss": 2.302585619735718, + "test_acc": 0.1, + "lyapunov": 2.6153993130949758, + "grad_norm": 0.14340140289375716, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002871103542174637, + "time_sec": 167.0296709537506 + }, + { + "epoch": 65, + "train_loss": 4.514579942321777, + "train_acc": 0.09692, + "test_loss": 2.302585908126831, + "test_acc": 0.1, + "lyapunov": 2.612202508370285, + "grad_norm": 0.11615853114383813, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002730047501302267, + "time_sec": 167.06110525131226 + }, + { + "epoch": 66, + "train_loss": 4.539550397949219, + "train_acc": 0.09668, + "test_loss": 2.3025857189178467, + "test_acc": 0.1, + "lyapunov": 2.6239442215551194, + "grad_norm": 0.24377422344866448, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00025912316294914234, + "time_sec": 166.96833562850952 + }, + { + "epoch": 67, + "train_loss": 4.520765433959961, + "train_acc": 0.09678, + "test_loss": 2.3025856506347657, + "test_acc": 0.1, + "lyapunov": 2.6144380130426352, + "grad_norm": 0.17143215114502838, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0002454792921248144, + "time_sec": 167.06375288963318 + }, + { + "epoch": 68, + "train_loss": 4.501224665222168, + "train_acc": 0.09848, + "test_loss": 2.3025851860046385, + "test_acc": 0.1, + "lyapunov": 2.606965447935607, + "grad_norm": 0.22167025880962787, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00023208660251050164, + "time_sec": 166.97689723968506 + }, + { + "epoch": 69, + "train_loss": 4.516330520629883, + "train_acc": 0.09716, + "test_loss": 2.3025853271484373, + "test_acc": 0.1, + "lyapunov": 2.6127135893877815, + "grad_norm": 0.1178159153430125, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00021895831107393473, + "time_sec": 167.03971099853516 + }, + { + "epoch": 70, + "train_loss": 4.518335289764404, + "train_acc": 0.09628, + "test_loss": 2.3025851623535156, + "test_acc": 0.1, + "lyapunov": 2.614670734576252, + "grad_norm": 0.19910468609269888, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00020610737385376356, + "time_sec": 167.01087379455566 + }, + { + "epoch": 71, + "train_loss": 4.506198991699219, + "train_acc": 0.0961, + "test_loss": 2.3025853843688964, + "test_acc": 0.1, + "lyapunov": 2.6081283720557953, + "grad_norm": 0.09098734124729495, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00019354647317351177, + "time_sec": 167.0194799900055 + }, + { + "epoch": 72, + "train_loss": 4.49574895111084, + "train_acc": 0.09856, + "test_loss": 2.3025853591918946, + "test_acc": 0.1, + "lyapunov": 2.603733692632612, + "grad_norm": 0.08176729544229487, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001812880051256552, + "time_sec": 167.05306220054626 + }, + { + "epoch": 73, + "train_loss": 4.497463835449219, + "train_acc": 0.09886, + "test_loss": 2.3025851680755616, + "test_acc": 0.1, + "lyapunov": 2.604736436053615, + "grad_norm": 0.082986396115534, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00016934406733817422, + "time_sec": 166.98811650276184 + }, + { + "epoch": 74, + "train_loss": 4.4971358953857425, + "train_acc": 0.09738, + "test_loss": 2.302585493850708, + "test_acc": 0.1, + "lyapunov": 2.6045719363805278, + "grad_norm": 0.08151196821637299, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001577264470356557, + "time_sec": 167.01667833328247 + }, + { + "epoch": 75, + "train_loss": 4.50925322631836, + "train_acc": 0.0967, + "test_loss": 2.302585232925415, + "test_acc": 0.1, + "lyapunov": 2.6094926751178242, + "grad_norm": 0.21190207725464844, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00014644660940672634, + "time_sec": 166.97911548614502 + }, + { + "epoch": 76, + "train_loss": 4.496390933227539, + "train_acc": 0.0967, + "test_loss": 2.302585297393799, + "test_acc": 0.1, + "lyapunov": 2.6040706823549002, + "grad_norm": 0.08435313407684436, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0001355156862892944, + "time_sec": 167.0480306148529 + }, + { + "epoch": 77, + "train_loss": 4.496095029296875, + "train_acc": 0.0965, + "test_loss": 2.3025853218078614, + "test_acc": 0.1, + "lyapunov": 2.6039189987475306, + "grad_norm": 0.1373346720572696, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00012494446518477025, + "time_sec": 166.97820734977722 + }, + { + "epoch": 78, + "train_loss": 4.499068414611816, + "train_acc": 0.096, + "test_loss": 2.3025852237701416, + "test_acc": 0.1, + "lyapunov": 2.605743714305751, + "grad_norm": 0.10939849657650327, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00011474337861210548, + "time_sec": 166.98934531211853 + }, + { + "epoch": 79, + "train_loss": 4.4964453392028805, + "train_acc": 0.09828, + "test_loss": 2.302585151672363, + "test_acc": 0.1, + "lyapunov": 2.604178778655694, + "grad_norm": 0.08774538011729731, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.00010492249381215483, + "time_sec": 167.02672863006592 + }, + { + "epoch": 80, + "train_loss": 4.499743932647705, + "train_acc": 0.09862, + "test_loss": 2.302585228347778, + "test_acc": 0.1, + "lyapunov": 2.606093951808217, + "grad_norm": 0.2420142867175763, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.549150281252637e-05, + "time_sec": 167.10957646369934 + }, + { + "epoch": 81, + "train_loss": 4.502734872436523, + "train_acc": 0.09578, + "test_loss": 2.302585201263428, + "test_acc": 0.1, + "lyapunov": 2.6076697900776975, + "grad_norm": 0.13251791023485532, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.645971286271918e-05, + "time_sec": 166.9769287109375 + }, + { + "epoch": 82, + "train_loss": 4.494626608581543, + "train_acc": 0.09758, + "test_loss": 2.3025851295471194, + "test_acc": 0.1, + "lyapunov": 2.6029957383489974, + "grad_norm": 0.08170465976084904, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 7.78360372489926e-05, + "time_sec": 167.00449562072754 + }, + { + "epoch": 83, + "train_loss": 4.495700520019532, + "train_acc": 0.09822, + "test_loss": 2.3025853286743163, + "test_acc": 0.1, + "lyapunov": 2.6036597090913816, + "grad_norm": 0.1210411913955966, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.962898649802815e-05, + "time_sec": 166.96435856819153 + }, + { + "epoch": 84, + "train_loss": 4.49369448425293, + "train_acc": 0.09848, + "test_loss": 2.3025850296020507, + "test_acc": 0.1, + "lyapunov": 2.6024485061235745, + "grad_norm": 0.1169116031555102, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.184665997806824e-05, + "time_sec": 166.9589819908142 + }, + { + "epoch": 85, + "train_loss": 4.493269319915772, + "train_acc": 0.09772, + "test_loss": 2.3025851333618164, + "test_acc": 0.1, + "lyapunov": 2.60219204151417, + "grad_norm": 0.08026909865070977, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 5.449673790581613e-05, + "time_sec": 167.0204620361328 + }, + { + "epoch": 86, + "train_loss": 4.4974218487548825, + "train_acc": 0.09802, + "test_loss": 2.302585245895386, + "test_acc": 0.1, + "lyapunov": 2.604730949987231, + "grad_norm": 0.08689607041758553, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.758647376699034e-05, + "time_sec": 166.964524269104 + }, + { + "epoch": 87, + "train_loss": 4.495326493072509, + "train_acc": 0.0982, + "test_loss": 2.3025850296020507, + "test_acc": 0.1, + "lyapunov": 2.603457776481843, + "grad_norm": 0.09583928752803095, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 4.112268715800956e-05, + "time_sec": 167.03006196022034 + }, + { + "epoch": 88, + "train_loss": 4.494311538085937, + "train_acc": 0.09762, + "test_loss": 2.3025852684020998, + "test_acc": 0.1, + "lyapunov": 2.602831931980065, + "grad_norm": 0.08201988600112256, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.511175705587434e-05, + "time_sec": 166.98635745048523 + }, + { + "epoch": 89, + "train_loss": 4.497406745605469, + "train_acc": 0.09872, + "test_loss": 2.302585092926025, + "test_acc": 0.1, + "lyapunov": 2.6046652647540394, + "grad_norm": 0.11011286998675665, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.9559615522887284e-05, + "time_sec": 167.0066351890564 + }, + { + "epoch": 90, + "train_loss": 4.495393841552734, + "train_acc": 0.0955, + "test_loss": 2.3025851219177245, + "test_acc": 0.1, + "lyapunov": 2.603500037546963, + "grad_norm": 0.08854801622590937, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.447174185242324e-05, + "time_sec": 166.98117446899414 + }, + { + "epoch": 91, + "train_loss": 4.496799105529785, + "train_acc": 0.09778, + "test_loss": 2.3025851669311526, + "test_acc": 0.1, + "lyapunov": 2.6043886601772455, + "grad_norm": 0.08317548392372451, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.9853157161528526e-05, + "time_sec": 167.05606770515442 + }, + { + "epoch": 92, + "train_loss": 4.501456503753662, + "train_acc": 0.09732, + "test_loss": 2.302585040283203, + "test_acc": 0.1, + "lyapunov": 2.6069688260402826, + "grad_norm": 0.09601255447418665, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.570841943568452e-05, + "time_sec": 166.95690035820007 + }, + { + "epoch": 93, + "train_loss": 4.4988940646362305, + "train_acc": 0.09822, + "test_loss": 2.302585070037842, + "test_acc": 0.1, + "lyapunov": 2.6056473828337685, + "grad_norm": 0.11345521860163729, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 1.204161903062634e-05, + "time_sec": 167.01007437705994 + }, + { + "epoch": 94, + "train_loss": 4.500971371002198, + "train_acc": 0.09656, + "test_loss": 2.3025852294921876, + "test_acc": 0.1, + "lyapunov": 2.606662953296281, + "grad_norm": 0.10989679012817173, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 8.85637463565564e-06, + "time_sec": 166.93790555000305 + }, + { + "epoch": 95, + "train_loss": 4.496245345458984, + "train_acc": 0.09824, + "test_loss": 2.3025850425720216, + "test_acc": 0.1, + "lyapunov": 2.6040014677950185, + "grad_norm": 0.13386825999790872, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 6.155829702431171e-06, + "time_sec": 166.99875664710999 + }, + { + "epoch": 96, + "train_loss": 4.4964897052001955, + "train_acc": 0.09874, + "test_loss": 2.302585097122192, + "test_acc": 0.1, + "lyapunov": 2.6042159268313356, + "grad_norm": 0.09409731933962433, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 3.942649342761118e-06, + "time_sec": 166.96930813789368 + }, + { + "epoch": 97, + "train_loss": 4.499828433837891, + "train_acc": 0.1, + "test_loss": 2.3025849605560302, + "test_acc": 0.1, + "lyapunov": 2.6062122037648545, + "grad_norm": 0.16887612557601597, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.2190176984600023e-06, + "time_sec": 166.9714593887329 + }, + { + "epoch": 98, + "train_loss": 4.496156484069824, + "train_acc": 0.1, + "test_loss": 2.302585231781006, + "test_acc": 0.1, + "lyapunov": 2.603946977259253, + "grad_norm": 0.08139214809285189, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 9.866357858642206e-07, + "time_sec": 167.0184144973755 + }, + { + "epoch": 99, + "train_loss": 4.497607230377198, + "train_acc": 0.1, + "test_loss": 2.302585125350952, + "test_acc": 0.1, + "lyapunov": 2.6048427774473226, + "grad_norm": 0.08064979301518677, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 2.467198171342e-07, + "time_sec": 166.95221614837646 + }, + { + "epoch": 100, + "train_loss": 4.493742803955078, + "train_acc": 0.1, + "test_loss": 2.302585009765625, + "test_acc": 0.1, + "lyapunov": 2.602488872035385, + "grad_norm": 0.08215126330977654, + "grad_max_sv": 0.0, + "grad_min_sv": 0.0, + "grad_condition": 0.0, + "lr": 0.0, + "time_sec": 166.99254083633423 + } + ] + } +}
\ No newline at end of file |
