summaryrefslogtreecommitdiff
path: root/runs/depth_scaling/cifar10_20251229-160504
diff options
context:
space:
mode:
authorYurenHao0426 <blackhao0426@gmail.com>2026-01-13 23:50:59 -0600
committerYurenHao0426 <blackhao0426@gmail.com>2026-01-13 23:50:59 -0600
commit00cf667cee7ffacb144d5805fc7e0ef443f3583a (patch)
tree77d20a3adaecf96bf3aff0612bdd3b5fa1a7dc7e /runs/depth_scaling/cifar10_20251229-160504
parentc53c04aa1d6ff75cb478a9498c370baa929c74b6 (diff)
parentcd99d6b874d9d09b3bb87b8485cc787885af71f1 (diff)
Merge master into main
Diffstat (limited to 'runs/depth_scaling/cifar10_20251229-160504')
-rw-r--r--runs/depth_scaling/cifar10_20251229-160504/config.json20
-rw-r--r--runs/depth_scaling/cifar10_20251229-160504/results.json11222
2 files changed, 11242 insertions, 0 deletions
diff --git a/runs/depth_scaling/cifar10_20251229-160504/config.json b/runs/depth_scaling/cifar10_20251229-160504/config.json
new file mode 100644
index 0000000..c87b8a8
--- /dev/null
+++ b/runs/depth_scaling/cifar10_20251229-160504/config.json
@@ -0,0 +1,20 @@
+{
+ "dataset": "cifar10",
+ "depths": [
+ 4,
+ 8,
+ 12,
+ 16
+ ],
+ "T": 4,
+ "epochs": 100,
+ "batch_size": 128,
+ "lr": 0.001,
+ "lambda_reg": 0.3,
+ "lambda_target": -0.1,
+ "data_dir": "./data",
+ "out_dir": "runs/depth_scaling",
+ "device": "cuda",
+ "seed": 42,
+ "no_progress": false
+} \ No newline at end of file
diff --git a/runs/depth_scaling/cifar10_20251229-160504/results.json b/runs/depth_scaling/cifar10_20251229-160504/results.json
new file mode 100644
index 0000000..2e9b6eb
--- /dev/null
+++ b/runs/depth_scaling/cifar10_20251229-160504/results.json
@@ -0,0 +1,11222 @@
+{
+ "vanilla": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 1.87523081199646,
+ "train_acc": 0.3904,
+ "test_loss": 1.3005033981323242,
+ "test_acc": 0.538,
+ "lyapunov": null,
+ "grad_norm": 7.167065437345997,
+ "grad_max_sv": 6.2841449797153475,
+ "grad_min_sv": 2.820393511626662e-07,
+ "grad_condition": 22637653.325481158,
+ "lr": 0.0009997532801828658,
+ "time_sec": 17.83638072013855
+ },
+ {
+ "epoch": 2,
+ "train_loss": 1.330778917236328,
+ "train_acc": 0.53242,
+ "test_loss": 1.3051589399337769,
+ "test_acc": 0.5299,
+ "lyapunov": null,
+ "grad_norm": 5.684293544168513,
+ "grad_max_sv": 4.961454087495804,
+ "grad_min_sv": 2.2011614504435783e-07,
+ "grad_condition": 23000049.3006949,
+ "lr": 0.0009990133642141358,
+ "time_sec": 15.308318853378296
+ },
+ {
+ "epoch": 3,
+ "train_loss": 1.1224762370300292,
+ "train_acc": 0.59994,
+ "test_loss": 1.1229688482284546,
+ "test_acc": 0.6085,
+ "lyapunov": null,
+ "grad_norm": 4.767601837094887,
+ "grad_max_sv": 4.13027862906456,
+ "grad_min_sv": 1.9442289698190506e-07,
+ "grad_condition": 21218061.296424918,
+ "lr": 0.00099778098230154,
+ "time_sec": 15.306547403335571
+ },
+ {
+ "epoch": 4,
+ "train_loss": 0.9929985418510437,
+ "train_acc": 0.6506,
+ "test_loss": 1.0345463452339172,
+ "test_acc": 0.6476,
+ "lyapunov": null,
+ "grad_norm": 4.154534311876162,
+ "grad_max_sv": 3.4217750519514083,
+ "grad_min_sv": 1.738904227721605e-07,
+ "grad_condition": 19945043.08817544,
+ "lr": 0.000996057350657239,
+ "time_sec": 15.302969694137573
+ },
+ {
+ "epoch": 5,
+ "train_loss": 0.8976026094818115,
+ "train_acc": 0.68438,
+ "test_loss": 0.8756585054397583,
+ "test_acc": 0.6914,
+ "lyapunov": null,
+ "grad_norm": 3.6333960771107905,
+ "grad_max_sv": 2.9354925364255906,
+ "grad_min_sv": 1.6106242668456615e-07,
+ "grad_condition": 18489046.232839655,
+ "lr": 0.0009938441702975688,
+ "time_sec": 15.317728281021118
+ },
+ {
+ "epoch": 6,
+ "train_loss": 0.8413557116317749,
+ "train_acc": 0.70288,
+ "test_loss": 1.0890468210220337,
+ "test_acc": 0.6361,
+ "lyapunov": null,
+ "grad_norm": 3.416502916483722,
+ "grad_max_sv": 2.8772784233093263,
+ "grad_min_sv": 1.524946609876565e-07,
+ "grad_condition": 19017545.32666207,
+ "lr": 0.0009911436253643444,
+ "time_sec": 15.30530047416687
+ },
+ {
+ "epoch": 7,
+ "train_loss": 0.780380486125946,
+ "train_acc": 0.72624,
+ "test_loss": 0.7749503490447998,
+ "test_acc": 0.7328,
+ "lyapunov": null,
+ "grad_norm": 3.046069709126096,
+ "grad_max_sv": 2.3629971712827684,
+ "grad_min_sv": 1.380081055657456e-07,
+ "grad_condition": 17149009.230771504,
+ "lr": 0.0009879583809693736,
+ "time_sec": 15.307675838470459
+ },
+ {
+ "epoch": 8,
+ "train_loss": 0.7390781346511841,
+ "train_acc": 0.7414,
+ "test_loss": 0.7958005157470703,
+ "test_acc": 0.7277,
+ "lyapunov": null,
+ "grad_norm": 2.7435338958916513,
+ "grad_max_sv": 2.05181370973587,
+ "grad_min_sv": 1.2932217341443675e-07,
+ "grad_condition": 16036517.768211821,
+ "lr": 0.0009842915805643154,
+ "time_sec": 15.307319641113281
+ },
+ {
+ "epoch": 9,
+ "train_loss": 0.7052495925521851,
+ "train_acc": 0.75274,
+ "test_loss": 1.0447007677078246,
+ "test_acc": 0.6745,
+ "lyapunov": null,
+ "grad_norm": 2.552586529905072,
+ "grad_max_sv": 2.0337040573358536,
+ "grad_min_sv": 1.2101497901539914e-07,
+ "grad_condition": 16963155.872520845,
+ "lr": 0.0009801468428384714,
+ "time_sec": 15.290063619613647
+ },
+ {
+ "epoch": 10,
+ "train_loss": 0.6694383864402771,
+ "train_acc": 0.76588,
+ "test_loss": 0.9462176066398621,
+ "test_acc": 0.6842,
+ "lyapunov": null,
+ "grad_norm": 2.3520331395340692,
+ "grad_max_sv": 1.7684333354234696,
+ "grad_min_sv": 1.1190378259584577e-07,
+ "grad_condition": 15955738.307438832,
+ "lr": 0.0009755282581475767,
+ "time_sec": 15.305615901947021
+ },
+ {
+ "epoch": 11,
+ "train_loss": 0.6340117832756043,
+ "train_acc": 0.77878,
+ "test_loss": 0.7613432981491088,
+ "test_acc": 0.7377,
+ "lyapunov": null,
+ "grad_norm": 2.164571307713442,
+ "grad_max_sv": 1.7057331085205079,
+ "grad_min_sv": 1.0792852087604387e-07,
+ "grad_condition": 15783530.208328355,
+ "lr": 0.0009704403844771127,
+ "time_sec": 15.29656457901001
+ },
+ {
+ "epoch": 12,
+ "train_loss": 0.6060477030181884,
+ "train_acc": 0.78728,
+ "test_loss": 0.7971237164974213,
+ "test_acc": 0.729,
+ "lyapunov": null,
+ "grad_norm": 1.993298876301324,
+ "grad_max_sv": 1.514353270828724,
+ "grad_min_sv": 1.009763655801521e-07,
+ "grad_condition": 14944755.026175302,
+ "lr": 0.0009648882429441257,
+ "time_sec": 15.30236530303955
+ },
+ {
+ "epoch": 13,
+ "train_loss": 0.5870892490005493,
+ "train_acc": 0.79524,
+ "test_loss": 0.8448094959259034,
+ "test_acc": 0.7127,
+ "lyapunov": null,
+ "grad_norm": 1.8629217723116693,
+ "grad_max_sv": 1.3949483826756477,
+ "grad_min_sv": 9.635141964281502e-08,
+ "grad_condition": 14581029.38399595,
+ "lr": 0.0009588773128419905,
+ "time_sec": 15.315025806427002
+ },
+ {
+ "epoch": 14,
+ "train_loss": 0.5539195073699951,
+ "train_acc": 0.80644,
+ "test_loss": 0.7561563467979431,
+ "test_acc": 0.7394,
+ "lyapunov": null,
+ "grad_norm": 1.6986166991338625,
+ "grad_max_sv": 1.245494757592678,
+ "grad_min_sv": 8.711651755533012e-08,
+ "grad_condition": 14401234.8235637,
+ "lr": 0.0009524135262330098,
+ "time_sec": 15.308890104293823
+ },
+ {
+ "epoch": 15,
+ "train_loss": 0.5333379591941834,
+ "train_acc": 0.8143,
+ "test_loss": 0.6968033623695373,
+ "test_acc": 0.7569,
+ "lyapunov": null,
+ "grad_norm": 1.5656089916965232,
+ "grad_max_sv": 1.1909169003367424,
+ "grad_min_sv": 8.488269482853639e-08,
+ "grad_condition": 14106351.27298153,
+ "lr": 0.0009455032620941839,
+ "time_sec": 15.311123609542847
+ },
+ {
+ "epoch": 16,
+ "train_loss": 0.5167095581436157,
+ "train_acc": 0.82042,
+ "test_loss": 0.849514400100708,
+ "test_acc": 0.7133,
+ "lyapunov": null,
+ "grad_norm": 1.496171987836298,
+ "grad_max_sv": 1.0258999049663544,
+ "grad_min_sv": 8.006283778172473e-08,
+ "grad_condition": 12841377.110361751,
+ "lr": 0.0009381533400219318,
+ "time_sec": 15.310609817504883
+ },
+ {
+ "epoch": 17,
+ "train_loss": 0.49894729826927187,
+ "train_acc": 0.8262,
+ "test_loss": 0.7154086270809173,
+ "test_acc": 0.7552,
+ "lyapunov": null,
+ "grad_norm": 1.3884031919720434,
+ "grad_max_sv": 0.9819801226258278,
+ "grad_min_sv": 7.953692726658801e-08,
+ "grad_condition": 12477520.833613167,
+ "lr": 0.0009303710135019719,
+ "time_sec": 15.301868200302124
+ },
+ {
+ "epoch": 18,
+ "train_loss": 0.4833205630302429,
+ "train_acc": 0.83074,
+ "test_loss": 0.8212436129570008,
+ "test_acc": 0.7372,
+ "lyapunov": null,
+ "grad_norm": 1.322943153444315,
+ "grad_max_sv": 0.9954353883862496,
+ "grad_min_sv": 7.706266931251094e-08,
+ "grad_condition": 12928888.561653998,
+ "lr": 0.0009221639627510076,
+ "time_sec": 15.304028987884521
+ },
+ {
+ "epoch": 19,
+ "train_loss": 0.46378349807739255,
+ "train_acc": 0.8371,
+ "test_loss": 0.6447551451683045,
+ "test_acc": 0.789,
+ "lyapunov": null,
+ "grad_norm": 1.231933968586028,
+ "grad_max_sv": 0.7683330580592156,
+ "grad_min_sv": 6.892571695615856e-08,
+ "grad_condition": 11194075.895721275,
+ "lr": 0.000913540287137281,
+ "time_sec": 15.304960489273071
+ },
+ {
+ "epoch": 20,
+ "train_loss": 0.44474551233291626,
+ "train_acc": 0.84504,
+ "test_loss": 0.6990101715087891,
+ "test_acc": 0.7693,
+ "lyapunov": null,
+ "grad_norm": 1.1785280692983833,
+ "grad_max_sv": 0.8134334728121757,
+ "grad_min_sv": 6.934622298615523e-08,
+ "grad_condition": 11771827.214910198,
+ "lr": 0.0009045084971874739,
+ "time_sec": 15.309978008270264
+ },
+ {
+ "epoch": 21,
+ "train_loss": 0.4328971823978424,
+ "train_acc": 0.8493,
+ "test_loss": 0.605803295135498,
+ "test_acc": 0.7971,
+ "lyapunov": null,
+ "grad_norm": 1.1010893792673297,
+ "grad_max_sv": 0.74788568764925,
+ "grad_min_sv": 6.635127869358826e-08,
+ "grad_condition": 11337903.371089932,
+ "lr": 0.0008950775061878452,
+ "time_sec": 15.304766416549683
+ },
+ {
+ "epoch": 22,
+ "train_loss": 0.42013943620681765,
+ "train_acc": 0.85398,
+ "test_loss": 0.6351155483245849,
+ "test_acc": 0.7873,
+ "lyapunov": null,
+ "grad_norm": 1.050275059187082,
+ "grad_max_sv": 0.733056052774191,
+ "grad_min_sv": 6.172693325368073e-08,
+ "grad_condition": 11926578.893480929,
+ "lr": 0.0008852566213878947,
+ "time_sec": 15.304250001907349
+ },
+ {
+ "epoch": 23,
+ "train_loss": 0.4068706720542908,
+ "train_acc": 0.85872,
+ "test_loss": 0.6962938892364502,
+ "test_acc": 0.7771,
+ "lyapunov": null,
+ "grad_norm": 1.0041008989601972,
+ "grad_max_sv": 0.6977266952395439,
+ "grad_min_sv": 6.174876086006975e-08,
+ "grad_condition": 11375115.065625418,
+ "lr": 0.0008750555348152298,
+ "time_sec": 15.29546570777893
+ },
+ {
+ "epoch": 24,
+ "train_loss": 0.3927080359458923,
+ "train_acc": 0.86198,
+ "test_loss": 0.6316822688102722,
+ "test_acc": 0.797,
+ "lyapunov": null,
+ "grad_norm": 0.9591057928108919,
+ "grad_max_sv": 0.6601924143731595,
+ "grad_min_sv": 5.981677704269828e-08,
+ "grad_condition": 10958128.320144685,
+ "lr": 0.0008644843137107057,
+ "time_sec": 15.319843292236328
+ },
+ {
+ "epoch": 25,
+ "train_loss": 0.37991392849445343,
+ "train_acc": 0.8662,
+ "test_loss": 0.7685016389846802,
+ "test_acc": 0.7528,
+ "lyapunov": null,
+ "grad_norm": 0.9185108543931831,
+ "grad_max_sv": 0.5813446715474129,
+ "grad_min_sv": 5.7562914257403006e-08,
+ "grad_condition": 10132723.13073414,
+ "lr": 0.0008535533905932737,
+ "time_sec": 15.314316272735596
+ },
+ {
+ "epoch": 26,
+ "train_loss": 0.3740078569984436,
+ "train_acc": 0.86904,
+ "test_loss": 0.6302923937797547,
+ "test_acc": 0.7894,
+ "lyapunov": null,
+ "grad_norm": 0.896823092741051,
+ "grad_max_sv": 0.5897809371352196,
+ "grad_min_sv": 5.612208120453488e-08,
+ "grad_condition": 10555219.724126566,
+ "lr": 0.0008422735529643444,
+ "time_sec": 15.295911312103271
+ },
+ {
+ "epoch": 27,
+ "train_loss": 0.35986615454673765,
+ "train_acc": 0.8722,
+ "test_loss": 0.5293433817148209,
+ "test_acc": 0.8255,
+ "lyapunov": null,
+ "grad_norm": 0.8414160526480361,
+ "grad_max_sv": 0.5433246113359929,
+ "grad_min_sv": 5.460546566027347e-08,
+ "grad_condition": 10029361.12551422,
+ "lr": 0.0008306559326618259,
+ "time_sec": 15.296611309051514
+ },
+ {
+ "epoch": 28,
+ "train_loss": 0.34749350198745727,
+ "train_acc": 0.87846,
+ "test_loss": 0.6013012096405029,
+ "test_acc": 0.8077,
+ "lyapunov": null,
+ "grad_norm": 0.8012028361027335,
+ "grad_max_sv": 0.5324302047491074,
+ "grad_min_sv": 5.343053706141632e-08,
+ "grad_condition": 9995030.902296156,
+ "lr": 0.0008187119948743449,
+ "time_sec": 15.314170122146606
+ },
+ {
+ "epoch": 29,
+ "train_loss": 0.33312201313018797,
+ "train_acc": 0.88212,
+ "test_loss": 0.5545183982849121,
+ "test_acc": 0.8162,
+ "lyapunov": null,
+ "grad_norm": 0.7852771005330633,
+ "grad_max_sv": 0.5164767228066921,
+ "grad_min_sv": 5.198521888516439e-08,
+ "grad_condition": 10107248.49432898,
+ "lr": 0.0008064535268264883,
+ "time_sec": 15.311892986297607
+ },
+ {
+ "epoch": 30,
+ "train_loss": 0.3230313647842407,
+ "train_acc": 0.88538,
+ "test_loss": 0.658975659275055,
+ "test_acc": 0.7951,
+ "lyapunov": null,
+ "grad_norm": 0.7620779575769897,
+ "grad_max_sv": 0.5038670122623443,
+ "grad_min_sv": 5.0398949014152095e-08,
+ "grad_condition": 10038873.739317197,
+ "lr": 0.0007938926261462367,
+ "time_sec": 15.305739402770996
+ },
+ {
+ "epoch": 31,
+ "train_loss": 0.318023904876709,
+ "train_acc": 0.88796,
+ "test_loss": 0.6099616609573364,
+ "test_acc": 0.8127,
+ "lyapunov": null,
+ "grad_norm": 0.7501021639283835,
+ "grad_max_sv": 0.48214229866862296,
+ "grad_min_sv": 5.136175964537415e-08,
+ "grad_condition": 9343056.264591306,
+ "lr": 0.0007810416889260654,
+ "time_sec": 15.325766324996948
+ },
+ {
+ "epoch": 32,
+ "train_loss": 0.31232675287246703,
+ "train_acc": 0.89082,
+ "test_loss": 0.5936648756027222,
+ "test_acc": 0.8109,
+ "lyapunov": null,
+ "grad_norm": 0.7279129448401558,
+ "grad_max_sv": 0.4431505911052227,
+ "grad_min_sv": 4.812153910904726e-08,
+ "grad_condition": 9245973.275864627,
+ "lr": 0.0007679133974894983,
+ "time_sec": 15.317164897918701
+ },
+ {
+ "epoch": 33,
+ "train_loss": 0.29341697571754455,
+ "train_acc": 0.8967,
+ "test_loss": 0.5134524160385132,
+ "test_acc": 0.8357,
+ "lyapunov": null,
+ "grad_norm": 0.6884958324446571,
+ "grad_max_sv": 0.4426784858107567,
+ "grad_min_sv": 4.9337259699910875e-08,
+ "grad_condition": 9173234.108017813,
+ "lr": 0.0007545207078751857,
+ "time_sec": 15.312905311584473
+ },
+ {
+ "epoch": 34,
+ "train_loss": 0.2897170938873291,
+ "train_acc": 0.89828,
+ "test_loss": 0.5332132309913635,
+ "test_acc": 0.8335,
+ "lyapunov": null,
+ "grad_norm": 0.6750271636840882,
+ "grad_max_sv": 0.4532689817249775,
+ "grad_min_sv": 4.866335441278125e-08,
+ "grad_condition": 9412153.339201316,
+ "lr": 0.0007408768370508577,
+ "time_sec": 15.313745260238647
+ },
+ {
+ "epoch": 35,
+ "train_loss": 0.28602589085578917,
+ "train_acc": 0.89756,
+ "test_loss": 0.6111867341041565,
+ "test_acc": 0.8164,
+ "lyapunov": null,
+ "grad_norm": 0.6693786571127541,
+ "grad_max_sv": 0.4255728892982006,
+ "grad_min_sv": 4.737296563916971e-08,
+ "grad_condition": 9020003.170186436,
+ "lr": 0.0007269952498697734,
+ "time_sec": 15.32437539100647
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.2724088624763489,
+ "train_acc": 0.90408,
+ "test_loss": 0.5054482436180114,
+ "test_acc": 0.8387,
+ "lyapunov": null,
+ "grad_norm": 0.6416324201224461,
+ "grad_max_sv": 0.4291106700897217,
+ "grad_min_sv": 4.6136759568327077e-08,
+ "grad_condition": 9385408.654433403,
+ "lr": 0.0007128896457825364,
+ "time_sec": 15.322253704071045
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.26598569943904876,
+ "train_acc": 0.90576,
+ "test_loss": 0.5292941621780396,
+ "test_acc": 0.8315,
+ "lyapunov": null,
+ "grad_norm": 0.6311835178833255,
+ "grad_max_sv": 0.372799988463521,
+ "grad_min_sv": 4.42526025601353e-08,
+ "grad_condition": 8432960.688056583,
+ "lr": 0.0006985739453173903,
+ "time_sec": 15.330822467803955
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.2548411606884003,
+ "train_acc": 0.90972,
+ "test_loss": 0.5889158064842224,
+ "test_acc": 0.8304,
+ "lyapunov": null,
+ "grad_norm": 0.6075907586779873,
+ "grad_max_sv": 0.40464401319622995,
+ "grad_min_sv": 4.5029356776638e-08,
+ "grad_condition": 9144084.308266882,
+ "lr": 0.0006840622763423391,
+ "time_sec": 15.306779623031616
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.2488733386993408,
+ "train_acc": 0.91114,
+ "test_loss": 0.5380938538551331,
+ "test_acc": 0.8325,
+ "lyapunov": null,
+ "grad_norm": 0.6071846116294305,
+ "grad_max_sv": 0.3960565410554409,
+ "grad_min_sv": 4.6051877067299075e-08,
+ "grad_condition": 8601152.95310002,
+ "lr": 0.0006693689601226458,
+ "time_sec": 15.341014862060547
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.24494112944602967,
+ "train_acc": 0.91272,
+ "test_loss": 0.5513611147403717,
+ "test_acc": 0.8299,
+ "lyapunov": null,
+ "grad_norm": 0.592226155692726,
+ "grad_max_sv": 0.3729955680668354,
+ "grad_min_sv": 4.293505284636012e-08,
+ "grad_condition": 8794710.30872355,
+ "lr": 0.0006545084971874737,
+ "time_sec": 15.389995813369751
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.23727083059310913,
+ "train_acc": 0.9153,
+ "test_loss": 0.516801796245575,
+ "test_acc": 0.8461,
+ "lyapunov": null,
+ "grad_norm": 0.5812900748217327,
+ "grad_max_sv": 0.38579080179333686,
+ "grad_min_sv": 4.4259539766500214e-08,
+ "grad_condition": 8748753.244401883,
+ "lr": 0.0006394955530196147,
+ "time_sec": 15.318362474441528
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.22481181490898133,
+ "train_acc": 0.92022,
+ "test_loss": 0.5416705925941467,
+ "test_acc": 0.8322,
+ "lyapunov": null,
+ "grad_norm": 0.5619779097810216,
+ "grad_max_sv": 0.35356797464191914,
+ "grad_min_sv": 4.2614826689657547e-08,
+ "grad_condition": 8335709.16485816,
+ "lr": 0.0006243449435824273,
+ "time_sec": 15.315505743026733
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.22531912160873413,
+ "train_acc": 0.9199,
+ "test_loss": 0.5833574778556824,
+ "test_acc": 0.8338,
+ "lyapunov": null,
+ "grad_norm": 0.557199013327348,
+ "grad_max_sv": 0.33938006646931174,
+ "grad_min_sv": 4.300346327923421e-08,
+ "grad_condition": 7932422.911212927,
+ "lr": 0.0006090716206982714,
+ "time_sec": 15.32206392288208
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.216223452000618,
+ "train_acc": 0.92378,
+ "test_loss": 0.5012358224868775,
+ "test_acc": 0.8491,
+ "lyapunov": null,
+ "grad_norm": 0.5383308349401124,
+ "grad_max_sv": 0.3396204937249422,
+ "grad_min_sv": 4.201267005399245e-08,
+ "grad_condition": 8110585.992247519,
+ "lr": 0.0005936906572928625,
+ "time_sec": 15.314954042434692
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.21238275866508483,
+ "train_acc": 0.92506,
+ "test_loss": 0.5394745681762695,
+ "test_acc": 0.8426,
+ "lyapunov": null,
+ "grad_norm": 0.5338537929467614,
+ "grad_max_sv": 0.34414798244833944,
+ "grad_min_sv": 4.2673109312829635e-08,
+ "grad_condition": 8155102.629835799,
+ "lr": 0.0005782172325201156,
+ "time_sec": 15.313148975372314
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.2043999564409256,
+ "train_acc": 0.9264,
+ "test_loss": 0.4982535705089569,
+ "test_acc": 0.851,
+ "lyapunov": null,
+ "grad_norm": 0.518001070564685,
+ "grad_max_sv": 0.3181751623749733,
+ "grad_min_sv": 4.258852284166892e-08,
+ "grad_condition": 7586177.211236173,
+ "lr": 0.0005626666167821523,
+ "time_sec": 15.31693696975708
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.19748862716674806,
+ "train_acc": 0.93056,
+ "test_loss": 0.511198134803772,
+ "test_acc": 0.8512,
+ "lyapunov": null,
+ "grad_norm": 0.5066091467854666,
+ "grad_max_sv": 0.3097307480871677,
+ "grad_min_sv": 4.0578768167875976e-08,
+ "grad_condition": 7694719.511876054,
+ "lr": 0.0005470541566592572,
+ "time_sec": 15.311876773834229
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.18840614411354065,
+ "train_acc": 0.93296,
+ "test_loss": 0.5223799973011017,
+ "test_acc": 0.8486,
+ "lyapunov": null,
+ "grad_norm": 0.4947799501006328,
+ "grad_max_sv": 0.32398409508168696,
+ "grad_min_sv": 3.967475805666254e-08,
+ "grad_condition": 8181991.0382896485,
+ "lr": 0.0005313952597646569,
+ "time_sec": 15.324450016021729
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.1852111140346527,
+ "train_acc": 0.93434,
+ "test_loss": 0.5372783863067627,
+ "test_acc": 0.8442,
+ "lyapunov": null,
+ "grad_norm": 0.49013002688624263,
+ "grad_max_sv": 0.3128523100167513,
+ "grad_min_sv": 4.042725132435976e-08,
+ "grad_condition": 7786375.414612537,
+ "lr": 0.0005157053795390643,
+ "time_sec": 15.311121940612793
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.17850845782279967,
+ "train_acc": 0.9363,
+ "test_loss": 0.5162768915176391,
+ "test_acc": 0.8514,
+ "lyapunov": null,
+ "grad_norm": 0.4757476361255021,
+ "grad_max_sv": 0.3146433509886265,
+ "grad_min_sv": 3.966314778836022e-08,
+ "grad_condition": 7931529.673702802,
+ "lr": 0.0005000000000000002,
+ "time_sec": 15.3083016872406
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.17266313230514527,
+ "train_acc": 0.9392,
+ "test_loss": 0.5169307453155517,
+ "test_acc": 0.8514,
+ "lyapunov": null,
+ "grad_norm": 0.47267825902613214,
+ "grad_max_sv": 0.30655047073960306,
+ "grad_min_sv": 3.728870501262804e-08,
+ "grad_condition": 8340291.307145154,
+ "lr": 0.00048429462046093607,
+ "time_sec": 15.306477308273315
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.1663313666152954,
+ "train_acc": 0.94122,
+ "test_loss": 0.5442662063598633,
+ "test_acc": 0.8474,
+ "lyapunov": null,
+ "grad_norm": 0.46294043228921017,
+ "grad_max_sv": 0.31195108480751516,
+ "grad_min_sv": 3.8414651104545784e-08,
+ "grad_condition": 8124213.069898104,
+ "lr": 0.0004686047402353435,
+ "time_sec": 15.31308388710022
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.16149800906658174,
+ "train_acc": 0.94246,
+ "test_loss": 0.580558476114273,
+ "test_acc": 0.8416,
+ "lyapunov": null,
+ "grad_norm": 0.4519494684602909,
+ "grad_max_sv": 0.2916812110692263,
+ "grad_min_sv": 3.7287610199499e-08,
+ "grad_condition": 7889287.089630139,
+ "lr": 0.000452945843340743,
+ "time_sec": 15.30961537361145
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.16166152165412903,
+ "train_acc": 0.94208,
+ "test_loss": 0.5555281185150146,
+ "test_acc": 0.8473,
+ "lyapunov": null,
+ "grad_norm": 0.45553329333157905,
+ "grad_max_sv": 0.2948467206209898,
+ "grad_min_sv": 3.7315171308449634e-08,
+ "grad_condition": 7971105.5751351025,
+ "lr": 0.00043733338321784806,
+ "time_sec": 15.302156925201416
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.1565243923521042,
+ "train_acc": 0.94508,
+ "test_loss": 0.5074358646392823,
+ "test_acc": 0.8554,
+ "lyapunov": null,
+ "grad_norm": 0.4482394365745094,
+ "grad_max_sv": 0.2973413269966841,
+ "grad_min_sv": 3.757956048566768e-08,
+ "grad_condition": 8002347.089848238,
+ "lr": 0.0004217827674798847,
+ "time_sec": 15.313871145248413
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.14638519546031953,
+ "train_acc": 0.94786,
+ "test_loss": 0.4880453747272491,
+ "test_acc": 0.8653,
+ "lyapunov": null,
+ "grad_norm": 0.4314707571224286,
+ "grad_max_sv": 0.2860257361084223,
+ "grad_min_sv": 3.907978447514893e-08,
+ "grad_condition": 7325521.391552436,
+ "lr": 0.00040630934270713783,
+ "time_sec": 15.315257549285889
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.14646475307941437,
+ "train_acc": 0.94766,
+ "test_loss": 0.576962650680542,
+ "test_acc": 0.847,
+ "lyapunov": null,
+ "grad_norm": 0.4344661359835185,
+ "grad_max_sv": 0.27631179951131346,
+ "grad_min_sv": 3.824539080987677e-08,
+ "grad_condition": 7229591.786889655,
+ "lr": 0.000390928379301729,
+ "time_sec": 15.307274341583252
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.13712914622783662,
+ "train_acc": 0.95096,
+ "test_loss": 0.577113539648056,
+ "test_acc": 0.8499,
+ "lyapunov": null,
+ "grad_norm": 0.42148317642657124,
+ "grad_max_sv": 0.2975440930575132,
+ "grad_min_sv": 3.797022123386284e-08,
+ "grad_condition": 7915512.058803884,
+ "lr": 0.0003756550564175727,
+ "time_sec": 15.30914568901062
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.13448802095890044,
+ "train_acc": 0.95234,
+ "test_loss": 0.5032788132190704,
+ "test_acc": 0.8625,
+ "lyapunov": null,
+ "grad_norm": 0.4112977684378401,
+ "grad_max_sv": 0.2814919870346785,
+ "grad_min_sv": 3.85102704836271e-08,
+ "grad_condition": 7377336.951999759,
+ "lr": 0.00036050444698038553,
+ "time_sec": 15.317845106124878
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.13363940123558044,
+ "train_acc": 0.952,
+ "test_loss": 0.5432449889659882,
+ "test_acc": 0.854,
+ "lyapunov": null,
+ "grad_norm": 0.4126784436246539,
+ "grad_max_sv": 0.2804244253784418,
+ "grad_min_sv": 3.7023297405625045e-08,
+ "grad_condition": 7621956.91724248,
+ "lr": 0.00034549150281252655,
+ "time_sec": 15.322251796722412
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.12653651702404023,
+ "train_acc": 0.9556,
+ "test_loss": 0.49968673663139346,
+ "test_acc": 0.8678,
+ "lyapunov": null,
+ "grad_norm": 0.4007355103640766,
+ "grad_max_sv": 0.27012523673474786,
+ "grad_min_sv": 3.795508094484035e-08,
+ "grad_condition": 7141541.257203001,
+ "lr": 0.0003306310398773544,
+ "time_sec": 15.314436435699463
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.12188665760755539,
+ "train_acc": 0.9566,
+ "test_loss": 0.5593991501808167,
+ "test_acc": 0.8565,
+ "lyapunov": null,
+ "grad_norm": 0.3921398359098778,
+ "grad_max_sv": 0.27338829450309277,
+ "grad_min_sv": 3.639061785243314e-08,
+ "grad_condition": 7584044.263979311,
+ "lr": 0.00031593772365766127,
+ "time_sec": 15.302758693695068
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.1223608536529541,
+ "train_acc": 0.95622,
+ "test_loss": 0.5149862161636353,
+ "test_acc": 0.8612,
+ "lyapunov": null,
+ "grad_norm": 0.39447951861080405,
+ "grad_max_sv": 0.2628227811306715,
+ "grad_min_sv": 3.7084175330548416e-08,
+ "grad_condition": 7085494.638547185,
+ "lr": 0.0003014260546826097,
+ "time_sec": 15.300389051437378
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.11717436948299408,
+ "train_acc": 0.95768,
+ "test_loss": 0.5029231981754303,
+ "test_acc": 0.8645,
+ "lyapunov": null,
+ "grad_norm": 0.3837842917710247,
+ "grad_max_sv": 0.2503308400511742,
+ "grad_min_sv": 3.676226967286311e-08,
+ "grad_condition": 6852674.209660569,
+ "lr": 0.0002871103542174637,
+ "time_sec": 15.306849479675293
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.1104171419763565,
+ "train_acc": 0.96138,
+ "test_loss": 0.5105278373241424,
+ "test_acc": 0.8621,
+ "lyapunov": null,
+ "grad_norm": 0.37324824392122696,
+ "grad_max_sv": 0.24798878654837608,
+ "grad_min_sv": 3.5933988673519934e-08,
+ "grad_condition": 6928104.161500673,
+ "lr": 0.0002730047501302267,
+ "time_sec": 15.306128978729248
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.11005497314453125,
+ "train_acc": 0.9604,
+ "test_loss": 0.5454881217956543,
+ "test_acc": 0.8593,
+ "lyapunov": null,
+ "grad_norm": 0.3740796827280413,
+ "grad_max_sv": 0.25094335451722144,
+ "grad_min_sv": 3.760543059172505e-08,
+ "grad_condition": 6680130.259128613,
+ "lr": 0.00025912316294914234,
+ "time_sec": 15.311371803283691
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.1054667473077774,
+ "train_acc": 0.96206,
+ "test_loss": 0.5242725006103516,
+ "test_acc": 0.8654,
+ "lyapunov": null,
+ "grad_norm": 0.368892738378212,
+ "grad_max_sv": 0.25266984924674035,
+ "grad_min_sv": 3.633599621188921e-08,
+ "grad_condition": 7013352.02049877,
+ "lr": 0.0002454792921248144,
+ "time_sec": 15.30515193939209
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.10004293047904968,
+ "train_acc": 0.96412,
+ "test_loss": 0.5743433611869811,
+ "test_acc": 0.8538,
+ "lyapunov": null,
+ "grad_norm": 0.3572601369548122,
+ "grad_max_sv": 0.24928448162972927,
+ "grad_min_sv": 3.5534662101710524e-08,
+ "grad_condition": 7054160.907809177,
+ "lr": 0.00023208660251050164,
+ "time_sec": 15.31411099433899
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.09898206293821335,
+ "train_acc": 0.96434,
+ "test_loss": 0.5453432657718659,
+ "test_acc": 0.8647,
+ "lyapunov": null,
+ "grad_norm": 0.3575462219401736,
+ "grad_max_sv": 0.22338325902819633,
+ "grad_min_sv": 3.5619033011968784e-08,
+ "grad_condition": 6388845.433191194,
+ "lr": 0.00021895831107393473,
+ "time_sec": 15.320244789123535
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.09576731202960015,
+ "train_acc": 0.96662,
+ "test_loss": 0.5289871492862701,
+ "test_acc": 0.8673,
+ "lyapunov": null,
+ "grad_norm": 0.3475548635629844,
+ "grad_max_sv": 0.22887863107025624,
+ "grad_min_sv": 3.558577605922153e-08,
+ "grad_condition": 6520932.801253774,
+ "lr": 0.00020610737385376356,
+ "time_sec": 15.312981367111206
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.09435438349246979,
+ "train_acc": 0.96552,
+ "test_loss": 0.5673801244735718,
+ "test_acc": 0.8597,
+ "lyapunov": null,
+ "grad_norm": 0.35002047617094667,
+ "grad_max_sv": 0.24012817665934563,
+ "grad_min_sv": 3.424292120968175e-08,
+ "grad_condition": 7037803.21914607,
+ "lr": 0.00019354647317351177,
+ "time_sec": 15.323097705841064
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.0899286351108551,
+ "train_acc": 0.96766,
+ "test_loss": 0.5408580667495727,
+ "test_acc": 0.8662,
+ "lyapunov": null,
+ "grad_norm": 0.34100528699001653,
+ "grad_max_sv": 0.22443376183509828,
+ "grad_min_sv": 3.460758826179244e-08,
+ "grad_condition": 6548190.204110672,
+ "lr": 0.0001812880051256552,
+ "time_sec": 15.303936243057251
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.08644640971183777,
+ "train_acc": 0.9696,
+ "test_loss": 0.5231532414436341,
+ "test_acc": 0.8687,
+ "lyapunov": null,
+ "grad_norm": 0.3297853844853395,
+ "grad_max_sv": 0.23831307105720043,
+ "grad_min_sv": 3.648763895469642e-08,
+ "grad_condition": 6564265.399345921,
+ "lr": 0.00016934406733817422,
+ "time_sec": 15.323826313018799
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.08675267961740493,
+ "train_acc": 0.96966,
+ "test_loss": 0.531370454120636,
+ "test_acc": 0.8724,
+ "lyapunov": null,
+ "grad_norm": 0.33474921077291964,
+ "grad_max_sv": 0.23228033129125833,
+ "grad_min_sv": 3.54595965035287e-08,
+ "grad_condition": 6646670.669053013,
+ "lr": 0.0001577264470356557,
+ "time_sec": 15.305448532104492
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.08520255417346954,
+ "train_acc": 0.96946,
+ "test_loss": 0.5489996848106384,
+ "test_acc": 0.8629,
+ "lyapunov": null,
+ "grad_norm": 0.333062577424503,
+ "grad_max_sv": 0.23861498832702638,
+ "grad_min_sv": 3.416034828340742e-08,
+ "grad_condition": 7057996.098654354,
+ "lr": 0.00014644660940672634,
+ "time_sec": 15.307157516479492
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.08347911696434021,
+ "train_acc": 0.97006,
+ "test_loss": 0.5250146618843079,
+ "test_acc": 0.8686,
+ "lyapunov": null,
+ "grad_norm": 0.3315871550000043,
+ "grad_max_sv": 0.23978985324501992,
+ "grad_min_sv": 3.5313697566152766e-08,
+ "grad_condition": 6836692.7541990755,
+ "lr": 0.0001355156862892944,
+ "time_sec": 15.2927827835083
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.08182602140903474,
+ "train_acc": 0.97104,
+ "test_loss": 0.5350998015880585,
+ "test_acc": 0.8704,
+ "lyapunov": null,
+ "grad_norm": 0.3273538350101595,
+ "grad_max_sv": 0.23843283373862506,
+ "grad_min_sv": 3.504422023681286e-08,
+ "grad_condition": 6836027.998268524,
+ "lr": 0.00012494446518477025,
+ "time_sec": 15.317047834396362
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.07884973392605782,
+ "train_acc": 0.9722,
+ "test_loss": 0.543610359621048,
+ "test_acc": 0.869,
+ "lyapunov": null,
+ "grad_norm": 0.318085721614815,
+ "grad_max_sv": 0.2306290850043297,
+ "grad_min_sv": 3.51138401910589e-08,
+ "grad_condition": 6598865.01839647,
+ "lr": 0.00011474337861210548,
+ "time_sec": 15.346408605575562
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.07515444636344909,
+ "train_acc": 0.97302,
+ "test_loss": 0.5453424057006836,
+ "test_acc": 0.8685,
+ "lyapunov": null,
+ "grad_norm": 0.30764732453726595,
+ "grad_max_sv": 0.23328058049082756,
+ "grad_min_sv": 3.4018917194345025e-08,
+ "grad_condition": 6898312.859708968,
+ "lr": 0.00010492249381215483,
+ "time_sec": 15.312849998474121
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.07553981874942779,
+ "train_acc": 0.97342,
+ "test_loss": 0.5447598055839539,
+ "test_acc": 0.8687,
+ "lyapunov": null,
+ "grad_norm": 0.3126827627293077,
+ "grad_max_sv": 0.22440926413983106,
+ "grad_min_sv": 3.5051727831358904e-08,
+ "grad_condition": 6508990.801328001,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 15.31579327583313
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.0691981615459919,
+ "train_acc": 0.9767,
+ "test_loss": 0.6010801038742065,
+ "test_acc": 0.8592,
+ "lyapunov": null,
+ "grad_norm": 0.2964655372784287,
+ "grad_max_sv": 0.20926067158579825,
+ "grad_min_sv": 3.334633209561844e-08,
+ "grad_condition": 6336645.734981732,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 15.311565399169922
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.07134237255096436,
+ "train_acc": 0.97564,
+ "test_loss": 0.5511228674888611,
+ "test_acc": 0.8685,
+ "lyapunov": null,
+ "grad_norm": 0.3035210287863858,
+ "grad_max_sv": 0.2166539143770933,
+ "grad_min_sv": 3.444789098416834e-08,
+ "grad_condition": 6316501.5285459785,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 15.321164846420288
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.06894262619018554,
+ "train_acc": 0.97574,
+ "test_loss": 0.5341768414020538,
+ "test_acc": 0.8666,
+ "lyapunov": null,
+ "grad_norm": 0.3006016750160245,
+ "grad_max_sv": 0.214569428935647,
+ "grad_min_sv": 3.390297984573465e-08,
+ "grad_condition": 6347736.579489769,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 15.31421685218811
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.06843596329629421,
+ "train_acc": 0.97558,
+ "test_loss": 0.5208944204807282,
+ "test_acc": 0.8703,
+ "lyapunov": null,
+ "grad_norm": 0.2931609715468412,
+ "grad_max_sv": 0.2041362512856722,
+ "grad_min_sv": 3.608063616766799e-08,
+ "grad_condition": 5852493.960090882,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 15.313952445983887
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.06798111920118331,
+ "train_acc": 0.97708,
+ "test_loss": 0.5408778586387635,
+ "test_acc": 0.869,
+ "lyapunov": null,
+ "grad_norm": 0.2949462881166867,
+ "grad_max_sv": 0.2191694311797619,
+ "grad_min_sv": 3.3161099466383345e-08,
+ "grad_condition": 6683084.915046187,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 15.323522567749023
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.06374187029123306,
+ "train_acc": 0.97854,
+ "test_loss": 0.534241654920578,
+ "test_acc": 0.8701,
+ "lyapunov": null,
+ "grad_norm": 0.28381214745100436,
+ "grad_max_sv": 0.21770549267530442,
+ "grad_min_sv": 3.4639007706616096e-08,
+ "grad_condition": 6392279.068014438,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 15.312573432922363
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.06471459998726845,
+ "train_acc": 0.97748,
+ "test_loss": 0.5297845101356506,
+ "test_acc": 0.8726,
+ "lyapunov": null,
+ "grad_norm": 0.28897487313019665,
+ "grad_max_sv": 0.19332378804683686,
+ "grad_min_sv": 3.343392815935431e-08,
+ "grad_condition": 5824270.640002059,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 15.310936450958252
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.06347171569228173,
+ "train_acc": 0.97814,
+ "test_loss": 0.5321846860408783,
+ "test_acc": 0.8722,
+ "lyapunov": null,
+ "grad_norm": 0.2861217885894181,
+ "grad_max_sv": 0.18890463691204787,
+ "grad_min_sv": 3.443075908826643e-08,
+ "grad_condition": 5578610.167209303,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 15.30883502960205
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.06456126765966415,
+ "train_acc": 0.97732,
+ "test_loss": 0.5306058297157288,
+ "test_acc": 0.8724,
+ "lyapunov": null,
+ "grad_norm": 0.2911671580013793,
+ "grad_max_sv": 0.20169610902667046,
+ "grad_min_sv": 3.3340199756537456e-08,
+ "grad_condition": 6113921.310843622,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 15.325217247009277
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.05981739419221878,
+ "train_acc": 0.97936,
+ "test_loss": 0.5510406871795654,
+ "test_acc": 0.8698,
+ "lyapunov": null,
+ "grad_norm": 0.27406962038993515,
+ "grad_max_sv": 0.20393476765602828,
+ "grad_min_sv": 3.436182409721766e-08,
+ "grad_condition": 6006804.61096659,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 15.308394432067871
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.05843851445674896,
+ "train_acc": 0.97988,
+ "test_loss": 0.5369569517612457,
+ "test_acc": 0.8726,
+ "lyapunov": null,
+ "grad_norm": 0.270215680703968,
+ "grad_max_sv": 0.19462423361837863,
+ "grad_min_sv": 3.2800926286213895e-08,
+ "grad_condition": 5976870.852957519,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 15.312544584274292
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.06141342503786087,
+ "train_acc": 0.9789,
+ "test_loss": 0.5492124430656433,
+ "test_acc": 0.8715,
+ "lyapunov": null,
+ "grad_norm": 0.28355491226552393,
+ "grad_max_sv": 0.20141606461256742,
+ "grad_min_sv": 3.389024190170176e-08,
+ "grad_condition": 6025484.075561702,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 15.318751096725464
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.06185958398580551,
+ "train_acc": 0.9791,
+ "test_loss": 0.5353557282447815,
+ "test_acc": 0.8734,
+ "lyapunov": null,
+ "grad_norm": 0.28019086696986784,
+ "grad_max_sv": 0.20358563121408224,
+ "grad_min_sv": 3.4872499954374805e-08,
+ "grad_condition": 5972181.870711091,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 15.310726404190063
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.061077375268936154,
+ "train_acc": 0.97862,
+ "test_loss": 0.5403136486530304,
+ "test_acc": 0.8726,
+ "lyapunov": null,
+ "grad_norm": 0.27793458972654056,
+ "grad_max_sv": 0.21468139700591565,
+ "grad_min_sv": 3.314470546911252e-08,
+ "grad_condition": 6531953.716980138,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 15.322482585906982
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.059067166829109195,
+ "train_acc": 0.9801,
+ "test_loss": 0.5499792334079743,
+ "test_acc": 0.8706,
+ "lyapunov": null,
+ "grad_norm": 0.2726950869177449,
+ "grad_max_sv": 0.1847312103956938,
+ "grad_min_sv": 3.442832863242984e-08,
+ "grad_condition": 5484378.490748374,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 15.331462860107422
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.058869197854995725,
+ "train_acc": 0.97992,
+ "test_loss": 0.5609679688453675,
+ "test_acc": 0.8699,
+ "lyapunov": null,
+ "grad_norm": 0.2733600212103379,
+ "grad_max_sv": 0.203422649204731,
+ "grad_min_sv": 3.4962690476092464e-08,
+ "grad_condition": 5877045.15462194,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 15.318592071533203
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.05934914319038391,
+ "train_acc": 0.97972,
+ "test_loss": 0.5556031215667725,
+ "test_acc": 0.8687,
+ "lyapunov": null,
+ "grad_norm": 0.2765716324142509,
+ "grad_max_sv": 0.1996933190152049,
+ "grad_min_sv": 3.3284164402402895e-08,
+ "grad_condition": 6129925.740326188,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 15.329679727554321
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.05874215810537338,
+ "train_acc": 0.97992,
+ "test_loss": 0.5451333051681518,
+ "test_acc": 0.8712,
+ "lyapunov": null,
+ "grad_norm": 0.2696205462857481,
+ "grad_max_sv": 0.19026922769844531,
+ "grad_min_sv": 3.324827377859663e-08,
+ "grad_condition": 5756655.141047328,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 15.31182599067688
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.059339061715602874,
+ "train_acc": 0.98046,
+ "test_loss": 0.5511723966598511,
+ "test_acc": 0.8694,
+ "lyapunov": null,
+ "grad_norm": 0.2722387278016211,
+ "grad_max_sv": 0.17949199080467224,
+ "grad_min_sv": 3.178271090753526e-08,
+ "grad_condition": 5671386.367227938,
+ "lr": 2.467198171342e-07,
+ "time_sec": 15.313301801681519
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.05937783687353134,
+ "train_acc": 0.97908,
+ "test_loss": 0.5341217585086823,
+ "test_acc": 0.8723,
+ "lyapunov": null,
+ "grad_norm": 0.275408042809645,
+ "grad_max_sv": 0.19940215721726418,
+ "grad_min_sv": 3.299201711826072e-08,
+ "grad_condition": 6121670.713258359,
+ "lr": 0.0,
+ "time_sec": 15.337401151657104
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 2.1551968896484377,
+ "train_acc": 0.2953,
+ "test_loss": 1.8477057243347168,
+ "test_acc": 0.3437,
+ "lyapunov": null,
+ "grad_norm": 8.144943624656428,
+ "grad_max_sv": 7.675079941749573,
+ "grad_min_sv": 2.827612160416493e-07,
+ "grad_condition": 28317355.270070046,
+ "lr": 0.0009997532801828658,
+ "time_sec": 32.46485447883606
+ },
+ {
+ "epoch": 2,
+ "train_loss": 1.6082625040054321,
+ "train_acc": 0.42284,
+ "test_loss": 1.6673745800018311,
+ "test_acc": 0.406,
+ "lyapunov": null,
+ "grad_norm": 6.065037474589551,
+ "grad_max_sv": 5.5711340546607975,
+ "grad_min_sv": 2.234880795981553e-07,
+ "grad_condition": 25327173.99046154,
+ "lr": 0.0009990133642141358,
+ "time_sec": 32.39758110046387
+ },
+ {
+ "epoch": 3,
+ "train_loss": 1.4377277154159547,
+ "train_acc": 0.48488,
+ "test_loss": 1.5402760635375976,
+ "test_acc": 0.4555,
+ "lyapunov": null,
+ "grad_norm": 5.494687491087257,
+ "grad_max_sv": 4.691517299413681,
+ "grad_min_sv": 1.9618108950680835e-07,
+ "grad_condition": 24150344.903272796,
+ "lr": 0.00099778098230154,
+ "time_sec": 32.400826930999756
+ },
+ {
+ "epoch": 4,
+ "train_loss": 1.2879639573669435,
+ "train_acc": 0.53716,
+ "test_loss": 1.8371749683380127,
+ "test_acc": 0.4098,
+ "lyapunov": null,
+ "grad_norm": 4.741620609793776,
+ "grad_max_sv": 4.525534170866012,
+ "grad_min_sv": 1.8297150106150184e-07,
+ "grad_condition": 24870782.059164062,
+ "lr": 0.000996057350657239,
+ "time_sec": 32.39713406562805
+ },
+ {
+ "epoch": 5,
+ "train_loss": 1.196011114768982,
+ "train_acc": 0.5717,
+ "test_loss": 1.1917746976852417,
+ "test_acc": 0.5662,
+ "lyapunov": null,
+ "grad_norm": 4.225084445671327,
+ "grad_max_sv": 3.8811924695968627,
+ "grad_min_sv": 1.7304786759098079e-07,
+ "grad_condition": 22788363.03168846,
+ "lr": 0.0009938441702975688,
+ "time_sec": 32.39927625656128
+ },
+ {
+ "epoch": 6,
+ "train_loss": 1.1017011584854126,
+ "train_acc": 0.60624,
+ "test_loss": 1.2156044723510742,
+ "test_acc": 0.5524,
+ "lyapunov": null,
+ "grad_norm": 3.8500733224578765,
+ "grad_max_sv": 3.3867243230342865,
+ "grad_min_sv": 1.5910630946081028e-07,
+ "grad_condition": 21517993.207089722,
+ "lr": 0.0009911436253643444,
+ "time_sec": 32.41104435920715
+ },
+ {
+ "epoch": 7,
+ "train_loss": 1.019956372566223,
+ "train_acc": 0.63884,
+ "test_loss": 1.0341911317825316,
+ "test_acc": 0.6312,
+ "lyapunov": null,
+ "grad_norm": 3.4050623209558424,
+ "grad_max_sv": 2.8642074435949327,
+ "grad_min_sv": 1.3970929391149411e-07,
+ "grad_condition": 20503012.26948414,
+ "lr": 0.0009879583809693736,
+ "time_sec": 32.39900183677673
+ },
+ {
+ "epoch": 8,
+ "train_loss": 0.952932172832489,
+ "train_acc": 0.66154,
+ "test_loss": 0.9561027820587158,
+ "test_acc": 0.6654,
+ "lyapunov": null,
+ "grad_norm": 3.069081296040065,
+ "grad_max_sv": 2.5316490083932877,
+ "grad_min_sv": 1.2806189264580325e-07,
+ "grad_condition": 19934874.23822563,
+ "lr": 0.0009842915805643154,
+ "time_sec": 32.39242911338806
+ },
+ {
+ "epoch": 9,
+ "train_loss": 0.8849921081352234,
+ "train_acc": 0.68628,
+ "test_loss": 1.0301121936798097,
+ "test_acc": 0.6342,
+ "lyapunov": null,
+ "grad_norm": 2.63645918277651,
+ "grad_max_sv": 2.232751601934433,
+ "grad_min_sv": 1.2227004724252312e-07,
+ "grad_condition": 18401740.489395566,
+ "lr": 0.0009801468428384714,
+ "time_sec": 32.409496545791626
+ },
+ {
+ "epoch": 10,
+ "train_loss": 0.8236279186630249,
+ "train_acc": 0.70854,
+ "test_loss": 0.8807288621902466,
+ "test_acc": 0.682,
+ "lyapunov": null,
+ "grad_norm": 2.300239690915013,
+ "grad_max_sv": 1.9658639460802079,
+ "grad_min_sv": 1.1437598530505966e-07,
+ "grad_condition": 17605252.06510754,
+ "lr": 0.0009755282581475767,
+ "time_sec": 32.40023136138916
+ },
+ {
+ "epoch": 11,
+ "train_loss": 0.788265288658142,
+ "train_acc": 0.72186,
+ "test_loss": 0.8550062474250794,
+ "test_acc": 0.6904,
+ "lyapunov": null,
+ "grad_norm": 2.12020034951075,
+ "grad_max_sv": 1.6186737358570098,
+ "grad_min_sv": 1.0332133957291489e-07,
+ "grad_condition": 15780748.729030486,
+ "lr": 0.0009704403844771127,
+ "time_sec": 32.40667533874512
+ },
+ {
+ "epoch": 12,
+ "train_loss": 0.7433690148735046,
+ "train_acc": 0.73772,
+ "test_loss": 0.8008458862304687,
+ "test_acc": 0.7171,
+ "lyapunov": null,
+ "grad_norm": 1.8897751819834427,
+ "grad_max_sv": 1.448184822499752,
+ "grad_min_sv": 9.324852872083511e-08,
+ "grad_condition": 15545592.26156075,
+ "lr": 0.0009648882429441257,
+ "time_sec": 32.4004065990448
+ },
+ {
+ "epoch": 13,
+ "train_loss": 0.7159804575920105,
+ "train_acc": 0.74844,
+ "test_loss": 0.8449424732208252,
+ "test_acc": 0.7107,
+ "lyapunov": null,
+ "grad_norm": 1.7162684736286458,
+ "grad_max_sv": 1.387939277291298,
+ "grad_min_sv": 9.02613965791943e-08,
+ "grad_condition": 15516859.545498159,
+ "lr": 0.0009588773128419905,
+ "time_sec": 32.39161419868469
+ },
+ {
+ "epoch": 14,
+ "train_loss": 0.6710689739608765,
+ "train_acc": 0.7652,
+ "test_loss": 0.8030969514846802,
+ "test_acc": 0.7199,
+ "lyapunov": null,
+ "grad_norm": 1.5415310022642745,
+ "grad_max_sv": 1.124143162369728,
+ "grad_min_sv": 7.788519358342683e-08,
+ "grad_condition": 14586378.513744438,
+ "lr": 0.0009524135262330098,
+ "time_sec": 32.40552067756653
+ },
+ {
+ "epoch": 15,
+ "train_loss": 0.6438176040267944,
+ "train_acc": 0.77396,
+ "test_loss": 0.7497868657112121,
+ "test_acc": 0.7401,
+ "lyapunov": null,
+ "grad_norm": 1.4186644873786285,
+ "grad_max_sv": 1.0314671725034714,
+ "grad_min_sv": 7.5272734179066e-08,
+ "grad_condition": 13653093.352212925,
+ "lr": 0.0009455032620941839,
+ "time_sec": 32.40474534034729
+ },
+ {
+ "epoch": 16,
+ "train_loss": 0.615869576702118,
+ "train_acc": 0.7829,
+ "test_loss": 0.7672984195709228,
+ "test_acc": 0.7337,
+ "lyapunov": null,
+ "grad_norm": 1.2847059491767132,
+ "grad_max_sv": 0.8981582961976529,
+ "grad_min_sv": 7.069710665774664e-08,
+ "grad_condition": 12774971.99569363,
+ "lr": 0.0009381533400219318,
+ "time_sec": 32.411378145217896
+ },
+ {
+ "epoch": 17,
+ "train_loss": 0.5916317593765259,
+ "train_acc": 0.79332,
+ "test_loss": 0.6773865149497986,
+ "test_acc": 0.7673,
+ "lyapunov": null,
+ "grad_norm": 1.1905850089737686,
+ "grad_max_sv": 0.8305475980043411,
+ "grad_min_sv": 6.581527465243652e-08,
+ "grad_condition": 12649477.259974267,
+ "lr": 0.0009303710135019719,
+ "time_sec": 32.40375375747681
+ },
+ {
+ "epoch": 18,
+ "train_loss": 0.5710988390541076,
+ "train_acc": 0.80148,
+ "test_loss": 0.6730817820549011,
+ "test_acc": 0.7658,
+ "lyapunov": null,
+ "grad_norm": 1.1184745092261044,
+ "grad_max_sv": 0.8092691361904144,
+ "grad_min_sv": 6.20087442726458e-08,
+ "grad_condition": 13237272.581055809,
+ "lr": 0.0009221639627510076,
+ "time_sec": 32.403624534606934
+ },
+ {
+ "epoch": 19,
+ "train_loss": 0.5524461611747742,
+ "train_acc": 0.80704,
+ "test_loss": 0.7162760413169861,
+ "test_acc": 0.7602,
+ "lyapunov": null,
+ "grad_norm": 1.023562615452227,
+ "grad_max_sv": 0.6794823326170445,
+ "grad_min_sv": 5.88299432280337e-08,
+ "grad_condition": 11704217.317878243,
+ "lr": 0.000913540287137281,
+ "time_sec": 32.39382600784302
+ },
+ {
+ "epoch": 20,
+ "train_loss": 0.5298428584098815,
+ "train_acc": 0.81452,
+ "test_loss": 0.7450216589927673,
+ "test_acc": 0.752,
+ "lyapunov": null,
+ "grad_norm": 0.9359144343942514,
+ "grad_max_sv": 0.5905756287276744,
+ "grad_min_sv": 5.571528873815623e-08,
+ "grad_condition": 10693233.182217773,
+ "lr": 0.0009045084971874739,
+ "time_sec": 32.40094780921936
+ },
+ {
+ "epoch": 21,
+ "train_loss": 0.5077325123977661,
+ "train_acc": 0.82174,
+ "test_loss": 0.63943037815094,
+ "test_acc": 0.7812,
+ "lyapunov": null,
+ "grad_norm": 0.8805285251076611,
+ "grad_max_sv": 0.615053903311491,
+ "grad_min_sv": 5.4429192175575734e-08,
+ "grad_condition": 11327012.575821584,
+ "lr": 0.0008950775061878452,
+ "time_sec": 32.38740086555481
+ },
+ {
+ "epoch": 22,
+ "train_loss": 0.4933246819114685,
+ "train_acc": 0.8259,
+ "test_loss": 0.718407027053833,
+ "test_acc": 0.7614,
+ "lyapunov": null,
+ "grad_norm": 0.8303617086611039,
+ "grad_max_sv": 0.5229416653513909,
+ "grad_min_sv": 5.0371477122723717e-08,
+ "grad_condition": 10417728.60900723,
+ "lr": 0.0008852566213878947,
+ "time_sec": 32.404406785964966
+ },
+ {
+ "epoch": 23,
+ "train_loss": 0.47660592782020567,
+ "train_acc": 0.83498,
+ "test_loss": 0.6119730060577393,
+ "test_acc": 0.7951,
+ "lyapunov": null,
+ "grad_norm": 0.7772569962051041,
+ "grad_max_sv": 0.5228113703429699,
+ "grad_min_sv": 4.883190189985953e-08,
+ "grad_condition": 10840281.592058718,
+ "lr": 0.0008750555348152298,
+ "time_sec": 32.41756844520569
+ },
+ {
+ "epoch": 24,
+ "train_loss": 0.4621484722900391,
+ "train_acc": 0.8354,
+ "test_loss": 0.6255874982833862,
+ "test_acc": 0.7921,
+ "lyapunov": null,
+ "grad_norm": 0.7435129116165293,
+ "grad_max_sv": 0.5028938911855221,
+ "grad_min_sv": 4.940657198915232e-08,
+ "grad_condition": 10262672.7433966,
+ "lr": 0.0008644843137107057,
+ "time_sec": 32.40160775184631
+ },
+ {
+ "epoch": 25,
+ "train_loss": 0.44543547362804414,
+ "train_acc": 0.84322,
+ "test_loss": 0.6244046552658081,
+ "test_acc": 0.8003,
+ "lyapunov": null,
+ "grad_norm": 0.7057766135770664,
+ "grad_max_sv": 0.45453565418720243,
+ "grad_min_sv": 4.47153126970079e-08,
+ "grad_condition": 10235918.99223967,
+ "lr": 0.0008535533905932737,
+ "time_sec": 32.397634983062744
+ },
+ {
+ "epoch": 26,
+ "train_loss": 0.4291659313964844,
+ "train_acc": 0.85028,
+ "test_loss": 0.586253802204132,
+ "test_acc": 0.8053,
+ "lyapunov": null,
+ "grad_norm": 0.6653011352683553,
+ "grad_max_sv": 0.40432176999747754,
+ "grad_min_sv": 4.4079006933372964e-08,
+ "grad_condition": 9263382.4971398,
+ "lr": 0.0008422735529643444,
+ "time_sec": 32.408364057540894
+ },
+ {
+ "epoch": 27,
+ "train_loss": 0.41755434021949767,
+ "train_acc": 0.8537,
+ "test_loss": 0.6190900807380676,
+ "test_acc": 0.8031,
+ "lyapunov": null,
+ "grad_norm": 0.634844213604884,
+ "grad_max_sv": 0.38489293307065964,
+ "grad_min_sv": 4.278397165435877e-08,
+ "grad_condition": 9083713.307072137,
+ "lr": 0.0008306559326618259,
+ "time_sec": 32.3781955242157
+ },
+ {
+ "epoch": 28,
+ "train_loss": 0.409987173576355,
+ "train_acc": 0.85588,
+ "test_loss": 0.6381987627029418,
+ "test_acc": 0.7967,
+ "lyapunov": null,
+ "grad_norm": 0.6208575070285024,
+ "grad_max_sv": 0.3849256232380867,
+ "grad_min_sv": 4.156698754087529e-08,
+ "grad_condition": 9343591.955088045,
+ "lr": 0.0008187119948743449,
+ "time_sec": 32.424397468566895
+ },
+ {
+ "epoch": 29,
+ "train_loss": 0.39254301443099976,
+ "train_acc": 0.86148,
+ "test_loss": 0.6114391220092773,
+ "test_acc": 0.8072,
+ "lyapunov": null,
+ "grad_norm": 0.5930731028782803,
+ "grad_max_sv": 0.35281661339104176,
+ "grad_min_sv": 3.97135552887562e-08,
+ "grad_condition": 8878121.049382607,
+ "lr": 0.0008064535268264883,
+ "time_sec": 32.40766763687134
+ },
+ {
+ "epoch": 30,
+ "train_loss": 0.3785347310256958,
+ "train_acc": 0.86726,
+ "test_loss": 0.6049399808883666,
+ "test_acc": 0.811,
+ "lyapunov": null,
+ "grad_norm": 0.5794796026042499,
+ "grad_max_sv": 0.36831745132803917,
+ "grad_min_sv": 4.032110121343635e-08,
+ "grad_condition": 9212028.38827365,
+ "lr": 0.0007938926261462367,
+ "time_sec": 32.40119290351868
+ },
+ {
+ "epoch": 31,
+ "train_loss": 0.3689020803642273,
+ "train_acc": 0.87034,
+ "test_loss": 0.6224831011772156,
+ "test_acc": 0.8103,
+ "lyapunov": null,
+ "grad_norm": 0.5518777770693967,
+ "grad_max_sv": 0.34497435614466665,
+ "grad_min_sv": 3.993250263789605e-08,
+ "grad_condition": 8691890.072923485,
+ "lr": 0.0007810416889260654,
+ "time_sec": 32.42319178581238
+ },
+ {
+ "epoch": 32,
+ "train_loss": 0.3600490350532532,
+ "train_acc": 0.87378,
+ "test_loss": 0.6563146770000458,
+ "test_acc": 0.7989,
+ "lyapunov": null,
+ "grad_norm": 0.5344416918727563,
+ "grad_max_sv": 0.3161147892475128,
+ "grad_min_sv": 3.79914633530376e-08,
+ "grad_condition": 8391808.948301231,
+ "lr": 0.0007679133974894983,
+ "time_sec": 32.40037226676941
+ },
+ {
+ "epoch": 33,
+ "train_loss": 0.3552369830417633,
+ "train_acc": 0.876,
+ "test_loss": 0.5918597935676575,
+ "test_acc": 0.8191,
+ "lyapunov": null,
+ "grad_norm": 0.5223477954823382,
+ "grad_max_sv": 0.32091905549168587,
+ "grad_min_sv": 3.692389771714488e-08,
+ "grad_condition": 8735655.499988783,
+ "lr": 0.0007545207078751857,
+ "time_sec": 32.39385366439819
+ },
+ {
+ "epoch": 34,
+ "train_loss": 0.3357627202987671,
+ "train_acc": 0.88192,
+ "test_loss": 0.6601162696361542,
+ "test_acc": 0.8074,
+ "lyapunov": null,
+ "grad_norm": 0.5010170887656177,
+ "grad_max_sv": 0.3139246258884668,
+ "grad_min_sv": 3.658822085306213e-08,
+ "grad_condition": 8606732.681616401,
+ "lr": 0.0007408768370508577,
+ "time_sec": 32.40888476371765
+ },
+ {
+ "epoch": 35,
+ "train_loss": 0.32540871870040894,
+ "train_acc": 0.88428,
+ "test_loss": 0.6114396753549576,
+ "test_acc": 0.8112,
+ "lyapunov": null,
+ "grad_norm": 0.4852002465463357,
+ "grad_max_sv": 0.3033136323094368,
+ "grad_min_sv": 3.599271058973841e-08,
+ "grad_condition": 8499862.031601336,
+ "lr": 0.0007269952498697734,
+ "time_sec": 32.40857720375061
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.32421252524375915,
+ "train_acc": 0.8847,
+ "test_loss": 0.6881836595535278,
+ "test_acc": 0.8116,
+ "lyapunov": null,
+ "grad_norm": 0.47585625371919826,
+ "grad_max_sv": 0.28932417593896387,
+ "grad_min_sv": 3.663087517757902e-08,
+ "grad_condition": 7933220.2527872,
+ "lr": 0.0007128896457825364,
+ "time_sec": 32.39529776573181
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.3108924944496155,
+ "train_acc": 0.88942,
+ "test_loss": 0.7008573976516723,
+ "test_acc": 0.8098,
+ "lyapunov": null,
+ "grad_norm": 0.46276747011208014,
+ "grad_max_sv": 0.2795715734362602,
+ "grad_min_sv": 3.448033547570617e-08,
+ "grad_condition": 8262563.079640454,
+ "lr": 0.0006985739453173903,
+ "time_sec": 32.38434648513794
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.31133034090042117,
+ "train_acc": 0.88992,
+ "test_loss": 0.6698009629249573,
+ "test_acc": 0.81,
+ "lyapunov": null,
+ "grad_norm": 0.4586602799362298,
+ "grad_max_sv": 0.2844005227088928,
+ "grad_min_sv": 3.324500559287458e-08,
+ "grad_condition": 8714467.747357922,
+ "lr": 0.0006840622763423391,
+ "time_sec": 32.396021366119385
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.29518098635673523,
+ "train_acc": 0.89552,
+ "test_loss": 0.7677701180458069,
+ "test_acc": 0.7991,
+ "lyapunov": null,
+ "grad_norm": 0.43830085967668675,
+ "grad_max_sv": 0.2725641973316669,
+ "grad_min_sv": 3.3406064270380397e-08,
+ "grad_condition": 8255466.038533419,
+ "lr": 0.0006693689601226458,
+ "time_sec": 32.40195083618164
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.2831247230243683,
+ "train_acc": 0.89996,
+ "test_loss": 0.6842746494293213,
+ "test_acc": 0.8148,
+ "lyapunov": null,
+ "grad_norm": 0.4331819538283316,
+ "grad_max_sv": 0.26449211575090886,
+ "grad_min_sv": 3.399684476157461e-08,
+ "grad_condition": 7879060.46068686,
+ "lr": 0.0006545084971874737,
+ "time_sec": 32.418256521224976
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.27670828733444214,
+ "train_acc": 0.90256,
+ "test_loss": 0.701638517665863,
+ "test_acc": 0.8105,
+ "lyapunov": null,
+ "grad_norm": 0.42402034759846713,
+ "grad_max_sv": 0.26597036607563496,
+ "grad_min_sv": 3.2260157212249396e-08,
+ "grad_condition": 8290157.649110466,
+ "lr": 0.0006394955530196147,
+ "time_sec": 32.40391206741333
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.26722780378341676,
+ "train_acc": 0.90478,
+ "test_loss": 0.676421770954132,
+ "test_acc": 0.8152,
+ "lyapunov": null,
+ "grad_norm": 0.41593559749987674,
+ "grad_max_sv": 0.26356035731732846,
+ "grad_min_sv": 3.2800773563934625e-08,
+ "grad_condition": 8080555.103613043,
+ "lr": 0.0006243449435824273,
+ "time_sec": 32.413851737976074
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.2611290577888489,
+ "train_acc": 0.9069,
+ "test_loss": 0.7091101724147797,
+ "test_acc": 0.8165,
+ "lyapunov": null,
+ "grad_norm": 0.40890139043798995,
+ "grad_max_sv": 0.2530216708779335,
+ "grad_min_sv": 3.0997858102566053e-08,
+ "grad_condition": 8224218.543131987,
+ "lr": 0.0006090716206982714,
+ "time_sec": 32.60969662666321
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.2530948238658905,
+ "train_acc": 0.90982,
+ "test_loss": 0.6961516171455383,
+ "test_acc": 0.8214,
+ "lyapunov": null,
+ "grad_norm": 0.39919304872434885,
+ "grad_max_sv": 0.24201009832322598,
+ "grad_min_sv": 3.264100985056473e-08,
+ "grad_condition": 7496864.741894746,
+ "lr": 0.0005936906572928625,
+ "time_sec": 32.40188717842102
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.23889887328147888,
+ "train_acc": 0.91386,
+ "test_loss": 0.7265622617721558,
+ "test_acc": 0.8196,
+ "lyapunov": null,
+ "grad_norm": 0.39216552760863915,
+ "grad_max_sv": 0.25172842368483545,
+ "grad_min_sv": 3.196390450099784e-08,
+ "grad_condition": 7939664.340514863,
+ "lr": 0.0005782172325201156,
+ "time_sec": 32.40084266662598
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.23805784145355224,
+ "train_acc": 0.91674,
+ "test_loss": 0.6975640031337738,
+ "test_acc": 0.8226,
+ "lyapunov": null,
+ "grad_norm": 0.3825430754006707,
+ "grad_max_sv": 0.23831223957240583,
+ "grad_min_sv": 2.971923072081495e-08,
+ "grad_condition": 8085204.090791678,
+ "lr": 0.0005626666167821523,
+ "time_sec": 32.42257380485535
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.23282361968994142,
+ "train_acc": 0.91824,
+ "test_loss": 0.6992193672657013,
+ "test_acc": 0.8311,
+ "lyapunov": null,
+ "grad_norm": 0.3814486121413188,
+ "grad_max_sv": 0.23424655832350255,
+ "grad_min_sv": 3.104032040290861e-08,
+ "grad_condition": 7643726.892298067,
+ "lr": 0.0005470541566592572,
+ "time_sec": 32.40861511230469
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.22799833922863005,
+ "train_acc": 0.91886,
+ "test_loss": 0.6951349193096161,
+ "test_acc": 0.8282,
+ "lyapunov": null,
+ "grad_norm": 0.38166215011498245,
+ "grad_max_sv": 0.24571430422365664,
+ "grad_min_sv": 3.0606541878697156e-08,
+ "grad_condition": 8099711.568480073,
+ "lr": 0.0005313952597646569,
+ "time_sec": 32.382601499557495
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.21888560410499572,
+ "train_acc": 0.92208,
+ "test_loss": 0.6775056694984436,
+ "test_acc": 0.8377,
+ "lyapunov": null,
+ "grad_norm": 0.3681781600012364,
+ "grad_max_sv": 0.22858488224446774,
+ "grad_min_sv": 3.0608208811955254e-08,
+ "grad_condition": 7499521.525014189,
+ "lr": 0.0005157053795390643,
+ "time_sec": 32.38293170928955
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.2106206985092163,
+ "train_acc": 0.9252,
+ "test_loss": 0.6563802011966705,
+ "test_acc": 0.8396,
+ "lyapunov": null,
+ "grad_norm": 0.36053809946906845,
+ "grad_max_sv": 0.2215539276599884,
+ "grad_min_sv": 2.9670953960447833e-08,
+ "grad_condition": 7567975.97315415,
+ "lr": 0.0005000000000000002,
+ "time_sec": 32.3891761302948
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.19901366895198822,
+ "train_acc": 0.92832,
+ "test_loss": 0.6814763808727264,
+ "test_acc": 0.837,
+ "lyapunov": null,
+ "grad_norm": 0.3509310663538234,
+ "grad_max_sv": 0.21552756875753404,
+ "grad_min_sv": 3.0066001732720335e-08,
+ "grad_condition": 7264544.488552595,
+ "lr": 0.00048429462046093607,
+ "time_sec": 32.41236758232117
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.19969978581905365,
+ "train_acc": 0.9285,
+ "test_loss": 0.6935202028274536,
+ "test_acc": 0.8339,
+ "lyapunov": null,
+ "grad_norm": 0.3520257382758021,
+ "grad_max_sv": 0.22391790114343166,
+ "grad_min_sv": 3.0129751982244104e-08,
+ "grad_condition": 7509087.830538243,
+ "lr": 0.0004686047402353435,
+ "time_sec": 32.39413237571716
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.19100741683721542,
+ "train_acc": 0.93138,
+ "test_loss": 0.686068691778183,
+ "test_acc": 0.8361,
+ "lyapunov": null,
+ "grad_norm": 0.3426294963785598,
+ "grad_max_sv": 0.22632624246180058,
+ "grad_min_sv": 2.9659243594437613e-08,
+ "grad_condition": 7652635.339128266,
+ "lr": 0.000452945843340743,
+ "time_sec": 32.40613842010498
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.18032077651500703,
+ "train_acc": 0.9362,
+ "test_loss": 0.7067575240373611,
+ "test_acc": 0.8336,
+ "lyapunov": null,
+ "grad_norm": 0.3322012382733825,
+ "grad_max_sv": 0.20586859565228224,
+ "grad_min_sv": 2.850985989510946e-08,
+ "grad_condition": 7314687.938871255,
+ "lr": 0.00043733338321784806,
+ "time_sec": 32.4026734828949
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.17773653375148774,
+ "train_acc": 0.93586,
+ "test_loss": 0.7423279015541077,
+ "test_acc": 0.8264,
+ "lyapunov": null,
+ "grad_norm": 0.3304441924446054,
+ "grad_max_sv": 0.21223607212305068,
+ "grad_min_sv": 2.8433270138350508e-08,
+ "grad_condition": 7539548.749518724,
+ "lr": 0.0004217827674798847,
+ "time_sec": 32.404977560043335
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.17266820957183837,
+ "train_acc": 0.93834,
+ "test_loss": 0.7072871742248535,
+ "test_acc": 0.8362,
+ "lyapunov": null,
+ "grad_norm": 0.3213443005744008,
+ "grad_max_sv": 0.20142054706811904,
+ "grad_min_sv": 2.726542889242012e-08,
+ "grad_condition": 7440941.08660387,
+ "lr": 0.00040630934270713783,
+ "time_sec": 32.39922308921814
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.16320502066612244,
+ "train_acc": 0.9411,
+ "test_loss": 0.7605734568834305,
+ "test_acc": 0.8318,
+ "lyapunov": null,
+ "grad_norm": 0.31657510227372176,
+ "grad_max_sv": 0.20284682027995588,
+ "grad_min_sv": 2.7356661469468692e-08,
+ "grad_condition": 7474082.923928386,
+ "lr": 0.000390928379301729,
+ "time_sec": 32.39910292625427
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.15670019901275634,
+ "train_acc": 0.94476,
+ "test_loss": 0.784366103553772,
+ "test_acc": 0.8311,
+ "lyapunov": null,
+ "grad_norm": 0.30805235096734923,
+ "grad_max_sv": 0.20260103438049554,
+ "grad_min_sv": 2.8483807401613605e-08,
+ "grad_condition": 7164125.0338090565,
+ "lr": 0.0003756550564175727,
+ "time_sec": 32.38076663017273
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.1490273987340927,
+ "train_acc": 0.94576,
+ "test_loss": 0.7455846133232117,
+ "test_acc": 0.8376,
+ "lyapunov": null,
+ "grad_norm": 0.303406267580447,
+ "grad_max_sv": 0.19556450732052327,
+ "grad_min_sv": 2.8112297023596967e-08,
+ "grad_condition": 7040746.144049543,
+ "lr": 0.00036050444698038553,
+ "time_sec": 32.39811587333679
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.14525161782741547,
+ "train_acc": 0.94758,
+ "test_loss": 0.7790617815971375,
+ "test_acc": 0.8344,
+ "lyapunov": null,
+ "grad_norm": 0.30155039989577326,
+ "grad_max_sv": 0.19981648530811072,
+ "grad_min_sv": 2.756223151934023e-08,
+ "grad_condition": 7325326.926472412,
+ "lr": 0.00034549150281252655,
+ "time_sec": 32.389100313186646
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.1412713815355301,
+ "train_acc": 0.94936,
+ "test_loss": 0.7642439495563507,
+ "test_acc": 0.836,
+ "lyapunov": null,
+ "grad_norm": 0.29749874721325253,
+ "grad_max_sv": 0.19452713318169118,
+ "grad_min_sv": 2.9010603075363407e-08,
+ "grad_condition": 6769308.704484415,
+ "lr": 0.0003306310398773544,
+ "time_sec": 32.38328981399536
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.1323081604719162,
+ "train_acc": 0.95234,
+ "test_loss": 0.7581991817474365,
+ "test_acc": 0.8398,
+ "lyapunov": null,
+ "grad_norm": 0.29116698502726973,
+ "grad_max_sv": 0.18757329024374486,
+ "grad_min_sv": 2.7799571622466603e-08,
+ "grad_condition": 6802391.979822846,
+ "lr": 0.00031593772365766127,
+ "time_sec": 32.38175868988037
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.12890920341968537,
+ "train_acc": 0.95402,
+ "test_loss": 0.7480168062210083,
+ "test_acc": 0.8421,
+ "lyapunov": null,
+ "grad_norm": 0.286611612578029,
+ "grad_max_sv": 0.1843133084475994,
+ "grad_min_sv": 2.6867626612414597e-08,
+ "grad_condition": 6929516.973504146,
+ "lr": 0.0003014260546826097,
+ "time_sec": 32.42565321922302
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.1265330140542984,
+ "train_acc": 0.9554,
+ "test_loss": 0.8281557668209076,
+ "test_acc": 0.8301,
+ "lyapunov": null,
+ "grad_norm": 0.2827852267700905,
+ "grad_max_sv": 0.18494715746492146,
+ "grad_min_sv": 2.7603675123444305e-08,
+ "grad_condition": 6836444.701068824,
+ "lr": 0.0002871103542174637,
+ "time_sec": 32.41487503051758
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.1179364563369751,
+ "train_acc": 0.95766,
+ "test_loss": 0.8201508460521698,
+ "test_acc": 0.8301,
+ "lyapunov": null,
+ "grad_norm": 0.27559434018913526,
+ "grad_max_sv": 0.1801072470843792,
+ "grad_min_sv": 2.659138749194767e-08,
+ "grad_condition": 6847688.983849314,
+ "lr": 0.0002730047501302267,
+ "time_sec": 32.39773344993591
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.11676965503931046,
+ "train_acc": 0.9583,
+ "test_loss": 0.8626040154457092,
+ "test_acc": 0.8299,
+ "lyapunov": null,
+ "grad_norm": 0.2739785879338369,
+ "grad_max_sv": 0.181886912509799,
+ "grad_min_sv": 2.726705781164185e-08,
+ "grad_condition": 6765344.039900659,
+ "lr": 0.00025912316294914234,
+ "time_sec": 32.3981568813324
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.1134087336063385,
+ "train_acc": 0.95968,
+ "test_loss": 0.8600147367477416,
+ "test_acc": 0.8307,
+ "lyapunov": null,
+ "grad_norm": 0.27359780558028896,
+ "grad_max_sv": 0.17809443082660437,
+ "grad_min_sv": 2.617720586961525e-08,
+ "grad_condition": 6850097.709154141,
+ "lr": 0.0002454792921248144,
+ "time_sec": 32.39709424972534
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.10615333132266998,
+ "train_acc": 0.96164,
+ "test_loss": 0.7972221804141998,
+ "test_acc": 0.8376,
+ "lyapunov": null,
+ "grad_norm": 0.2659183144921437,
+ "grad_max_sv": 0.18308131918311119,
+ "grad_min_sv": 2.689645892672843e-08,
+ "grad_condition": 6797772.602815667,
+ "lr": 0.00023208660251050164,
+ "time_sec": 32.41845703125
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.10183365075588226,
+ "train_acc": 0.9635,
+ "test_loss": 0.826421448802948,
+ "test_acc": 0.8419,
+ "lyapunov": null,
+ "grad_norm": 0.25781252098700996,
+ "grad_max_sv": 0.16897555273026227,
+ "grad_min_sv": 2.6931133589869206e-08,
+ "grad_condition": 6306456.524677806,
+ "lr": 0.00021895831107393473,
+ "time_sec": 32.397175788879395
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.10107698081731796,
+ "train_acc": 0.96376,
+ "test_loss": 0.8561173896312714,
+ "test_acc": 0.831,
+ "lyapunov": null,
+ "grad_norm": 0.25760306881898437,
+ "grad_max_sv": 0.17646125555038453,
+ "grad_min_sv": 2.669760297280277e-08,
+ "grad_condition": 6679362.317952393,
+ "lr": 0.00020610737385376356,
+ "time_sec": 32.403748512268066
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.09157823500394821,
+ "train_acc": 0.9672,
+ "test_loss": 0.819078180027008,
+ "test_acc": 0.8435,
+ "lyapunov": null,
+ "grad_norm": 0.24819829552233322,
+ "grad_max_sv": 0.1644124612212181,
+ "grad_min_sv": 2.60399903861952e-08,
+ "grad_condition": 6357922.646001594,
+ "lr": 0.00019354647317351177,
+ "time_sec": 32.40361571311951
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.09161295493125915,
+ "train_acc": 0.9674,
+ "test_loss": 0.8579238404273987,
+ "test_acc": 0.8382,
+ "lyapunov": null,
+ "grad_norm": 0.2471838058669454,
+ "grad_max_sv": 0.18323104958981276,
+ "grad_min_sv": 2.6274890752020497e-08,
+ "grad_condition": 7043842.298456557,
+ "lr": 0.0001812880051256552,
+ "time_sec": 32.40220522880554
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.08914089821338654,
+ "train_acc": 0.9689,
+ "test_loss": 0.822793147277832,
+ "test_acc": 0.8428,
+ "lyapunov": null,
+ "grad_norm": 0.24800643716145856,
+ "grad_max_sv": 0.17686894070357084,
+ "grad_min_sv": 2.5135920411756273e-08,
+ "grad_condition": 7047438.025677231,
+ "lr": 0.00016934406733817422,
+ "time_sec": 32.38602375984192
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.08674161068916321,
+ "train_acc": 0.96972,
+ "test_loss": 0.9136243630409241,
+ "test_acc": 0.832,
+ "lyapunov": null,
+ "grad_norm": 0.24475644922641637,
+ "grad_max_sv": 0.1730644192546606,
+ "grad_min_sv": 2.701796373294485e-08,
+ "grad_condition": 6442891.2485314775,
+ "lr": 0.0001577264470356557,
+ "time_sec": 32.388394594192505
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.08695965735673905,
+ "train_acc": 0.96928,
+ "test_loss": 0.8845508131980896,
+ "test_acc": 0.8384,
+ "lyapunov": null,
+ "grad_norm": 0.2459968799202821,
+ "grad_max_sv": 0.17426501363515853,
+ "grad_min_sv": 2.6569961386613273e-08,
+ "grad_condition": 6640201.158479671,
+ "lr": 0.00014644660940672634,
+ "time_sec": 32.41233015060425
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.08056579726457595,
+ "train_acc": 0.97162,
+ "test_loss": 0.8616433102607727,
+ "test_acc": 0.843,
+ "lyapunov": null,
+ "grad_norm": 0.2370989720124241,
+ "grad_max_sv": 0.17729146480560304,
+ "grad_min_sv": 2.568868753272113e-08,
+ "grad_condition": 6934864.636315972,
+ "lr": 0.0001355156862892944,
+ "time_sec": 32.40184926986694
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.0778916252565384,
+ "train_acc": 0.97266,
+ "test_loss": 0.8366258358001709,
+ "test_acc": 0.846,
+ "lyapunov": null,
+ "grad_norm": 0.2285631358810043,
+ "grad_max_sv": 0.15610157009214162,
+ "grad_min_sv": 2.4703725332031468e-08,
+ "grad_condition": 6441768.40822393,
+ "lr": 0.00012494446518477025,
+ "time_sec": 32.39042067527771
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.07181410483896733,
+ "train_acc": 0.97442,
+ "test_loss": 0.8555541298389435,
+ "test_acc": 0.8426,
+ "lyapunov": null,
+ "grad_norm": 0.21751467049933892,
+ "grad_max_sv": 0.15433428399264812,
+ "grad_min_sv": 2.665557081726888e-08,
+ "grad_condition": 5918219.605492928,
+ "lr": 0.00011474337861210548,
+ "time_sec": 32.394978523254395
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.07194108392477036,
+ "train_acc": 0.9751,
+ "test_loss": 0.8495045845985413,
+ "test_acc": 0.8448,
+ "lyapunov": null,
+ "grad_norm": 0.22114745807083974,
+ "grad_max_sv": 0.1569668130017817,
+ "grad_min_sv": 2.5639288958601015e-08,
+ "grad_condition": 6206249.934502038,
+ "lr": 0.00010492249381215483,
+ "time_sec": 32.40589165687561
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.07222781093478203,
+ "train_acc": 0.97412,
+ "test_loss": 0.8713514517307281,
+ "test_acc": 0.8394,
+ "lyapunov": null,
+ "grad_norm": 0.22263796587188234,
+ "grad_max_sv": 0.14711420265957714,
+ "grad_min_sv": 2.5633022726623266e-08,
+ "grad_condition": 5761666.097039051,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 32.37701368331909
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.06728733582258224,
+ "train_acc": 0.97644,
+ "test_loss": 0.8841948908805847,
+ "test_acc": 0.8471,
+ "lyapunov": null,
+ "grad_norm": 0.2167084382178911,
+ "grad_max_sv": 0.150007457844913,
+ "grad_min_sv": 2.4493604877662278e-08,
+ "grad_condition": 6166534.410663934,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 32.398573875427246
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.06532315739750862,
+ "train_acc": 0.97664,
+ "test_loss": 0.8479381636619567,
+ "test_acc": 0.8476,
+ "lyapunov": null,
+ "grad_norm": 0.21360344563146125,
+ "grad_max_sv": 0.14955835351720453,
+ "grad_min_sv": 2.5209754284105657e-08,
+ "grad_condition": 5995150.4945804905,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 32.39670705795288
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.06434115768909454,
+ "train_acc": 0.97796,
+ "test_loss": 0.8688706632614136,
+ "test_acc": 0.8462,
+ "lyapunov": null,
+ "grad_norm": 0.208142142739157,
+ "grad_max_sv": 0.14977061534300445,
+ "grad_min_sv": 2.4894345518333694e-08,
+ "grad_condition": 6089831.719725271,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 32.399760007858276
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.06394571399211883,
+ "train_acc": 0.9776,
+ "test_loss": 0.8629561246871948,
+ "test_acc": 0.8473,
+ "lyapunov": null,
+ "grad_norm": 0.2090274768795119,
+ "grad_max_sv": 0.1535501467064023,
+ "grad_min_sv": 2.6076664383367643e-08,
+ "grad_condition": 5914212.49570628,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 32.38430905342102
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.062020836523771286,
+ "train_acc": 0.97872,
+ "test_loss": 0.875181820678711,
+ "test_acc": 0.8453,
+ "lyapunov": null,
+ "grad_norm": 0.2063308108071089,
+ "grad_max_sv": 0.14753851415589453,
+ "grad_min_sv": 2.432188375145472e-08,
+ "grad_condition": 6144261.18306755,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 32.41748404502869
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.06044566638708115,
+ "train_acc": 0.9789,
+ "test_loss": 0.872238347530365,
+ "test_acc": 0.8476,
+ "lyapunov": null,
+ "grad_norm": 0.20133211072179052,
+ "grad_max_sv": 0.148629211448133,
+ "grad_min_sv": 2.4942497534041762e-08,
+ "grad_condition": 6060679.3216307415,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 32.391072273254395
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.061503240056037904,
+ "train_acc": 0.97832,
+ "test_loss": 0.8733239276885987,
+ "test_acc": 0.8431,
+ "lyapunov": null,
+ "grad_norm": 0.2056722075536268,
+ "grad_max_sv": 0.14386752797290683,
+ "grad_min_sv": 2.4274280185920816e-08,
+ "grad_condition": 5915342.2569472315,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 32.393316984176636
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.057686230409145355,
+ "train_acc": 0.98028,
+ "test_loss": 0.9238866704940796,
+ "test_acc": 0.8441,
+ "lyapunov": null,
+ "grad_norm": 0.19849445098013146,
+ "grad_max_sv": 0.14159611044451595,
+ "grad_min_sv": 2.40493778669304e-08,
+ "grad_condition": 5894624.093493214,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 32.38528490066528
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.05870611476659775,
+ "train_acc": 0.9798,
+ "test_loss": 0.8742481526374817,
+ "test_acc": 0.8481,
+ "lyapunov": null,
+ "grad_norm": 0.20012200731407057,
+ "grad_max_sv": 0.15360670480877162,
+ "grad_min_sv": 2.5219260857411995e-08,
+ "grad_condition": 6191506.157967448,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 32.393001079559326
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.05783582457482815,
+ "train_acc": 0.9801,
+ "test_loss": 0.8813467388153076,
+ "test_acc": 0.8475,
+ "lyapunov": null,
+ "grad_norm": 0.19996222144489287,
+ "grad_max_sv": 0.1403856192715466,
+ "grad_min_sv": 2.448204212690541e-08,
+ "grad_condition": 5742298.053374326,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 32.38493609428406
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.05505133232176304,
+ "train_acc": 0.9811,
+ "test_loss": 0.8983916495323181,
+ "test_acc": 0.8462,
+ "lyapunov": null,
+ "grad_norm": 0.1922888220223182,
+ "grad_max_sv": 0.13430234417319298,
+ "grad_min_sv": 2.4953015476114616e-08,
+ "grad_condition": 5451203.641164561,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 32.399288177490234
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.05489971268892288,
+ "train_acc": 0.98124,
+ "test_loss": 0.8997103338241577,
+ "test_acc": 0.843,
+ "lyapunov": null,
+ "grad_norm": 0.1914882132186981,
+ "grad_max_sv": 0.13863548981025814,
+ "grad_min_sv": 2.579038138605938e-08,
+ "grad_condition": 5398596.905280545,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 32.40613651275635
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.05393671277284622,
+ "train_acc": 0.9816,
+ "test_loss": 0.8570820412635803,
+ "test_acc": 0.847,
+ "lyapunov": null,
+ "grad_norm": 0.19247907609747256,
+ "grad_max_sv": 0.14507245384156703,
+ "grad_min_sv": 2.4785522878545406e-08,
+ "grad_condition": 5879853.769356969,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 32.38154458999634
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.05565428542852402,
+ "train_acc": 0.98092,
+ "test_loss": 0.8699159992218017,
+ "test_acc": 0.8494,
+ "lyapunov": null,
+ "grad_norm": 0.1950428660443827,
+ "grad_max_sv": 0.15786617370322348,
+ "grad_min_sv": 2.5128920544403855e-08,
+ "grad_condition": 6342900.039114647,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 32.408872842788696
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.0554716275537014,
+ "train_acc": 0.98074,
+ "test_loss": 0.8724354814529419,
+ "test_acc": 0.848,
+ "lyapunov": null,
+ "grad_norm": 0.1953551453056335,
+ "grad_max_sv": 0.14595830552279948,
+ "grad_min_sv": 2.4523609010174142e-08,
+ "grad_condition": 6097998.471070435,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 32.37954640388489
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.055670329051017764,
+ "train_acc": 0.98156,
+ "test_loss": 0.8982214247703553,
+ "test_acc": 0.8452,
+ "lyapunov": null,
+ "grad_norm": 0.19496196662820392,
+ "grad_max_sv": 0.1501585453748703,
+ "grad_min_sv": 2.5934764646962095e-08,
+ "grad_condition": 5869735.378663734,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 32.4021053314209
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.05344248455762863,
+ "train_acc": 0.9813,
+ "test_loss": 0.9114454601287841,
+ "test_acc": 0.8468,
+ "lyapunov": null,
+ "grad_norm": 0.19018664442063118,
+ "grad_max_sv": 0.14032225906848908,
+ "grad_min_sv": 2.502056415387699e-08,
+ "grad_condition": 5745975.090099884,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 32.38188123703003
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.053135186285972594,
+ "train_acc": 0.9819,
+ "test_loss": 0.869631242275238,
+ "test_acc": 0.8508,
+ "lyapunov": null,
+ "grad_norm": 0.18824134211058935,
+ "grad_max_sv": 0.13075507152825594,
+ "grad_min_sv": 2.4252965857840536e-08,
+ "grad_condition": 5397614.905736231,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 32.386441230773926
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.05097491117954254,
+ "train_acc": 0.983,
+ "test_loss": 0.8943203839302063,
+ "test_acc": 0.8483,
+ "lyapunov": null,
+ "grad_norm": 0.18445756568932634,
+ "grad_max_sv": 0.13804081929847598,
+ "grad_min_sv": 2.4356519201518267e-08,
+ "grad_condition": 5702871.134726013,
+ "lr": 2.467198171342e-07,
+ "time_sec": 32.405375480651855
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.05390245022058487,
+ "train_acc": 0.9809,
+ "test_loss": 0.871891166973114,
+ "test_acc": 0.8498,
+ "lyapunov": null,
+ "grad_norm": 0.1935152752615153,
+ "grad_max_sv": 0.14720266554504632,
+ "grad_min_sv": 2.436729609200938e-08,
+ "grad_condition": 6104513.732861901,
+ "lr": 0.0,
+ "time_sec": 32.40170097351074
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 2.4167917232513427,
+ "train_acc": 0.21668,
+ "test_loss": 2.5600556365966796,
+ "test_acc": 0.1426,
+ "lyapunov": null,
+ "grad_norm": 8.183371300480916,
+ "grad_max_sv": 7.386911773681641,
+ "grad_min_sv": 2.415331181282454e-07,
+ "grad_condition": 30373000.643941343,
+ "lr": 0.0009997532801828658,
+ "time_sec": 49.45663261413574
+ },
+ {
+ "epoch": 2,
+ "train_loss": 1.9079357604217528,
+ "train_acc": 0.31534,
+ "test_loss": 2.481009757232666,
+ "test_acc": 0.1736,
+ "lyapunov": null,
+ "grad_norm": 6.225007320887903,
+ "grad_max_sv": 6.023341983556747,
+ "grad_min_sv": 2.0562342122332212e-07,
+ "grad_condition": 29136429.527644336,
+ "lr": 0.0009990133642141358,
+ "time_sec": 49.483285427093506
+ },
+ {
+ "epoch": 3,
+ "train_loss": 1.7475298168945312,
+ "train_acc": 0.36588,
+ "test_loss": 2.8285199867248534,
+ "test_acc": 0.131,
+ "lyapunov": null,
+ "grad_norm": 5.1420950067433004,
+ "grad_max_sv": 4.660892617702484,
+ "grad_min_sv": 1.8032060928874215e-07,
+ "grad_condition": 26358047.987367053,
+ "lr": 0.00099778098230154,
+ "time_sec": 49.57265663146973
+ },
+ {
+ "epoch": 4,
+ "train_loss": 1.648739521408081,
+ "train_acc": 0.40166,
+ "test_loss": 2.3356450172424315,
+ "test_acc": 0.1751,
+ "lyapunov": null,
+ "grad_norm": 4.371713821921025,
+ "grad_max_sv": 3.9185040295124054,
+ "grad_min_sv": 1.6463919898512814e-07,
+ "grad_condition": 23923294.770848013,
+ "lr": 0.000996057350657239,
+ "time_sec": 49.45625138282776
+ },
+ {
+ "epoch": 5,
+ "train_loss": 1.5810089331436157,
+ "train_acc": 0.4251,
+ "test_loss": 2.673109909439087,
+ "test_acc": 0.1544,
+ "lyapunov": null,
+ "grad_norm": 3.4555186506953595,
+ "grad_max_sv": 2.900471958518028,
+ "grad_min_sv": 1.4436529607309013e-07,
+ "grad_condition": 20173199.710391533,
+ "lr": 0.0009938441702975688,
+ "time_sec": 49.46467709541321
+ },
+ {
+ "epoch": 6,
+ "train_loss": 1.5207538050079346,
+ "train_acc": 0.44858,
+ "test_loss": 2.5345509658813477,
+ "test_acc": 0.1699,
+ "lyapunov": null,
+ "grad_norm": 2.64949967993879,
+ "grad_max_sv": 2.2037453174591066,
+ "grad_min_sv": 1.0903019624919352e-07,
+ "grad_condition": 20443245.381738927,
+ "lr": 0.0009911436253643444,
+ "time_sec": 49.46764326095581
+ },
+ {
+ "epoch": 7,
+ "train_loss": 1.4697360105133057,
+ "train_acc": 0.46474,
+ "test_loss": 2.8721789810180662,
+ "test_acc": 0.1272,
+ "lyapunov": null,
+ "grad_norm": 2.07791741270765,
+ "grad_max_sv": 1.6007355004549026,
+ "grad_min_sv": 8.760053766820875e-08,
+ "grad_condition": 18373378.661422264,
+ "lr": 0.0009879583809693736,
+ "time_sec": 49.47743082046509
+ },
+ {
+ "epoch": 8,
+ "train_loss": 1.4266535543823242,
+ "train_acc": 0.48382,
+ "test_loss": 3.240042792892456,
+ "test_acc": 0.1388,
+ "lyapunov": null,
+ "grad_norm": 1.6671990756280735,
+ "grad_max_sv": 1.2928156778216362,
+ "grad_min_sv": 7.22438866951336e-08,
+ "grad_condition": 18264606.350417227,
+ "lr": 0.0009842915805643154,
+ "time_sec": 49.462923526763916
+ },
+ {
+ "epoch": 9,
+ "train_loss": 1.394312504272461,
+ "train_acc": 0.49708,
+ "test_loss": 2.92084864654541,
+ "test_acc": 0.1515,
+ "lyapunov": null,
+ "grad_norm": 1.4501900520177538,
+ "grad_max_sv": 1.0461901366710662,
+ "grad_min_sv": 6.580800739897086e-08,
+ "grad_condition": 16086880.216684576,
+ "lr": 0.0009801468428384714,
+ "time_sec": 49.47783327102661
+ },
+ {
+ "epoch": 10,
+ "train_loss": 1.3646438373184204,
+ "train_acc": 0.50782,
+ "test_loss": 2.4641769153594972,
+ "test_acc": 0.2432,
+ "lyapunov": null,
+ "grad_norm": 1.291271889799819,
+ "grad_max_sv": 0.9352933883666992,
+ "grad_min_sv": 6.025941292620019e-08,
+ "grad_condition": 15737334.845315147,
+ "lr": 0.0009755282581475767,
+ "time_sec": 49.47376465797424
+ },
+ {
+ "epoch": 11,
+ "train_loss": 1.3376501561355592,
+ "train_acc": 0.51558,
+ "test_loss": 2.9219178497314453,
+ "test_acc": 0.2438,
+ "lyapunov": null,
+ "grad_norm": 1.1555098680383777,
+ "grad_max_sv": 0.7429820895195007,
+ "grad_min_sv": 5.2901568192709195e-08,
+ "grad_condition": 14266011.744750757,
+ "lr": 0.0009704403844771127,
+ "time_sec": 49.47013974189758
+ },
+ {
+ "epoch": 12,
+ "train_loss": 1.3112868671417237,
+ "train_acc": 0.5284,
+ "test_loss": 2.74031083946228,
+ "test_acc": 0.2031,
+ "lyapunov": null,
+ "grad_norm": 1.0738955371821308,
+ "grad_max_sv": 0.748549421876669,
+ "grad_min_sv": 4.978303538294426e-08,
+ "grad_condition": 15210211.076616298,
+ "lr": 0.0009648882429441257,
+ "time_sec": 49.46808075904846
+ },
+ {
+ "epoch": 13,
+ "train_loss": 1.287481568031311,
+ "train_acc": 0.53728,
+ "test_loss": 3.040859108734131,
+ "test_acc": 0.1924,
+ "lyapunov": null,
+ "grad_norm": 0.9771624206683323,
+ "grad_max_sv": 0.64529999345541,
+ "grad_min_sv": 4.393245678357971e-08,
+ "grad_condition": 14761475.748675447,
+ "lr": 0.0009588773128419905,
+ "time_sec": 49.47308921813965
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.2648405401992797,
+ "train_acc": 0.54502,
+ "test_loss": 2.792311123275757,
+ "test_acc": 0.1915,
+ "lyapunov": null,
+ "grad_norm": 0.9467244901324925,
+ "grad_max_sv": 0.6184789575636387,
+ "grad_min_sv": 4.4816473465658643e-08,
+ "grad_condition": 14165375.345471447,
+ "lr": 0.0009524135262330098,
+ "time_sec": 49.483009815216064
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.241471286087036,
+ "train_acc": 0.55048,
+ "test_loss": 2.3441864311218263,
+ "test_acc": 0.2456,
+ "lyapunov": null,
+ "grad_norm": 0.8759338877958681,
+ "grad_max_sv": 0.5726857863366603,
+ "grad_min_sv": 3.894658555658736e-08,
+ "grad_condition": 14972228.263231587,
+ "lr": 0.0009455032620941839,
+ "time_sec": 49.48427653312683
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.2250818849945069,
+ "train_acc": 0.55916,
+ "test_loss": 2.4376744468688964,
+ "test_acc": 0.2811,
+ "lyapunov": null,
+ "grad_norm": 0.8280125995789305,
+ "grad_max_sv": 0.5269983820617199,
+ "grad_min_sv": 3.957679450827811e-08,
+ "grad_condition": 13458638.5630938,
+ "lr": 0.0009381533400219318,
+ "time_sec": 49.491514921188354
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.2011407931518554,
+ "train_acc": 0.5681,
+ "test_loss": 3.077988208389282,
+ "test_acc": 0.2372,
+ "lyapunov": null,
+ "grad_norm": 0.7903623783049802,
+ "grad_max_sv": 0.5003585621714592,
+ "grad_min_sv": 3.7936934749183135e-08,
+ "grad_condition": 13344237.683557762,
+ "lr": 0.0009303710135019719,
+ "time_sec": 49.4895544052124
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.1899376231193541,
+ "train_acc": 0.57472,
+ "test_loss": 2.3918450389862063,
+ "test_acc": 0.2518,
+ "lyapunov": null,
+ "grad_norm": 0.7718039520215193,
+ "grad_max_sv": 0.47414265275001527,
+ "grad_min_sv": 3.554989529419572e-08,
+ "grad_condition": 13438942.364842063,
+ "lr": 0.0009221639627510076,
+ "time_sec": 49.456658124923706
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.168603648300171,
+ "train_acc": 0.57972,
+ "test_loss": 2.283582151031494,
+ "test_acc": 0.2237,
+ "lyapunov": null,
+ "grad_norm": 0.7146309518059523,
+ "grad_max_sv": 0.4340610824525356,
+ "grad_min_sv": 3.228430212054434e-08,
+ "grad_condition": 13543039.003440287,
+ "lr": 0.000913540287137281,
+ "time_sec": 49.45988321304321
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.151336190109253,
+ "train_acc": 0.58574,
+ "test_loss": 2.2708426193237305,
+ "test_acc": 0.2755,
+ "lyapunov": null,
+ "grad_norm": 0.6983120785552407,
+ "grad_max_sv": 0.4454373300075531,
+ "grad_min_sv": 3.350230577403579e-08,
+ "grad_condition": 13641891.236675229,
+ "lr": 0.0009045084971874739,
+ "time_sec": 49.4855215549469
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.1312933298873902,
+ "train_acc": 0.5941,
+ "test_loss": 2.002239217376709,
+ "test_acc": 0.3398,
+ "lyapunov": null,
+ "grad_norm": 0.6668029786621408,
+ "grad_max_sv": 0.4022377036511898,
+ "grad_min_sv": 3.0301077691419207e-08,
+ "grad_condition": 13290330.075167935,
+ "lr": 0.0008950775061878452,
+ "time_sec": 49.5133171081543
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.1186233515167237,
+ "train_acc": 0.59978,
+ "test_loss": 3.6749740661621093,
+ "test_acc": 0.2938,
+ "lyapunov": null,
+ "grad_norm": 0.6355160393463501,
+ "grad_max_sv": 0.3662328697741032,
+ "grad_min_sv": 2.919807395862506e-08,
+ "grad_condition": 12676455.229119861,
+ "lr": 0.0008852566213878947,
+ "time_sec": 49.47933578491211
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.0992162245941162,
+ "train_acc": 0.60538,
+ "test_loss": 2.2956289947509765,
+ "test_acc": 0.3419,
+ "lyapunov": null,
+ "grad_norm": 0.6289434264719856,
+ "grad_max_sv": 0.3852032497525215,
+ "grad_min_sv": 2.838916279834791e-08,
+ "grad_condition": 13726993.354284357,
+ "lr": 0.0008750555348152298,
+ "time_sec": 49.46930289268494
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.09261875541687,
+ "train_acc": 0.6078,
+ "test_loss": 2.194385333251953,
+ "test_acc": 0.3862,
+ "lyapunov": null,
+ "grad_norm": 0.6127565268862699,
+ "grad_max_sv": 0.3749225478619337,
+ "grad_min_sv": 2.902605293897409e-08,
+ "grad_condition": 12941629.392305708,
+ "lr": 0.0008644843137107057,
+ "time_sec": 49.45948123931885
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.0722477124023437,
+ "train_acc": 0.61656,
+ "test_loss": 2.4663957664489744,
+ "test_acc": 0.3925,
+ "lyapunov": null,
+ "grad_norm": 0.5897825535844798,
+ "grad_max_sv": 0.371936571970582,
+ "grad_min_sv": 2.8421365216857452e-08,
+ "grad_condition": 13252758.329758141,
+ "lr": 0.0008535533905932737,
+ "time_sec": 49.479785442352295
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.0658014038848878,
+ "train_acc": 0.62154,
+ "test_loss": 2.2172969047546385,
+ "test_acc": 0.3602,
+ "lyapunov": null,
+ "grad_norm": 0.5970948959400837,
+ "grad_max_sv": 0.3504005130380392,
+ "grad_min_sv": 2.822866052021311e-08,
+ "grad_condition": 12516728.270259932,
+ "lr": 0.0008422735529643444,
+ "time_sec": 49.46492099761963
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.04928136428833,
+ "train_acc": 0.62394,
+ "test_loss": 2.3098046798706053,
+ "test_acc": 0.3753,
+ "lyapunov": null,
+ "grad_norm": 0.5799982623396496,
+ "grad_max_sv": 0.3511035542935133,
+ "grad_min_sv": 2.871881275012811e-08,
+ "grad_condition": 12420577.990074852,
+ "lr": 0.0008306559326618259,
+ "time_sec": 49.463754177093506
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.033934779319763,
+ "train_acc": 0.6312,
+ "test_loss": 2.5853637130737304,
+ "test_acc": 0.3827,
+ "lyapunov": null,
+ "grad_norm": 0.5626766992798455,
+ "grad_max_sv": 0.3680811390280724,
+ "grad_min_sv": 2.860611223454157e-08,
+ "grad_condition": 13030738.458713688,
+ "lr": 0.0008187119948743449,
+ "time_sec": 49.46650528907776
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.0245469808578491,
+ "train_acc": 0.63318,
+ "test_loss": 2.421029793548584,
+ "test_acc": 0.3777,
+ "lyapunov": null,
+ "grad_norm": 0.540434209171599,
+ "grad_max_sv": 0.33249553516507147,
+ "grad_min_sv": 2.5725369168227985e-08,
+ "grad_condition": 13074923.559065297,
+ "lr": 0.0008064535268264883,
+ "time_sec": 49.46920871734619
+ },
+ {
+ "epoch": 30,
+ "train_loss": 1.0157002903938293,
+ "train_acc": 0.63876,
+ "test_loss": 2.5748968841552733,
+ "test_acc": 0.353,
+ "lyapunov": null,
+ "grad_norm": 0.5335667641481916,
+ "grad_max_sv": 0.31497838646173476,
+ "grad_min_sv": 2.4617009453109516e-08,
+ "grad_condition": 12878002.467485525,
+ "lr": 0.0007938926261462367,
+ "time_sec": 49.47658443450928
+ },
+ {
+ "epoch": 31,
+ "train_loss": 1.0092763556671143,
+ "train_acc": 0.64072,
+ "test_loss": 2.575096744155884,
+ "test_acc": 0.3689,
+ "lyapunov": null,
+ "grad_norm": 0.5319602288309537,
+ "grad_max_sv": 0.33714523129165175,
+ "grad_min_sv": 2.6278444886784767e-08,
+ "grad_condition": 12997099.648816537,
+ "lr": 0.0007810416889260654,
+ "time_sec": 49.48014044761658
+ },
+ {
+ "epoch": 32,
+ "train_loss": 0.9945861617660523,
+ "train_acc": 0.64606,
+ "test_loss": 2.18585274848938,
+ "test_acc": 0.3591,
+ "lyapunov": null,
+ "grad_norm": 0.5207883539385971,
+ "grad_max_sv": 0.30190461575984956,
+ "grad_min_sv": 2.498473832268644e-08,
+ "grad_condition": 12302495.137337226,
+ "lr": 0.0007679133974894983,
+ "time_sec": 49.48141527175903
+ },
+ {
+ "epoch": 33,
+ "train_loss": 0.9839789762878418,
+ "train_acc": 0.65072,
+ "test_loss": 2.067453681182861,
+ "test_acc": 0.4015,
+ "lyapunov": null,
+ "grad_norm": 0.5202120303096632,
+ "grad_max_sv": 0.3107115812599659,
+ "grad_min_sv": 2.559975968985384e-08,
+ "grad_condition": 12183076.283694824,
+ "lr": 0.0007545207078751857,
+ "time_sec": 49.50013208389282
+ },
+ {
+ "epoch": 34,
+ "train_loss": 0.9741807369995117,
+ "train_acc": 0.6534,
+ "test_loss": 2.3987243717193603,
+ "test_acc": 0.3907,
+ "lyapunov": null,
+ "grad_norm": 0.5156705695841731,
+ "grad_max_sv": 0.3042212676256895,
+ "grad_min_sv": 2.4721938141070156e-08,
+ "grad_condition": 12439098.422273466,
+ "lr": 0.0007408768370508577,
+ "time_sec": 49.4883246421814
+ },
+ {
+ "epoch": 35,
+ "train_loss": 0.960876017742157,
+ "train_acc": 0.6604,
+ "test_loss": 2.952223745727539,
+ "test_acc": 0.3772,
+ "lyapunov": null,
+ "grad_norm": 0.49534065997567395,
+ "grad_max_sv": 0.3189103938639164,
+ "grad_min_sv": 2.6160001853625657e-08,
+ "grad_condition": 12245579.759729771,
+ "lr": 0.0007269952498697734,
+ "time_sec": 49.49185800552368
+ },
+ {
+ "epoch": 36,
+ "train_loss": 0.9563328867340087,
+ "train_acc": 0.66094,
+ "test_loss": 2.5444390853881838,
+ "test_acc": 0.3748,
+ "lyapunov": null,
+ "grad_norm": 0.5015211388674911,
+ "grad_max_sv": 0.301097634062171,
+ "grad_min_sv": 2.4840815004978368e-08,
+ "grad_condition": 12193384.34751702,
+ "lr": 0.0007128896457825364,
+ "time_sec": 49.473448038101196
+ },
+ {
+ "epoch": 37,
+ "train_loss": 0.9456947842597961,
+ "train_acc": 0.66318,
+ "test_loss": 2.8305119338989257,
+ "test_acc": 0.3608,
+ "lyapunov": null,
+ "grad_norm": 0.5027801927119517,
+ "grad_max_sv": 0.3191258400678635,
+ "grad_min_sv": 2.5498967737291876e-08,
+ "grad_condition": 12721385.179239903,
+ "lr": 0.0006985739453173903,
+ "time_sec": 49.47532916069031
+ },
+ {
+ "epoch": 38,
+ "train_loss": 0.9344060453033447,
+ "train_acc": 0.66828,
+ "test_loss": 2.3942235221862793,
+ "test_acc": 0.3846,
+ "lyapunov": null,
+ "grad_norm": 0.4893981754322751,
+ "grad_max_sv": 0.27843328677117823,
+ "grad_min_sv": 2.3813316207821345e-08,
+ "grad_condition": 11809731.27063098,
+ "lr": 0.0006840622763423391,
+ "time_sec": 49.466092109680176
+ },
+ {
+ "epoch": 39,
+ "train_loss": 0.9299031619262695,
+ "train_acc": 0.6701,
+ "test_loss": 2.5896951622009277,
+ "test_acc": 0.3377,
+ "lyapunov": null,
+ "grad_norm": 0.4877056898105668,
+ "grad_max_sv": 0.2895252756774426,
+ "grad_min_sv": 2.313919011953658e-08,
+ "grad_condition": 12624897.370656734,
+ "lr": 0.0006693689601226458,
+ "time_sec": 49.47689652442932
+ },
+ {
+ "epoch": 40,
+ "train_loss": 0.9202397887802124,
+ "train_acc": 0.67222,
+ "test_loss": 2.3479004539489745,
+ "test_acc": 0.3652,
+ "lyapunov": null,
+ "grad_norm": 0.48378803227864736,
+ "grad_max_sv": 0.2827453903853893,
+ "grad_min_sv": 2.3820017647224744e-08,
+ "grad_condition": 11971929.846932925,
+ "lr": 0.0006545084971874737,
+ "time_sec": 49.48384690284729
+ },
+ {
+ "epoch": 41,
+ "train_loss": 0.9035198735237122,
+ "train_acc": 0.67674,
+ "test_loss": 2.4544072883605956,
+ "test_acc": 0.4098,
+ "lyapunov": null,
+ "grad_norm": 0.48414477684461676,
+ "grad_max_sv": 0.2927399341017008,
+ "grad_min_sv": 2.5373001699691144e-08,
+ "grad_condition": 11722800.874950778,
+ "lr": 0.0006394955530196147,
+ "time_sec": 49.49253749847412
+ },
+ {
+ "epoch": 42,
+ "train_loss": 0.8996260007095337,
+ "train_acc": 0.67922,
+ "test_loss": 2.7968482540130615,
+ "test_acc": 0.3717,
+ "lyapunov": null,
+ "grad_norm": 0.47529519443329865,
+ "grad_max_sv": 0.2862662900239229,
+ "grad_min_sv": 2.4432264433826845e-08,
+ "grad_condition": 11830651.602965241,
+ "lr": 0.0006243449435824273,
+ "time_sec": 49.472256898880005
+ },
+ {
+ "epoch": 43,
+ "train_loss": 0.8935702981376648,
+ "train_acc": 0.68226,
+ "test_loss": 2.7968372314453127,
+ "test_acc": 0.3814,
+ "lyapunov": null,
+ "grad_norm": 0.47246322948696845,
+ "grad_max_sv": 0.2997207723557949,
+ "grad_min_sv": 2.4396437803275717e-08,
+ "grad_condition": 12442839.021676019,
+ "lr": 0.0006090716206982714,
+ "time_sec": 49.47343039512634
+ },
+ {
+ "epoch": 44,
+ "train_loss": 0.8839340761566162,
+ "train_acc": 0.68406,
+ "test_loss": 2.1332605548858643,
+ "test_acc": 0.4518,
+ "lyapunov": null,
+ "grad_norm": 0.4773353798688752,
+ "grad_max_sv": 0.287653349712491,
+ "grad_min_sv": 2.485683419095608e-08,
+ "grad_condition": 11744954.507169517,
+ "lr": 0.0005936906572928625,
+ "time_sec": 49.483134508132935
+ },
+ {
+ "epoch": 45,
+ "train_loss": 0.8809750416755676,
+ "train_acc": 0.6871,
+ "test_loss": 2.3744767669677733,
+ "test_acc": 0.4104,
+ "lyapunov": null,
+ "grad_norm": 0.47171575077424854,
+ "grad_max_sv": 0.2800353281199932,
+ "grad_min_sv": 2.4150169553038835e-08,
+ "grad_condition": 11697732.41688976,
+ "lr": 0.0005782172325201156,
+ "time_sec": 49.47827482223511
+ },
+ {
+ "epoch": 46,
+ "train_loss": 0.8651049407958984,
+ "train_acc": 0.69358,
+ "test_loss": 2.6672937103271486,
+ "test_acc": 0.4106,
+ "lyapunov": null,
+ "grad_norm": 0.46225804490680006,
+ "grad_max_sv": 0.2764727082103491,
+ "grad_min_sv": 2.4165243095453092e-08,
+ "grad_condition": 11539194.901861329,
+ "lr": 0.0005626666167821523,
+ "time_sec": 49.482288122177124
+ },
+ {
+ "epoch": 47,
+ "train_loss": 0.855909815826416,
+ "train_acc": 0.6953,
+ "test_loss": 2.1082290111541746,
+ "test_acc": 0.4302,
+ "lyapunov": null,
+ "grad_norm": 0.46665587567927413,
+ "grad_max_sv": 0.2777487523853779,
+ "grad_min_sv": 2.3157732442768975e-08,
+ "grad_condition": 12021773.98709596,
+ "lr": 0.0005470541566592572,
+ "time_sec": 49.48243308067322
+ },
+ {
+ "epoch": 48,
+ "train_loss": 0.8559737893295288,
+ "train_acc": 0.69554,
+ "test_loss": 2.6735187637329103,
+ "test_acc": 0.3758,
+ "lyapunov": null,
+ "grad_norm": 0.4613852081362787,
+ "grad_max_sv": 0.2753657314926386,
+ "grad_min_sv": 2.358262860546745e-08,
+ "grad_condition": 11826265.97781797,
+ "lr": 0.0005313952597646569,
+ "time_sec": 49.471890687942505
+ },
+ {
+ "epoch": 49,
+ "train_loss": 0.8440363460159301,
+ "train_acc": 0.69974,
+ "test_loss": 2.318854873275757,
+ "test_acc": 0.4239,
+ "lyapunov": null,
+ "grad_norm": 0.46468634824792515,
+ "grad_max_sv": 0.2798832211643457,
+ "grad_min_sv": 2.5059412145367333e-08,
+ "grad_condition": 11328180.182026755,
+ "lr": 0.0005157053795390643,
+ "time_sec": 49.46786379814148
+ },
+ {
+ "epoch": 50,
+ "train_loss": 0.8407046744155884,
+ "train_acc": 0.69938,
+ "test_loss": 2.2581016651153565,
+ "test_acc": 0.4586,
+ "lyapunov": null,
+ "grad_norm": 0.4552999687027473,
+ "grad_max_sv": 0.27262482419610023,
+ "grad_min_sv": 2.3505009449920066e-08,
+ "grad_condition": 11655869.156098623,
+ "lr": 0.0005000000000000002,
+ "time_sec": 49.46631741523743
+ },
+ {
+ "epoch": 51,
+ "train_loss": 0.8328268578910828,
+ "train_acc": 0.70616,
+ "test_loss": 2.021052066421509,
+ "test_acc": 0.4663,
+ "lyapunov": null,
+ "grad_norm": 0.45398371093616957,
+ "grad_max_sv": 0.2551860522478819,
+ "grad_min_sv": 2.261276339510232e-08,
+ "grad_condition": 11423398.903523896,
+ "lr": 0.00048429462046093607,
+ "time_sec": 49.49492907524109
+ },
+ {
+ "epoch": 52,
+ "train_loss": 0.8242957615280151,
+ "train_acc": 0.70608,
+ "test_loss": 2.4299042922973633,
+ "test_acc": 0.4339,
+ "lyapunov": null,
+ "grad_norm": 0.4518491350882313,
+ "grad_max_sv": 0.2677639227360487,
+ "grad_min_sv": 2.340493003849531e-08,
+ "grad_condition": 11498272.982724927,
+ "lr": 0.0004686047402353435,
+ "time_sec": 49.47549295425415
+ },
+ {
+ "epoch": 53,
+ "train_loss": 0.8202688133239746,
+ "train_acc": 0.70788,
+ "test_loss": 2.0557694828033446,
+ "test_acc": 0.4729,
+ "lyapunov": null,
+ "grad_norm": 0.45155452834894444,
+ "grad_max_sv": 0.2765634849667549,
+ "grad_min_sv": 2.294847063488703e-08,
+ "grad_condition": 12152279.677541133,
+ "lr": 0.000452945843340743,
+ "time_sec": 49.47136735916138
+ },
+ {
+ "epoch": 54,
+ "train_loss": 0.8075869009590149,
+ "train_acc": 0.71144,
+ "test_loss": 2.2601095848083497,
+ "test_acc": 0.469,
+ "lyapunov": null,
+ "grad_norm": 0.44703257607115265,
+ "grad_max_sv": 0.28669003024697304,
+ "grad_min_sv": 2.3961542838790707e-08,
+ "grad_condition": 11972426.895574057,
+ "lr": 0.00043733338321784806,
+ "time_sec": 49.472840785980225
+ },
+ {
+ "epoch": 55,
+ "train_loss": 0.8038845987319946,
+ "train_acc": 0.71234,
+ "test_loss": 1.9625594703674316,
+ "test_acc": 0.4966,
+ "lyapunov": null,
+ "grad_norm": 0.45158056349279113,
+ "grad_max_sv": 0.2616859499365091,
+ "grad_min_sv": 2.319859899735377e-08,
+ "grad_condition": 11323136.132990547,
+ "lr": 0.0004217827674798847,
+ "time_sec": 49.475728034973145
+ },
+ {
+ "epoch": 56,
+ "train_loss": 0.7961191424942017,
+ "train_acc": 0.71566,
+ "test_loss": 2.24710135345459,
+ "test_acc": 0.4678,
+ "lyapunov": null,
+ "grad_norm": 0.45114634744336685,
+ "grad_max_sv": 0.27140378654003144,
+ "grad_min_sv": 2.345107636969601e-08,
+ "grad_condition": 11702309.047382332,
+ "lr": 0.00040630934270713783,
+ "time_sec": 49.46745586395264
+ },
+ {
+ "epoch": 57,
+ "train_loss": 0.7886269653129577,
+ "train_acc": 0.71928,
+ "test_loss": 2.332701706314087,
+ "test_acc": 0.4392,
+ "lyapunov": null,
+ "grad_norm": 0.44691251964783024,
+ "grad_max_sv": 0.2512993272393942,
+ "grad_min_sv": 2.3577591501400263e-08,
+ "grad_condition": 10797942.504272973,
+ "lr": 0.000390928379301729,
+ "time_sec": 49.487914085388184
+ },
+ {
+ "epoch": 58,
+ "train_loss": 0.7809809253120422,
+ "train_acc": 0.72054,
+ "test_loss": 2.163261636352539,
+ "test_acc": 0.4825,
+ "lyapunov": null,
+ "grad_norm": 0.44707505885973187,
+ "grad_max_sv": 0.27487311884760857,
+ "grad_min_sv": 2.305816853009901e-08,
+ "grad_condition": 11921937.091947556,
+ "lr": 0.0003756550564175727,
+ "time_sec": 49.477548360824585
+ },
+ {
+ "epoch": 59,
+ "train_loss": 0.7728579918098449,
+ "train_acc": 0.72464,
+ "test_loss": 2.4211140827178954,
+ "test_acc": 0.4792,
+ "lyapunov": null,
+ "grad_norm": 0.442207932790873,
+ "grad_max_sv": 0.2551064256578684,
+ "grad_min_sv": 2.3925818348757842e-08,
+ "grad_condition": 10733599.660670992,
+ "lr": 0.00036050444698038553,
+ "time_sec": 49.47178077697754
+ },
+ {
+ "epoch": 60,
+ "train_loss": 0.7646781494522095,
+ "train_acc": 0.72672,
+ "test_loss": 2.02176361579895,
+ "test_acc": 0.4897,
+ "lyapunov": null,
+ "grad_norm": 0.4430698668925349,
+ "grad_max_sv": 0.26053123250603677,
+ "grad_min_sv": 2.3670396620545377e-08,
+ "grad_condition": 11170288.922506649,
+ "lr": 0.00034549150281252655,
+ "time_sec": 49.46177387237549
+ },
+ {
+ "epoch": 61,
+ "train_loss": 0.7588282846641541,
+ "train_acc": 0.7286,
+ "test_loss": 2.670531511688232,
+ "test_acc": 0.4198,
+ "lyapunov": null,
+ "grad_norm": 0.43898999083578233,
+ "grad_max_sv": 0.26667738817632197,
+ "grad_min_sv": 2.325178121154181e-08,
+ "grad_condition": 11623927.174902633,
+ "lr": 0.0003306310398773544,
+ "time_sec": 49.49580407142639
+ },
+ {
+ "epoch": 62,
+ "train_loss": 0.7492313718986511,
+ "train_acc": 0.73298,
+ "test_loss": 2.4778705802917482,
+ "test_acc": 0.449,
+ "lyapunov": null,
+ "grad_norm": 0.4417738790617677,
+ "grad_max_sv": 0.2574993997812271,
+ "grad_min_sv": 2.3859390374525445e-08,
+ "grad_condition": 10899105.692467105,
+ "lr": 0.00031593772365766127,
+ "time_sec": 49.486817836761475
+ },
+ {
+ "epoch": 63,
+ "train_loss": 0.7480638890266419,
+ "train_acc": 0.73324,
+ "test_loss": 2.1940598976135255,
+ "test_acc": 0.4734,
+ "lyapunov": null,
+ "grad_norm": 0.4366591281226868,
+ "grad_max_sv": 0.2512634038925171,
+ "grad_min_sv": 2.326989370082799e-08,
+ "grad_condition": 10851343.919251464,
+ "lr": 0.0003014260546826097,
+ "time_sec": 49.494584798812866
+ },
+ {
+ "epoch": 64,
+ "train_loss": 0.7451907014846801,
+ "train_acc": 0.73538,
+ "test_loss": 2.3143032501220704,
+ "test_acc": 0.4762,
+ "lyapunov": null,
+ "grad_norm": 0.4362314837898005,
+ "grad_max_sv": 0.2649652697145939,
+ "grad_min_sv": 2.3657484859995748e-08,
+ "grad_condition": 11323682.220760768,
+ "lr": 0.0002871103542174637,
+ "time_sec": 49.46461892127991
+ },
+ {
+ "epoch": 65,
+ "train_loss": 0.7316487748908996,
+ "train_acc": 0.73868,
+ "test_loss": 2.132633139801025,
+ "test_acc": 0.4893,
+ "lyapunov": null,
+ "grad_norm": 0.43117564557331234,
+ "grad_max_sv": 0.2554838340729475,
+ "grad_min_sv": 2.3040169683241628e-08,
+ "grad_condition": 11170455.423079647,
+ "lr": 0.0002730047501302267,
+ "time_sec": 49.4881227016449
+ },
+ {
+ "epoch": 66,
+ "train_loss": 0.7290266520881653,
+ "train_acc": 0.7408,
+ "test_loss": 2.396712022781372,
+ "test_acc": 0.4793,
+ "lyapunov": null,
+ "grad_norm": 0.43225303341958693,
+ "grad_max_sv": 0.2486136831343174,
+ "grad_min_sv": 2.2949348021938932e-08,
+ "grad_condition": 10962824.963370848,
+ "lr": 0.00025912316294914234,
+ "time_sec": 49.47016882896423
+ },
+ {
+ "epoch": 67,
+ "train_loss": 0.7191537443733216,
+ "train_acc": 0.74308,
+ "test_loss": 2.1576420639038085,
+ "test_acc": 0.4941,
+ "lyapunov": null,
+ "grad_norm": 0.42657147393758854,
+ "grad_max_sv": 0.2438450776040554,
+ "grad_min_sv": 2.3898531642529975e-08,
+ "grad_condition": 10287595.631951943,
+ "lr": 0.0002454792921248144,
+ "time_sec": 49.49215388298035
+ },
+ {
+ "epoch": 68,
+ "train_loss": 0.7169496524429322,
+ "train_acc": 0.74418,
+ "test_loss": 2.4695981254577637,
+ "test_acc": 0.4807,
+ "lyapunov": null,
+ "grad_norm": 0.4234097941028663,
+ "grad_max_sv": 0.24577417597174644,
+ "grad_min_sv": 2.2813544342525915e-08,
+ "grad_condition": 10779009.57251847,
+ "lr": 0.00023208660251050164,
+ "time_sec": 49.531681299209595
+ },
+ {
+ "epoch": 69,
+ "train_loss": 0.7072784723091126,
+ "train_acc": 0.74744,
+ "test_loss": 2.27939485244751,
+ "test_acc": 0.4853,
+ "lyapunov": null,
+ "grad_norm": 0.4251678846869415,
+ "grad_max_sv": 0.241105442866683,
+ "grad_min_sv": 2.3618906030975496e-08,
+ "grad_condition": 10243169.91188918,
+ "lr": 0.00021895831107393473,
+ "time_sec": 49.46745848655701
+ },
+ {
+ "epoch": 70,
+ "train_loss": 0.7093459980392456,
+ "train_acc": 0.74668,
+ "test_loss": 2.2168941738128662,
+ "test_acc": 0.4993,
+ "lyapunov": null,
+ "grad_norm": 0.4187232599688298,
+ "grad_max_sv": 0.2437821462750435,
+ "grad_min_sv": 2.330924906424059e-08,
+ "grad_condition": 10529543.438680641,
+ "lr": 0.00020610737385376356,
+ "time_sec": 49.46611166000366
+ },
+ {
+ "epoch": 71,
+ "train_loss": 0.7046173419761658,
+ "train_acc": 0.74866,
+ "test_loss": 2.6486716678619384,
+ "test_acc": 0.4604,
+ "lyapunov": null,
+ "grad_norm": 0.43152156311922873,
+ "grad_max_sv": 0.26821285113692284,
+ "grad_min_sv": 2.3308388552578663e-08,
+ "grad_condition": 11585490.938807528,
+ "lr": 0.00019354647317351177,
+ "time_sec": 49.484049558639526
+ },
+ {
+ "epoch": 72,
+ "train_loss": 0.6916852585601807,
+ "train_acc": 0.75164,
+ "test_loss": 2.4044878028869627,
+ "test_acc": 0.4868,
+ "lyapunov": null,
+ "grad_norm": 0.42974614402520106,
+ "grad_max_sv": 0.2577272642403841,
+ "grad_min_sv": 2.3734259935181968e-08,
+ "grad_condition": 10929944.700492647,
+ "lr": 0.0001812880051256552,
+ "time_sec": 49.47321033477783
+ },
+ {
+ "epoch": 73,
+ "train_loss": 0.6914860160255432,
+ "train_acc": 0.75462,
+ "test_loss": 2.459467795562744,
+ "test_acc": 0.4755,
+ "lyapunov": null,
+ "grad_norm": 0.4235499199054343,
+ "grad_max_sv": 0.2499073389917612,
+ "grad_min_sv": 2.312090292555524e-08,
+ "grad_condition": 10928192.758700397,
+ "lr": 0.00016934406733817422,
+ "time_sec": 49.47536325454712
+ },
+ {
+ "epoch": 74,
+ "train_loss": 0.6900841831016541,
+ "train_acc": 0.75346,
+ "test_loss": 2.529036985015869,
+ "test_acc": 0.4694,
+ "lyapunov": null,
+ "grad_norm": 0.4200493463432216,
+ "grad_max_sv": 0.24829606115818023,
+ "grad_min_sv": 2.3347005217999595e-08,
+ "grad_condition": 10777473.575533265,
+ "lr": 0.0001577264470356557,
+ "time_sec": 49.47671389579773
+ },
+ {
+ "epoch": 75,
+ "train_loss": 0.6844219914627075,
+ "train_acc": 0.75664,
+ "test_loss": 2.7192491188049317,
+ "test_acc": 0.4659,
+ "lyapunov": null,
+ "grad_norm": 0.41891725324120427,
+ "grad_max_sv": 0.2549721471965313,
+ "grad_min_sv": 2.308645701276646e-08,
+ "grad_condition": 11178421.697050892,
+ "lr": 0.00014644660940672634,
+ "time_sec": 49.475868701934814
+ },
+ {
+ "epoch": 76,
+ "train_loss": 0.6757127567672729,
+ "train_acc": 0.76002,
+ "test_loss": 2.228153326416016,
+ "test_acc": 0.4719,
+ "lyapunov": null,
+ "grad_norm": 0.41518783756559813,
+ "grad_max_sv": 0.24106829576194286,
+ "grad_min_sv": 2.3467413079458765e-08,
+ "grad_condition": 10331945.898118276,
+ "lr": 0.0001355156862892944,
+ "time_sec": 49.47853899002075
+ },
+ {
+ "epoch": 77,
+ "train_loss": 0.6663033656692505,
+ "train_acc": 0.7606,
+ "test_loss": 2.5164624114990235,
+ "test_acc": 0.4627,
+ "lyapunov": null,
+ "grad_norm": 0.41866630242016806,
+ "grad_max_sv": 0.2701979674398899,
+ "grad_min_sv": 2.4135091125643272e-08,
+ "grad_condition": 11260755.273271866,
+ "lr": 0.00012494446518477025,
+ "time_sec": 49.47706151008606
+ },
+ {
+ "epoch": 78,
+ "train_loss": 0.6645314185142517,
+ "train_acc": 0.76252,
+ "test_loss": 2.8226414447784425,
+ "test_acc": 0.4614,
+ "lyapunov": null,
+ "grad_norm": 0.4173542916715373,
+ "grad_max_sv": 0.2490392465144396,
+ "grad_min_sv": 2.3206901200722994e-08,
+ "grad_condition": 10823280.058633823,
+ "lr": 0.00011474337861210548,
+ "time_sec": 49.483954191207886
+ },
+ {
+ "epoch": 79,
+ "train_loss": 0.6665540114593506,
+ "train_acc": 0.76016,
+ "test_loss": 2.2122913623809812,
+ "test_acc": 0.4819,
+ "lyapunov": null,
+ "grad_norm": 0.4188547510844498,
+ "grad_max_sv": 0.25715495869517324,
+ "grad_min_sv": 2.4195212988686877e-08,
+ "grad_condition": 10755821.867443344,
+ "lr": 0.00010492249381215483,
+ "time_sec": 49.46640372276306
+ },
+ {
+ "epoch": 80,
+ "train_loss": 0.6579594387054444,
+ "train_acc": 0.76406,
+ "test_loss": 2.328022619628906,
+ "test_acc": 0.4922,
+ "lyapunov": null,
+ "grad_norm": 0.41446019268915407,
+ "grad_max_sv": 0.2467421844601631,
+ "grad_min_sv": 2.3609747978881047e-08,
+ "grad_condition": 10542743.78062649,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 49.47466158866882
+ },
+ {
+ "epoch": 81,
+ "train_loss": 0.6575078699111938,
+ "train_acc": 0.76504,
+ "test_loss": 2.435921426773071,
+ "test_acc": 0.4706,
+ "lyapunov": null,
+ "grad_norm": 0.41722587257024396,
+ "grad_max_sv": 0.2460654556751251,
+ "grad_min_sv": 2.2818005085412097e-08,
+ "grad_condition": 10871762.933690486,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 49.48575758934021
+ },
+ {
+ "epoch": 82,
+ "train_loss": 0.6540266362380981,
+ "train_acc": 0.7668,
+ "test_loss": 2.420010438537598,
+ "test_acc": 0.4873,
+ "lyapunov": null,
+ "grad_norm": 0.4134489054266664,
+ "grad_max_sv": 0.24872095324099064,
+ "grad_min_sv": 2.4063159953513492e-08,
+ "grad_condition": 10418409.724400165,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 49.4517502784729
+ },
+ {
+ "epoch": 83,
+ "train_loss": 0.6572029878616333,
+ "train_acc": 0.76728,
+ "test_loss": 2.509574550628662,
+ "test_acc": 0.4741,
+ "lyapunov": null,
+ "grad_norm": 0.40888921626022273,
+ "grad_max_sv": 0.24261515885591506,
+ "grad_min_sv": 2.325806733871616e-08,
+ "grad_condition": 10519103.211694924,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 49.47699522972107
+ },
+ {
+ "epoch": 84,
+ "train_loss": 0.648239343738556,
+ "train_acc": 0.76774,
+ "test_loss": 2.2645148223876954,
+ "test_acc": 0.485,
+ "lyapunov": null,
+ "grad_norm": 0.4120785615672335,
+ "grad_max_sv": 0.24379208087921142,
+ "grad_min_sv": 2.272370744904606e-08,
+ "grad_condition": 10771039.526767144,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 49.461183071136475
+ },
+ {
+ "epoch": 85,
+ "train_loss": 0.6412541982460022,
+ "train_acc": 0.77106,
+ "test_loss": 2.5437144912719725,
+ "test_acc": 0.4865,
+ "lyapunov": null,
+ "grad_norm": 0.41805406865324773,
+ "grad_max_sv": 0.2572408441454172,
+ "grad_min_sv": 2.2814066324983172e-08,
+ "grad_condition": 11337861.01159941,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 49.47793769836426
+ },
+ {
+ "epoch": 86,
+ "train_loss": 0.6463544520187378,
+ "train_acc": 0.76662,
+ "test_loss": 2.9264222496032715,
+ "test_acc": 0.4471,
+ "lyapunov": null,
+ "grad_norm": 0.4118969055764605,
+ "grad_max_sv": 0.2387235414236784,
+ "grad_min_sv": 2.2642364694291928e-08,
+ "grad_condition": 10550361.803450387,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 49.4726197719574
+ },
+ {
+ "epoch": 87,
+ "train_loss": 0.6428634425735473,
+ "train_acc": 0.7704,
+ "test_loss": 2.5568968086242676,
+ "test_acc": 0.4759,
+ "lyapunov": null,
+ "grad_norm": 0.415046593792845,
+ "grad_max_sv": 0.2535580638796091,
+ "grad_min_sv": 2.363120126247509e-08,
+ "grad_condition": 10837761.433894884,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 49.48099684715271
+ },
+ {
+ "epoch": 88,
+ "train_loss": 0.6407405834579468,
+ "train_acc": 0.77184,
+ "test_loss": 2.4600058319091795,
+ "test_acc": 0.475,
+ "lyapunov": null,
+ "grad_norm": 0.4135582126787873,
+ "grad_max_sv": 0.25508003048598765,
+ "grad_min_sv": 2.376858407870941e-08,
+ "grad_condition": 10837781.081215866,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 49.47017812728882
+ },
+ {
+ "epoch": 89,
+ "train_loss": 0.6344939192008973,
+ "train_acc": 0.77288,
+ "test_loss": 2.4250204902648926,
+ "test_acc": 0.4787,
+ "lyapunov": null,
+ "grad_norm": 0.4160361292383021,
+ "grad_max_sv": 0.25198650658130645,
+ "grad_min_sv": 2.3671872506625392e-08,
+ "grad_condition": 10764847.245073054,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 49.48287224769592
+ },
+ {
+ "epoch": 90,
+ "train_loss": 0.6344009274482727,
+ "train_acc": 0.77354,
+ "test_loss": 2.7001010314941407,
+ "test_acc": 0.4623,
+ "lyapunov": null,
+ "grad_norm": 0.4089648902673904,
+ "grad_max_sv": 0.24975020438432693,
+ "grad_min_sv": 2.2971467306120984e-08,
+ "grad_condition": 10990208.207150657,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 49.50636339187622
+ },
+ {
+ "epoch": 91,
+ "train_loss": 0.6388888354110718,
+ "train_acc": 0.77322,
+ "test_loss": 2.4007692584991456,
+ "test_acc": 0.482,
+ "lyapunov": null,
+ "grad_norm": 0.41394740295503574,
+ "grad_max_sv": 0.24785541072487832,
+ "grad_min_sv": 2.4093225903243366e-08,
+ "grad_condition": 10380601.978368312,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 49.47446608543396
+ },
+ {
+ "epoch": 92,
+ "train_loss": 0.6364776765632629,
+ "train_acc": 0.7745,
+ "test_loss": 2.399016780090332,
+ "test_acc": 0.4893,
+ "lyapunov": null,
+ "grad_norm": 0.4144776850028884,
+ "grad_max_sv": 0.23398316986858844,
+ "grad_min_sv": 2.3364770829203963e-08,
+ "grad_condition": 10152213.637178902,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 49.4903450012207
+ },
+ {
+ "epoch": 93,
+ "train_loss": 0.6323039393615723,
+ "train_acc": 0.7761,
+ "test_loss": 2.5661166526794434,
+ "test_acc": 0.4799,
+ "lyapunov": null,
+ "grad_norm": 0.4148058440423859,
+ "grad_max_sv": 0.25038140527904035,
+ "grad_min_sv": 2.3675201843431638e-08,
+ "grad_condition": 10621575.74650034,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 49.47283339500427
+ },
+ {
+ "epoch": 94,
+ "train_loss": 0.6312036778831482,
+ "train_acc": 0.77456,
+ "test_loss": 2.4954245025634765,
+ "test_acc": 0.4884,
+ "lyapunov": null,
+ "grad_norm": 0.41190158928123094,
+ "grad_max_sv": 0.23922828286886216,
+ "grad_min_sv": 2.3207600818864195e-08,
+ "grad_condition": 10426944.434691576,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 49.4705286026001
+ },
+ {
+ "epoch": 95,
+ "train_loss": 0.631898609752655,
+ "train_acc": 0.77374,
+ "test_loss": 2.496735878753662,
+ "test_acc": 0.484,
+ "lyapunov": null,
+ "grad_norm": 0.4118919272482802,
+ "grad_max_sv": 0.2545221421867609,
+ "grad_min_sv": 2.265429692727139e-08,
+ "grad_condition": 11229071.176658351,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 49.45284724235535
+ },
+ {
+ "epoch": 96,
+ "train_loss": 0.6379076655197143,
+ "train_acc": 0.77178,
+ "test_loss": 2.6363272483825684,
+ "test_acc": 0.476,
+ "lyapunov": null,
+ "grad_norm": 0.4109637736779776,
+ "grad_max_sv": 0.23244931511580944,
+ "grad_min_sv": 2.2822463163763017e-08,
+ "grad_condition": 10301145.344649881,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 49.47940802574158
+ },
+ {
+ "epoch": 97,
+ "train_loss": 0.6325872544288635,
+ "train_acc": 0.77334,
+ "test_loss": 2.7118479751586912,
+ "test_acc": 0.4606,
+ "lyapunov": null,
+ "grad_norm": 0.4111072193471729,
+ "grad_max_sv": 0.23797121047973632,
+ "grad_min_sv": 2.2607291239040707e-08,
+ "grad_condition": 10688228.14219837,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 49.482439041137695
+ },
+ {
+ "epoch": 98,
+ "train_loss": 0.6342727423286438,
+ "train_acc": 0.77484,
+ "test_loss": 2.50120391998291,
+ "test_acc": 0.4868,
+ "lyapunov": null,
+ "grad_norm": 0.4137394255148928,
+ "grad_max_sv": 0.24089130759239197,
+ "grad_min_sv": 2.424639040654597e-08,
+ "grad_condition": 10056603.153747398,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 49.48271298408508
+ },
+ {
+ "epoch": 99,
+ "train_loss": 0.628259766407013,
+ "train_acc": 0.77486,
+ "test_loss": 2.447319179916382,
+ "test_acc": 0.4885,
+ "lyapunov": null,
+ "grad_norm": 0.4076037809536703,
+ "grad_max_sv": 0.25056461431086063,
+ "grad_min_sv": 2.3701171647516616e-08,
+ "grad_condition": 10626762.207877642,
+ "lr": 2.467198171342e-07,
+ "time_sec": 49.45984363555908
+ },
+ {
+ "epoch": 100,
+ "train_loss": 0.6313758395767212,
+ "train_acc": 0.77534,
+ "test_loss": 2.4442952224731447,
+ "test_acc": 0.4905,
+ "lyapunov": null,
+ "grad_norm": 0.40858498927976306,
+ "grad_max_sv": 0.23060753419995308,
+ "grad_min_sv": 2.2785150743942496e-08,
+ "grad_condition": 10116355.973472353,
+ "lr": 0.0,
+ "time_sec": 49.46379518508911
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 2.717775194091797,
+ "train_acc": 0.12228,
+ "test_loss": 3.3459623817443847,
+ "test_acc": 0.1,
+ "lyapunov": null,
+ "grad_norm": 7.716699984005914,
+ "grad_max_sv": 7.287460565567017,
+ "grad_min_sv": 2.5165389772041635e-07,
+ "grad_condition": 29456429.211788226,
+ "lr": 0.0009997532801828658,
+ "time_sec": 66.53277444839478
+ },
+ {
+ "epoch": 2,
+ "train_loss": 2.2721379792785643,
+ "train_acc": 0.17654,
+ "test_loss": 4.04989028930664,
+ "test_acc": 0.1003,
+ "lyapunov": null,
+ "grad_norm": 6.63637414556116,
+ "grad_max_sv": 6.237935948371887,
+ "grad_min_sv": 2.2601446723058415e-07,
+ "grad_condition": 28188789.96425259,
+ "lr": 0.0009990133642141358,
+ "time_sec": 66.55316853523254
+ },
+ {
+ "epoch": 3,
+ "train_loss": 2.137921618881226,
+ "train_acc": 0.2105,
+ "test_loss": 5.869428012084961,
+ "test_acc": 0.1011,
+ "lyapunov": null,
+ "grad_norm": 5.7520031644476814,
+ "grad_max_sv": 5.452845233678818,
+ "grad_min_sv": 1.9201941405810886e-07,
+ "grad_condition": 28919609.465649594,
+ "lr": 0.00099778098230154,
+ "time_sec": 66.56071186065674
+ },
+ {
+ "epoch": 4,
+ "train_loss": 2.0486733519744873,
+ "train_acc": 0.23394,
+ "test_loss": 5.161107911682129,
+ "test_acc": 0.1097,
+ "lyapunov": null,
+ "grad_norm": 4.91519980042541,
+ "grad_max_sv": 4.5814680576324465,
+ "grad_min_sv": 1.6788343710771868e-07,
+ "grad_condition": 27707547.33712595,
+ "lr": 0.000996057350657239,
+ "time_sec": 66.55148816108704
+ },
+ {
+ "epoch": 5,
+ "train_loss": 1.9897926804351806,
+ "train_acc": 0.25822,
+ "test_loss": 4.115356592559815,
+ "test_acc": 0.1203,
+ "lyapunov": null,
+ "grad_norm": 4.476936137063571,
+ "grad_max_sv": 4.264879077672958,
+ "grad_min_sv": 1.6287330311115512e-07,
+ "grad_condition": 27434565.90350554,
+ "lr": 0.0009938441702975688,
+ "time_sec": 66.53483939170837
+ },
+ {
+ "epoch": 6,
+ "train_loss": 1.950422788543701,
+ "train_acc": 0.26598,
+ "test_loss": 6.161662875366211,
+ "test_acc": 0.1038,
+ "lyapunov": null,
+ "grad_norm": 4.078084494569751,
+ "grad_max_sv": 3.8316186487674715,
+ "grad_min_sv": 1.5860823996405315e-07,
+ "grad_condition": 24946451.178036533,
+ "lr": 0.0009911436253643444,
+ "time_sec": 66.544926404953
+ },
+ {
+ "epoch": 7,
+ "train_loss": 1.9193549822998046,
+ "train_acc": 0.28804,
+ "test_loss": 6.333303915405273,
+ "test_acc": 0.1006,
+ "lyapunov": null,
+ "grad_norm": 3.9544625089709906,
+ "grad_max_sv": 3.660486602783203,
+ "grad_min_sv": 1.3159545346752567e-07,
+ "grad_condition": 27858533.203216422,
+ "lr": 0.0009879583809693736,
+ "time_sec": 66.54343152046204
+ },
+ {
+ "epoch": 8,
+ "train_loss": 1.8974505254364014,
+ "train_acc": 0.29166,
+ "test_loss": 6.595959260559082,
+ "test_acc": 0.1052,
+ "lyapunov": null,
+ "grad_norm": 3.7716319720252063,
+ "grad_max_sv": 3.4488155782222747,
+ "grad_min_sv": 1.3156188991558792e-07,
+ "grad_condition": 26979104.149509914,
+ "lr": 0.0009842915805643154,
+ "time_sec": 66.53689360618591
+ },
+ {
+ "epoch": 9,
+ "train_loss": 1.8757565868377686,
+ "train_acc": 0.2988,
+ "test_loss": 8.294800563049316,
+ "test_acc": 0.1001,
+ "lyapunov": null,
+ "grad_norm": 3.606736816077247,
+ "grad_max_sv": 3.276396805047989,
+ "grad_min_sv": 1.2148574111137122e-07,
+ "grad_condition": 27354129.68622259,
+ "lr": 0.0009801468428384714,
+ "time_sec": 66.53859829902649
+ },
+ {
+ "epoch": 10,
+ "train_loss": 1.853810763168335,
+ "train_acc": 0.30818,
+ "test_loss": 7.528170121765137,
+ "test_acc": 0.1002,
+ "lyapunov": null,
+ "grad_norm": 3.590286745766664,
+ "grad_max_sv": 3.3836376488208773,
+ "grad_min_sv": 1.2300289498057282e-07,
+ "grad_condition": 28478996.179412544,
+ "lr": 0.0009755282581475767,
+ "time_sec": 66.54752492904663
+ },
+ {
+ "epoch": 11,
+ "train_loss": 1.8360865605926513,
+ "train_acc": 0.31554,
+ "test_loss": 8.300324632263184,
+ "test_acc": 0.1004,
+ "lyapunov": null,
+ "grad_norm": 3.4184867147228633,
+ "grad_max_sv": 3.2137346804141997,
+ "grad_min_sv": 1.2349632871888616e-07,
+ "grad_condition": 27052165.93028751,
+ "lr": 0.0009704403844771127,
+ "time_sec": 66.54567265510559
+ },
+ {
+ "epoch": 12,
+ "train_loss": 1.822631957397461,
+ "train_acc": 0.32436,
+ "test_loss": 7.752643719482422,
+ "test_acc": 0.1021,
+ "lyapunov": null,
+ "grad_norm": 3.4268104192911824,
+ "grad_max_sv": 3.0984551936388014,
+ "grad_min_sv": 1.1916837276970682e-07,
+ "grad_condition": 26678795.929163624,
+ "lr": 0.0009648882429441257,
+ "time_sec": 66.54143714904785
+ },
+ {
+ "epoch": 13,
+ "train_loss": 1.8042937320327759,
+ "train_acc": 0.33052,
+ "test_loss": 6.320642838287354,
+ "test_acc": 0.1016,
+ "lyapunov": null,
+ "grad_norm": 3.26500321242579,
+ "grad_max_sv": 3.034997683763504,
+ "grad_min_sv": 1.1198519924704443e-07,
+ "grad_condition": 27516714.34616376,
+ "lr": 0.0009588773128419905,
+ "time_sec": 66.54663801193237
+ },
+ {
+ "epoch": 14,
+ "train_loss": 1.7935633684539796,
+ "train_acc": 0.33378,
+ "test_loss": 8.591533955383301,
+ "test_acc": 0.1001,
+ "lyapunov": null,
+ "grad_norm": 3.205935962438017,
+ "grad_max_sv": 2.9335897117853165,
+ "grad_min_sv": 1.0952790088225584e-07,
+ "grad_condition": 27285541.83012454,
+ "lr": 0.0009524135262330098,
+ "time_sec": 66.54473447799683
+ },
+ {
+ "epoch": 15,
+ "train_loss": 1.7773359481811524,
+ "train_acc": 0.34102,
+ "test_loss": 9.823327029418945,
+ "test_acc": 0.1,
+ "lyapunov": null,
+ "grad_norm": 3.107803718888726,
+ "grad_max_sv": 2.8818213611841204,
+ "grad_min_sv": 1.1047076302617142e-07,
+ "grad_condition": 26466849.950957365,
+ "lr": 0.0009455032620941839,
+ "time_sec": 66.54632878303528
+ },
+ {
+ "epoch": 16,
+ "train_loss": 1.7638415741348266,
+ "train_acc": 0.3494,
+ "test_loss": 10.98111782836914,
+ "test_acc": 0.1,
+ "lyapunov": null,
+ "grad_norm": 2.991047436873543,
+ "grad_max_sv": 2.6788798362016677,
+ "grad_min_sv": 9.756340197952796e-08,
+ "grad_condition": 27546377.57163794,
+ "lr": 0.0009381533400219318,
+ "time_sec": 66.5387659072876
+ },
+ {
+ "epoch": 17,
+ "train_loss": 1.7545028717422486,
+ "train_acc": 0.3524,
+ "test_loss": 8.496100090026856,
+ "test_acc": 0.1005,
+ "lyapunov": null,
+ "grad_norm": 2.9405206102474817,
+ "grad_max_sv": 2.7797821670770646,
+ "grad_min_sv": 1.0545847413112597e-07,
+ "grad_condition": 26402272.837948732,
+ "lr": 0.0009303710135019719,
+ "time_sec": 66.53228521347046
+ },
+ {
+ "epoch": 18,
+ "train_loss": 1.7399513541412353,
+ "train_acc": 0.35946,
+ "test_loss": 9.442770735168457,
+ "test_acc": 0.1002,
+ "lyapunov": null,
+ "grad_norm": 2.876673477887061,
+ "grad_max_sv": 2.652202320098877,
+ "grad_min_sv": 1.0433013795108081e-07,
+ "grad_condition": 26098642.755907767,
+ "lr": 0.0009221639627510076,
+ "time_sec": 66.52799201011658
+ },
+ {
+ "epoch": 19,
+ "train_loss": 1.7275141513061523,
+ "train_acc": 0.36564,
+ "test_loss": 8.60740804901123,
+ "test_acc": 0.1,
+ "lyapunov": null,
+ "grad_norm": 2.820914668477109,
+ "grad_max_sv": 2.8074967473745347,
+ "grad_min_sv": 1.0515814725664541e-07,
+ "grad_condition": 27554948.172257036,
+ "lr": 0.000913540287137281,
+ "time_sec": 66.53072094917297
+ },
+ {
+ "epoch": 20,
+ "train_loss": 1.7184981283187866,
+ "train_acc": 0.36706,
+ "test_loss": 5.74347527923584,
+ "test_acc": 0.1074,
+ "lyapunov": null,
+ "grad_norm": 2.755999508826315,
+ "grad_max_sv": 2.4683564633131025,
+ "grad_min_sv": 9.147877104709323e-08,
+ "grad_condition": 27108387.83832861,
+ "lr": 0.0009045084971874739,
+ "time_sec": 66.53930997848511
+ },
+ {
+ "epoch": 21,
+ "train_loss": 1.7127495180892944,
+ "train_acc": 0.36988,
+ "test_loss": 5.374083380126953,
+ "test_acc": 0.1038,
+ "lyapunov": null,
+ "grad_norm": 2.7076782774581156,
+ "grad_max_sv": 2.415825995802879,
+ "grad_min_sv": 9.989069553739682e-08,
+ "grad_condition": 24996642.26521779,
+ "lr": 0.0008950775061878452,
+ "time_sec": 66.5274007320404
+ },
+ {
+ "epoch": 22,
+ "train_loss": 1.7080568863677978,
+ "train_acc": 0.37366,
+ "test_loss": 5.8365667526245115,
+ "test_acc": 0.1074,
+ "lyapunov": null,
+ "grad_norm": 2.777540200252398,
+ "grad_max_sv": 2.682383918762207,
+ "grad_min_sv": 1.0115953053002613e-07,
+ "grad_condition": 27062321.26943115,
+ "lr": 0.0008852566213878947,
+ "time_sec": 66.52736306190491
+ },
+ {
+ "epoch": 23,
+ "train_loss": 1.6937433179473877,
+ "train_acc": 0.378,
+ "test_loss": 5.908844201660156,
+ "test_acc": 0.102,
+ "lyapunov": null,
+ "grad_norm": 2.5943120813718052,
+ "grad_max_sv": 2.4230685472488402,
+ "grad_min_sv": 9.802377860523848e-08,
+ "grad_condition": 25663315.966033876,
+ "lr": 0.0008750555348152298,
+ "time_sec": 66.55514574050903
+ },
+ {
+ "epoch": 24,
+ "train_loss": 1.685849613647461,
+ "train_acc": 0.38486,
+ "test_loss": 6.484691570281982,
+ "test_acc": 0.1015,
+ "lyapunov": null,
+ "grad_norm": 2.470392685402757,
+ "grad_max_sv": 2.3409340023994445,
+ "grad_min_sv": 9.386610759776204e-08,
+ "grad_condition": 25307930.60423732,
+ "lr": 0.0008644843137107057,
+ "time_sec": 66.55581784248352
+ },
+ {
+ "epoch": 25,
+ "train_loss": 1.6830421477890014,
+ "train_acc": 0.38556,
+ "test_loss": 7.468188558959961,
+ "test_acc": 0.1022,
+ "lyapunov": null,
+ "grad_norm": 2.548563020510745,
+ "grad_max_sv": 2.1459918454289437,
+ "grad_min_sv": 8.803468158902205e-08,
+ "grad_condition": 24944715.33907653,
+ "lr": 0.0008535533905932737,
+ "time_sec": 66.53887248039246
+ },
+ {
+ "epoch": 26,
+ "train_loss": 1.6700520505523682,
+ "train_acc": 0.38856,
+ "test_loss": 7.895222584533691,
+ "test_acc": 0.1009,
+ "lyapunov": null,
+ "grad_norm": 2.5359070370837204,
+ "grad_max_sv": 2.4539994060993195,
+ "grad_min_sv": 9.640742533179037e-08,
+ "grad_condition": 26335532.748314124,
+ "lr": 0.0008422735529643444,
+ "time_sec": 66.54404091835022
+ },
+ {
+ "epoch": 27,
+ "train_loss": 1.6605180406951905,
+ "train_acc": 0.39334,
+ "test_loss": 6.994429248046875,
+ "test_acc": 0.101,
+ "lyapunov": null,
+ "grad_norm": 2.4258405770471474,
+ "grad_max_sv": 2.320448189973831,
+ "grad_min_sv": 9.107987271050888e-08,
+ "grad_condition": 26102152.790860306,
+ "lr": 0.0008306559326618259,
+ "time_sec": 66.53805947303772
+ },
+ {
+ "epoch": 28,
+ "train_loss": 1.6567610062408447,
+ "train_acc": 0.395,
+ "test_loss": 6.368250694274902,
+ "test_acc": 0.1099,
+ "lyapunov": null,
+ "grad_norm": 2.4482138479454654,
+ "grad_max_sv": 2.1421856224536895,
+ "grad_min_sv": 8.29846632299791e-08,
+ "grad_condition": 25968573.760956615,
+ "lr": 0.0008187119948743449,
+ "time_sec": 66.56613659858704
+ },
+ {
+ "epoch": 29,
+ "train_loss": 1.643007601623535,
+ "train_acc": 0.39978,
+ "test_loss": 5.360125735473633,
+ "test_acc": 0.1039,
+ "lyapunov": null,
+ "grad_norm": 2.4260201472737237,
+ "grad_max_sv": 2.2909662395715715,
+ "grad_min_sv": 9.427450295973471e-08,
+ "grad_condition": 24999199.08130427,
+ "lr": 0.0008064535268264883,
+ "time_sec": 66.5019998550415
+ },
+ {
+ "epoch": 30,
+ "train_loss": 1.6426652933120727,
+ "train_acc": 0.40242,
+ "test_loss": 5.846046133422852,
+ "test_acc": 0.1054,
+ "lyapunov": null,
+ "grad_norm": 2.4104230560175877,
+ "grad_max_sv": 2.2003868728876115,
+ "grad_min_sv": 8.557402386699664e-08,
+ "grad_condition": 26105024.01238749,
+ "lr": 0.0007938926261462367,
+ "time_sec": 66.54244065284729
+ },
+ {
+ "epoch": 31,
+ "train_loss": 1.6377650901031495,
+ "train_acc": 0.4032,
+ "test_loss": 5.6720462432861325,
+ "test_acc": 0.1037,
+ "lyapunov": null,
+ "grad_norm": 2.3941082742204367,
+ "grad_max_sv": 2.1774697691202163,
+ "grad_min_sv": 8.963231525882521e-08,
+ "grad_condition": 24809583.231536172,
+ "lr": 0.0007810416889260654,
+ "time_sec": 66.54210758209229
+ },
+ {
+ "epoch": 32,
+ "train_loss": 1.6306892547607421,
+ "train_acc": 0.40602,
+ "test_loss": 6.530587504577637,
+ "test_acc": 0.1021,
+ "lyapunov": null,
+ "grad_norm": 2.310788163521601,
+ "grad_max_sv": 2.3168098986148835,
+ "grad_min_sv": 8.591319300421674e-08,
+ "grad_condition": 27429040.418645225,
+ "lr": 0.0007679133974894983,
+ "time_sec": 66.54988598823547
+ },
+ {
+ "epoch": 33,
+ "train_loss": 1.616210421142578,
+ "train_acc": 0.41068,
+ "test_loss": 6.481897874450683,
+ "test_acc": 0.1047,
+ "lyapunov": null,
+ "grad_norm": 2.280822445658443,
+ "grad_max_sv": 2.0465356022119523,
+ "grad_min_sv": 8.811248948248363e-08,
+ "grad_condition": 23945215.471904326,
+ "lr": 0.0007545207078751857,
+ "time_sec": 66.54384207725525
+ },
+ {
+ "epoch": 34,
+ "train_loss": 1.6103173712921142,
+ "train_acc": 0.4129,
+ "test_loss": 7.558738642883301,
+ "test_acc": 0.1004,
+ "lyapunov": null,
+ "grad_norm": 2.268328370380239,
+ "grad_max_sv": 1.9925297170877456,
+ "grad_min_sv": 8.015654646698067e-08,
+ "grad_condition": 25172747.9746131,
+ "lr": 0.0007408768370508577,
+ "time_sec": 66.53899669647217
+ },
+ {
+ "epoch": 35,
+ "train_loss": 1.6033166294860839,
+ "train_acc": 0.41878,
+ "test_loss": 7.87334995880127,
+ "test_acc": 0.1014,
+ "lyapunov": null,
+ "grad_norm": 2.1857354046879727,
+ "grad_max_sv": 1.9975714191794396,
+ "grad_min_sv": 7.650004620884943e-08,
+ "grad_condition": 26089987.057969414,
+ "lr": 0.0007269952498697734,
+ "time_sec": 66.5277693271637
+ },
+ {
+ "epoch": 36,
+ "train_loss": 1.6046894992446898,
+ "train_acc": 0.41892,
+ "test_loss": 8.474886727905274,
+ "test_acc": 0.1054,
+ "lyapunov": null,
+ "grad_norm": 2.192178860403557,
+ "grad_max_sv": 2.002661418914795,
+ "grad_min_sv": 8.41961090181087e-08,
+ "grad_condition": 24123592.75292515,
+ "lr": 0.0007128896457825364,
+ "time_sec": 66.54011392593384
+ },
+ {
+ "epoch": 37,
+ "train_loss": 1.5938314058685303,
+ "train_acc": 0.42164,
+ "test_loss": 7.729584867858887,
+ "test_acc": 0.1023,
+ "lyapunov": null,
+ "grad_norm": 2.181177891654343,
+ "grad_max_sv": 2.0365157604217528,
+ "grad_min_sv": 8.0202053975853e-08,
+ "grad_condition": 26197254.249608647,
+ "lr": 0.0006985739453173903,
+ "time_sec": 66.53632307052612
+ },
+ {
+ "epoch": 38,
+ "train_loss": 1.5886405113220214,
+ "train_acc": 0.42264,
+ "test_loss": 5.7885481513977055,
+ "test_acc": 0.1062,
+ "lyapunov": null,
+ "grad_norm": 2.138587269147521,
+ "grad_max_sv": 1.933423602581024,
+ "grad_min_sv": 7.520017115680844e-08,
+ "grad_condition": 25928003.19539905,
+ "lr": 0.0006840622763423391,
+ "time_sec": 66.54145908355713
+ },
+ {
+ "epoch": 39,
+ "train_loss": 1.5804911177825929,
+ "train_acc": 0.42612,
+ "test_loss": 6.7240009689331055,
+ "test_acc": 0.106,
+ "lyapunov": null,
+ "grad_norm": 2.146582724428281,
+ "grad_max_sv": 1.8961839854717255,
+ "grad_min_sv": 7.674624242781647e-08,
+ "grad_condition": 24938086.191727363,
+ "lr": 0.0006693689601226458,
+ "time_sec": 66.54460453987122
+ },
+ {
+ "epoch": 40,
+ "train_loss": 1.5785979819488525,
+ "train_acc": 0.42734,
+ "test_loss": 6.793812344360352,
+ "test_acc": 0.1033,
+ "lyapunov": null,
+ "grad_norm": 2.0524354853565967,
+ "grad_max_sv": 1.9275713503360747,
+ "grad_min_sv": 7.654831097880788e-08,
+ "grad_condition": 25599705.595900334,
+ "lr": 0.0006545084971874737,
+ "time_sec": 66.78280329704285
+ },
+ {
+ "epoch": 41,
+ "train_loss": 1.5828138892364503,
+ "train_acc": 0.42612,
+ "test_loss": 6.44511951751709,
+ "test_acc": 0.1052,
+ "lyapunov": null,
+ "grad_norm": 2.1085813246105163,
+ "grad_max_sv": 1.9095334649085998,
+ "grad_min_sv": 7.941251247700621e-08,
+ "grad_condition": 24686632.04929278,
+ "lr": 0.0006394955530196147,
+ "time_sec": 66.53900074958801
+ },
+ {
+ "epoch": 42,
+ "train_loss": 1.5717257321548461,
+ "train_acc": 0.42996,
+ "test_loss": 8.174863388061523,
+ "test_acc": 0.1011,
+ "lyapunov": null,
+ "grad_norm": 2.0568855518830627,
+ "grad_max_sv": 1.8603438019752503,
+ "grad_min_sv": 8.168111662598676e-08,
+ "grad_condition": 23782864.12280636,
+ "lr": 0.0006243449435824273,
+ "time_sec": 66.54205513000488
+ },
+ {
+ "epoch": 43,
+ "train_loss": 1.562401286239624,
+ "train_acc": 0.43392,
+ "test_loss": 7.7131751495361325,
+ "test_acc": 0.1014,
+ "lyapunov": null,
+ "grad_norm": 2.0119184672620642,
+ "grad_max_sv": 1.8657386392354964,
+ "grad_min_sv": 7.582975278808135e-08,
+ "grad_condition": 24942971.18450144,
+ "lr": 0.0006090716206982714,
+ "time_sec": 66.53042316436768
+ },
+ {
+ "epoch": 44,
+ "train_loss": 1.5541102393341064,
+ "train_acc": 0.43712,
+ "test_loss": 8.247987678527831,
+ "test_acc": 0.1011,
+ "lyapunov": null,
+ "grad_norm": 1.9482695609274137,
+ "grad_max_sv": 1.6971077546477318,
+ "grad_min_sv": 7.249982623136474e-08,
+ "grad_condition": 23783887.230844818,
+ "lr": 0.0005936906572928625,
+ "time_sec": 66.5365047454834
+ },
+ {
+ "epoch": 45,
+ "train_loss": 1.551253000793457,
+ "train_acc": 0.43906,
+ "test_loss": 7.164133547973633,
+ "test_acc": 0.1021,
+ "lyapunov": null,
+ "grad_norm": 1.9478309625288126,
+ "grad_max_sv": 1.7972041130065919,
+ "grad_min_sv": 7.798710131012853e-08,
+ "grad_condition": 23697966.26066207,
+ "lr": 0.0005782172325201156,
+ "time_sec": 66.54136061668396
+ },
+ {
+ "epoch": 46,
+ "train_loss": 1.541000611190796,
+ "train_acc": 0.44134,
+ "test_loss": 6.376314013671875,
+ "test_acc": 0.1045,
+ "lyapunov": null,
+ "grad_norm": 1.8630241109997108,
+ "grad_max_sv": 1.6913443714380265,
+ "grad_min_sv": 7.214549819778427e-08,
+ "grad_condition": 23808757.926116575,
+ "lr": 0.0005626666167821523,
+ "time_sec": 66.55902171134949
+ },
+ {
+ "epoch": 47,
+ "train_loss": 1.5372591391754151,
+ "train_acc": 0.44398,
+ "test_loss": 6.5030721710205075,
+ "test_acc": 0.1069,
+ "lyapunov": null,
+ "grad_norm": 1.9024590490680153,
+ "grad_max_sv": 1.814224436879158,
+ "grad_min_sv": 7.368249033135044e-08,
+ "grad_condition": 25117471.09981022,
+ "lr": 0.0005470541566592572,
+ "time_sec": 66.52199673652649
+ },
+ {
+ "epoch": 48,
+ "train_loss": 1.5375283456802369,
+ "train_acc": 0.44544,
+ "test_loss": 7.119714102935791,
+ "test_acc": 0.1016,
+ "lyapunov": null,
+ "grad_norm": 1.8585907694205182,
+ "grad_max_sv": 1.7394830703735351,
+ "grad_min_sv": 7.501465217885084e-08,
+ "grad_condition": 23906344.012628905,
+ "lr": 0.0005313952597646569,
+ "time_sec": 66.54580640792847
+ },
+ {
+ "epoch": 49,
+ "train_loss": 1.5338307555770874,
+ "train_acc": 0.4442,
+ "test_loss": 5.397337831115722,
+ "test_acc": 0.1059,
+ "lyapunov": null,
+ "grad_norm": 1.7902731589528738,
+ "grad_max_sv": 1.6494132414460183,
+ "grad_min_sv": 6.831805556828386e-08,
+ "grad_condition": 24615282.56582328,
+ "lr": 0.0005157053795390643,
+ "time_sec": 66.53534126281738
+ },
+ {
+ "epoch": 50,
+ "train_loss": 1.5284276412963866,
+ "train_acc": 0.44778,
+ "test_loss": 5.524033654785156,
+ "test_acc": 0.1078,
+ "lyapunov": null,
+ "grad_norm": 1.7713612838130008,
+ "grad_max_sv": 1.5726667106151582,
+ "grad_min_sv": 6.907176626214096e-08,
+ "grad_condition": 22960902.516891498,
+ "lr": 0.0005000000000000002,
+ "time_sec": 66.5325882434845
+ },
+ {
+ "epoch": 51,
+ "train_loss": 1.5330605014801026,
+ "train_acc": 0.44666,
+ "test_loss": 6.847183532714844,
+ "test_acc": 0.1031,
+ "lyapunov": null,
+ "grad_norm": 1.7792073911302086,
+ "grad_max_sv": 1.6382696747779846,
+ "grad_min_sv": 6.6116589625409e-08,
+ "grad_condition": 24861349.651776347,
+ "lr": 0.00048429462046093607,
+ "time_sec": 66.53938388824463
+ },
+ {
+ "epoch": 52,
+ "train_loss": 1.515211699180603,
+ "train_acc": 0.45132,
+ "test_loss": 6.849605633544922,
+ "test_acc": 0.1046,
+ "lyapunov": null,
+ "grad_norm": 1.7110848232260776,
+ "grad_max_sv": 1.4070507645606996,
+ "grad_min_sv": 6.268320333902011e-08,
+ "grad_condition": 22502851.341604523,
+ "lr": 0.0004686047402353435,
+ "time_sec": 66.54575228691101
+ },
+ {
+ "epoch": 53,
+ "train_loss": 1.511851570777893,
+ "train_acc": 0.44984,
+ "test_loss": 6.742161424255371,
+ "test_acc": 0.1035,
+ "lyapunov": null,
+ "grad_norm": 1.6990701953393579,
+ "grad_max_sv": 1.5247679650783539,
+ "grad_min_sv": 6.360552236017725e-08,
+ "grad_condition": 24187524.31056104,
+ "lr": 0.000452945843340743,
+ "time_sec": 66.55630564689636
+ },
+ {
+ "epoch": 54,
+ "train_loss": 1.5134658539581298,
+ "train_acc": 0.45194,
+ "test_loss": 6.076722029113769,
+ "test_acc": 0.1055,
+ "lyapunov": null,
+ "grad_norm": 1.67595650149666,
+ "grad_max_sv": 1.521102523803711,
+ "grad_min_sv": 6.705203148271721e-08,
+ "grad_condition": 23102185.373464666,
+ "lr": 0.00043733338321784806,
+ "time_sec": 66.54796624183655
+ },
+ {
+ "epoch": 55,
+ "train_loss": 1.5127635479736328,
+ "train_acc": 0.45416,
+ "test_loss": 6.099140180969238,
+ "test_acc": 0.1054,
+ "lyapunov": null,
+ "grad_norm": 1.669713615396416,
+ "grad_max_sv": 1.4162977203726768,
+ "grad_min_sv": 5.9198181379116475e-08,
+ "grad_condition": 24265418.333155036,
+ "lr": 0.0004217827674798847,
+ "time_sec": 66.56652212142944
+ },
+ {
+ "epoch": 56,
+ "train_loss": 1.5037149493789672,
+ "train_acc": 0.45674,
+ "test_loss": 5.881203063964843,
+ "test_acc": 0.106,
+ "lyapunov": null,
+ "grad_norm": 1.6488336383475701,
+ "grad_max_sv": 1.5071144998073578,
+ "grad_min_sv": 6.376719170475554e-08,
+ "grad_condition": 23818554.434521496,
+ "lr": 0.00040630934270713783,
+ "time_sec": 66.53574323654175
+ },
+ {
+ "epoch": 57,
+ "train_loss": 1.504850189590454,
+ "train_acc": 0.459,
+ "test_loss": 5.68402534790039,
+ "test_acc": 0.1076,
+ "lyapunov": null,
+ "grad_norm": 1.6129911107480968,
+ "grad_max_sv": 1.4527282550930978,
+ "grad_min_sv": 6.286840470437483e-08,
+ "grad_condition": 23483060.334747117,
+ "lr": 0.000390928379301729,
+ "time_sec": 66.54559707641602
+ },
+ {
+ "epoch": 58,
+ "train_loss": 1.4977053466033936,
+ "train_acc": 0.45916,
+ "test_loss": 5.9823997062683105,
+ "test_acc": 0.1071,
+ "lyapunov": null,
+ "grad_norm": 1.6061924832487942,
+ "grad_max_sv": 1.3888853162527084,
+ "grad_min_sv": 6.253125484079192e-08,
+ "grad_condition": 22608679.418678027,
+ "lr": 0.0003756550564175727,
+ "time_sec": 66.55387783050537
+ },
+ {
+ "epoch": 59,
+ "train_loss": 1.4972542272949219,
+ "train_acc": 0.45872,
+ "test_loss": 5.0882811370849605,
+ "test_acc": 0.1151,
+ "lyapunov": null,
+ "grad_norm": 1.5591682163016796,
+ "grad_max_sv": 1.3346713334321976,
+ "grad_min_sv": 5.8280132453347735e-08,
+ "grad_condition": 23069467.539254077,
+ "lr": 0.00036050444698038553,
+ "time_sec": 66.54211473464966
+ },
+ {
+ "epoch": 60,
+ "train_loss": 1.4907029873657227,
+ "train_acc": 0.46126,
+ "test_loss": 7.020564842224121,
+ "test_acc": 0.1048,
+ "lyapunov": null,
+ "grad_norm": 1.5345406038505094,
+ "grad_max_sv": 1.4284722179174423,
+ "grad_min_sv": 6.001468877414595e-08,
+ "grad_condition": 24162295.485593982,
+ "lr": 0.00034549150281252655,
+ "time_sec": 66.55491805076599
+ },
+ {
+ "epoch": 61,
+ "train_loss": 1.4877613472366333,
+ "train_acc": 0.4653,
+ "test_loss": 4.854167632293701,
+ "test_acc": 0.1114,
+ "lyapunov": null,
+ "grad_norm": 1.5324361061772793,
+ "grad_max_sv": 1.325933101773262,
+ "grad_min_sv": 5.964644183009682e-08,
+ "grad_condition": 22280923.908054985,
+ "lr": 0.0003306310398773544,
+ "time_sec": 66.54050326347351
+ },
+ {
+ "epoch": 62,
+ "train_loss": 1.4875999914550782,
+ "train_acc": 0.4609,
+ "test_loss": 6.024991397094727,
+ "test_acc": 0.1045,
+ "lyapunov": null,
+ "grad_norm": 1.5157035873578593,
+ "grad_max_sv": 1.2820105284452439,
+ "grad_min_sv": 5.6854590901878056e-08,
+ "grad_condition": 22744392.831777684,
+ "lr": 0.00031593772365766127,
+ "time_sec": 66.56322026252747
+ },
+ {
+ "epoch": 63,
+ "train_loss": 1.4804442275238037,
+ "train_acc": 0.46586,
+ "test_loss": 6.877338618469238,
+ "test_acc": 0.1028,
+ "lyapunov": null,
+ "grad_norm": 1.5037529747226948,
+ "grad_max_sv": 1.3301736950874328,
+ "grad_min_sv": 6.064568385255597e-08,
+ "grad_condition": 22458783.805724658,
+ "lr": 0.0003014260546826097,
+ "time_sec": 66.55420660972595
+ },
+ {
+ "epoch": 64,
+ "train_loss": 1.4785625118637085,
+ "train_acc": 0.4676,
+ "test_loss": 5.8289501716613765,
+ "test_acc": 0.1058,
+ "lyapunov": null,
+ "grad_norm": 1.4955609555476688,
+ "grad_max_sv": 1.2231090664863586,
+ "grad_min_sv": 5.909942020210224e-08,
+ "grad_condition": 21200746.17398096,
+ "lr": 0.0002871103542174637,
+ "time_sec": 66.55184054374695
+ },
+ {
+ "epoch": 65,
+ "train_loss": 1.474054185218811,
+ "train_acc": 0.4692,
+ "test_loss": 6.821263113403321,
+ "test_acc": 0.1053,
+ "lyapunov": null,
+ "grad_norm": 1.4816881050330082,
+ "grad_max_sv": 1.304422627389431,
+ "grad_min_sv": 6.126439071607592e-08,
+ "grad_condition": 22262717.79019341,
+ "lr": 0.0002730047501302267,
+ "time_sec": 66.54631876945496
+ },
+ {
+ "epoch": 66,
+ "train_loss": 1.468451905593872,
+ "train_acc": 0.46872,
+ "test_loss": 6.21660086593628,
+ "test_acc": 0.1049,
+ "lyapunov": null,
+ "grad_norm": 1.4471343716270808,
+ "grad_max_sv": 1.2118137910962106,
+ "grad_min_sv": 5.677175121121536e-08,
+ "grad_condition": 21833909.31574912,
+ "lr": 0.00025912316294914234,
+ "time_sec": 66.54650139808655
+ },
+ {
+ "epoch": 67,
+ "train_loss": 1.473218607635498,
+ "train_acc": 0.46886,
+ "test_loss": 5.585741909790039,
+ "test_acc": 0.1093,
+ "lyapunov": null,
+ "grad_norm": 1.4454249735567377,
+ "grad_max_sv": 1.344612455368042,
+ "grad_min_sv": 5.805593232821593e-08,
+ "grad_condition": 23703781.24599778,
+ "lr": 0.0002454792921248144,
+ "time_sec": 66.54963803291321
+ },
+ {
+ "epoch": 68,
+ "train_loss": 1.464357560043335,
+ "train_acc": 0.47134,
+ "test_loss": 6.43534487915039,
+ "test_acc": 0.1036,
+ "lyapunov": null,
+ "grad_norm": 1.4158825945249984,
+ "grad_max_sv": 1.216756673157215,
+ "grad_min_sv": 5.594884520121468e-08,
+ "grad_condition": 22117575.184218023,
+ "lr": 0.00023208660251050164,
+ "time_sec": 66.53380155563354
+ },
+ {
+ "epoch": 69,
+ "train_loss": 1.4605754261016846,
+ "train_acc": 0.47354,
+ "test_loss": 6.361464812469483,
+ "test_acc": 0.1041,
+ "lyapunov": null,
+ "grad_norm": 1.4102858398212452,
+ "grad_max_sv": 1.2650031745433807,
+ "grad_min_sv": 5.616340708058942e-08,
+ "grad_condition": 22755240.415779583,
+ "lr": 0.00021895831107393473,
+ "time_sec": 66.55379509925842
+ },
+ {
+ "epoch": 70,
+ "train_loss": 1.4566728033065797,
+ "train_acc": 0.4732,
+ "test_loss": 7.030058961486817,
+ "test_acc": 0.1052,
+ "lyapunov": null,
+ "grad_norm": 1.4004542368068666,
+ "grad_max_sv": 1.1733321487903594,
+ "grad_min_sv": 5.324388059335661e-08,
+ "grad_condition": 22428640.626706712,
+ "lr": 0.00020610737385376356,
+ "time_sec": 66.53196001052856
+ },
+ {
+ "epoch": 71,
+ "train_loss": 1.4595127109909058,
+ "train_acc": 0.4747,
+ "test_loss": 6.251192915344238,
+ "test_acc": 0.1055,
+ "lyapunov": null,
+ "grad_norm": 1.4007518176750748,
+ "grad_max_sv": 1.2036359310150146,
+ "grad_min_sv": 5.3584219283919765e-08,
+ "grad_condition": 22661079.860923886,
+ "lr": 0.00019354647317351177,
+ "time_sec": 66.53831934928894
+ },
+ {
+ "epoch": 72,
+ "train_loss": 1.4561804718780518,
+ "train_acc": 0.47592,
+ "test_loss": 6.078685757446289,
+ "test_acc": 0.1053,
+ "lyapunov": null,
+ "grad_norm": 1.3882159701453969,
+ "grad_max_sv": 1.1710434511303902,
+ "grad_min_sv": 5.193670311598453e-08,
+ "grad_condition": 22617697.621583022,
+ "lr": 0.0001812880051256552,
+ "time_sec": 66.53273725509644
+ },
+ {
+ "epoch": 73,
+ "train_loss": 1.456334539833069,
+ "train_acc": 0.47646,
+ "test_loss": 6.318551240539551,
+ "test_acc": 0.1053,
+ "lyapunov": null,
+ "grad_norm": 1.3893052276682352,
+ "grad_max_sv": 1.262186436355114,
+ "grad_min_sv": 5.998066114898392e-08,
+ "grad_condition": 21695066.67305842,
+ "lr": 0.00016934406733817422,
+ "time_sec": 66.53349781036377
+ },
+ {
+ "epoch": 74,
+ "train_loss": 1.450936794128418,
+ "train_acc": 0.48046,
+ "test_loss": 5.979817550659179,
+ "test_acc": 0.105,
+ "lyapunov": null,
+ "grad_norm": 1.3659009379358413,
+ "grad_max_sv": 1.2089540883898735,
+ "grad_min_sv": 5.6734091380405974e-08,
+ "grad_condition": 21453559.245642237,
+ "lr": 0.0001577264470356557,
+ "time_sec": 66.5519745349884
+ },
+ {
+ "epoch": 75,
+ "train_loss": 1.4469789163970947,
+ "train_acc": 0.47906,
+ "test_loss": 6.295627461242676,
+ "test_acc": 0.1067,
+ "lyapunov": null,
+ "grad_norm": 1.3551347445295552,
+ "grad_max_sv": 1.1976817324757576,
+ "grad_min_sv": 5.458875831365617e-08,
+ "grad_condition": 22252931.086762276,
+ "lr": 0.00014644660940672634,
+ "time_sec": 66.55559992790222
+ },
+ {
+ "epoch": 76,
+ "train_loss": 1.4463843099212645,
+ "train_acc": 0.47934,
+ "test_loss": 6.197264282226563,
+ "test_acc": 0.1079,
+ "lyapunov": null,
+ "grad_norm": 1.3380208446863917,
+ "grad_max_sv": 1.2127704448997974,
+ "grad_min_sv": 5.3017609769057116e-08,
+ "grad_condition": 23070185.252038278,
+ "lr": 0.0001355156862892944,
+ "time_sec": 66.54188418388367
+ },
+ {
+ "epoch": 77,
+ "train_loss": 1.4422340731430054,
+ "train_acc": 0.47956,
+ "test_loss": 6.095625473022461,
+ "test_acc": 0.1068,
+ "lyapunov": null,
+ "grad_norm": 1.319834743092097,
+ "grad_max_sv": 1.0997839123010635,
+ "grad_min_sv": 5.253857917608684e-08,
+ "grad_condition": 21034235.602306478,
+ "lr": 0.00012494446518477025,
+ "time_sec": 66.54432153701782
+ },
+ {
+ "epoch": 78,
+ "train_loss": 1.4469564128875732,
+ "train_acc": 0.48036,
+ "test_loss": 5.388970955657959,
+ "test_acc": 0.11,
+ "lyapunov": null,
+ "grad_norm": 1.3475784983368762,
+ "grad_max_sv": 1.2046680554747582,
+ "grad_min_sv": 5.585839417676652e-08,
+ "grad_condition": 21905924.79288598,
+ "lr": 0.00011474337861210548,
+ "time_sec": 66.53302836418152
+ },
+ {
+ "epoch": 79,
+ "train_loss": 1.4366684397125244,
+ "train_acc": 0.4798,
+ "test_loss": 6.206115145874024,
+ "test_acc": 0.1069,
+ "lyapunov": null,
+ "grad_norm": 1.3130109628098805,
+ "grad_max_sv": 1.1744658067822455,
+ "grad_min_sv": 5.508810989596213e-08,
+ "grad_condition": 21715398.426144313,
+ "lr": 0.00010492249381215483,
+ "time_sec": 66.53135848045349
+ },
+ {
+ "epoch": 80,
+ "train_loss": 1.4392537023544312,
+ "train_acc": 0.48228,
+ "test_loss": 6.179986186218262,
+ "test_acc": 0.1064,
+ "lyapunov": null,
+ "grad_norm": 1.3256940413341314,
+ "grad_max_sv": 1.1846244156360626,
+ "grad_min_sv": 5.3839901603680576e-08,
+ "grad_condition": 22125564.09370377,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 66.5379912853241
+ },
+ {
+ "epoch": 81,
+ "train_loss": 1.4338660355377197,
+ "train_acc": 0.48616,
+ "test_loss": 6.177688023376465,
+ "test_acc": 0.1068,
+ "lyapunov": null,
+ "grad_norm": 1.331304941867422,
+ "grad_max_sv": 1.2059139341115952,
+ "grad_min_sv": 5.419374078385886e-08,
+ "grad_condition": 22342309.054380674,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 66.5526373386383
+ },
+ {
+ "epoch": 82,
+ "train_loss": 1.4322706761550903,
+ "train_acc": 0.48346,
+ "test_loss": 6.39905592956543,
+ "test_acc": 0.1049,
+ "lyapunov": null,
+ "grad_norm": 1.3160308800060254,
+ "grad_max_sv": 1.1150345966219901,
+ "grad_min_sv": 5.504024436220334e-08,
+ "grad_condition": 20495998.096470684,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 66.53385639190674
+ },
+ {
+ "epoch": 83,
+ "train_loss": 1.4299918703460692,
+ "train_acc": 0.48306,
+ "test_loss": 6.442905668640137,
+ "test_acc": 0.1051,
+ "lyapunov": null,
+ "grad_norm": 1.3113912638515688,
+ "grad_max_sv": 1.0838071212172509,
+ "grad_min_sv": 5.43203230840561e-08,
+ "grad_condition": 20241235.03989599,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 66.52077317237854
+ },
+ {
+ "epoch": 84,
+ "train_loss": 1.4280065909194946,
+ "train_acc": 0.4822,
+ "test_loss": 6.0934767837524415,
+ "test_acc": 0.1077,
+ "lyapunov": null,
+ "grad_norm": 1.3219999598887227,
+ "grad_max_sv": 1.1636987075209617,
+ "grad_min_sv": 5.4432569296380964e-08,
+ "grad_condition": 21698960.666762732,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 66.54324150085449
+ },
+ {
+ "epoch": 85,
+ "train_loss": 1.426846856918335,
+ "train_acc": 0.4865,
+ "test_loss": 5.9188161468505855,
+ "test_acc": 0.107,
+ "lyapunov": null,
+ "grad_norm": 1.2965845421535789,
+ "grad_max_sv": 1.1792906790971756,
+ "grad_min_sv": 5.5100021434384416e-08,
+ "grad_condition": 21690369.73733188,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 66.53187370300293
+ },
+ {
+ "epoch": 86,
+ "train_loss": 1.4228094031524658,
+ "train_acc": 0.48556,
+ "test_loss": 6.137683601379394,
+ "test_acc": 0.108,
+ "lyapunov": null,
+ "grad_norm": 1.292831856620217,
+ "grad_max_sv": 1.0124387323856354,
+ "grad_min_sv": 5.2233392278111523e-08,
+ "grad_condition": 19602805.79996558,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 66.53067183494568
+ },
+ {
+ "epoch": 87,
+ "train_loss": 1.429165520362854,
+ "train_acc": 0.48332,
+ "test_loss": 5.927753118133545,
+ "test_acc": 0.1088,
+ "lyapunov": null,
+ "grad_norm": 1.3101745862822605,
+ "grad_max_sv": 1.1612930461764335,
+ "grad_min_sv": 5.276717347513227e-08,
+ "grad_condition": 22472879.957919728,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 66.53908562660217
+ },
+ {
+ "epoch": 88,
+ "train_loss": 1.4288117279052734,
+ "train_acc": 0.48666,
+ "test_loss": 6.013241593933105,
+ "test_acc": 0.1075,
+ "lyapunov": null,
+ "grad_norm": 1.3007188330408852,
+ "grad_max_sv": 1.139727284014225,
+ "grad_min_sv": 5.308784185587001e-08,
+ "grad_condition": 21649216.459450316,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 66.52465963363647
+ },
+ {
+ "epoch": 89,
+ "train_loss": 1.4234879583358764,
+ "train_acc": 0.48672,
+ "test_loss": 5.440691387176513,
+ "test_acc": 0.1132,
+ "lyapunov": null,
+ "grad_norm": 1.286797693166196,
+ "grad_max_sv": 1.1378898680210114,
+ "grad_min_sv": 5.206395803369901e-08,
+ "grad_condition": 22299317.66856014,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 66.52217221260071
+ },
+ {
+ "epoch": 90,
+ "train_loss": 1.4255534106445313,
+ "train_acc": 0.4873,
+ "test_loss": 5.6889183303833,
+ "test_acc": 0.1089,
+ "lyapunov": null,
+ "grad_norm": 1.2907871997501676,
+ "grad_max_sv": 1.1832163825631141,
+ "grad_min_sv": 5.3787662057658284e-08,
+ "grad_condition": 22287194.786688134,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 66.53036832809448
+ },
+ {
+ "epoch": 91,
+ "train_loss": 1.4252548498916626,
+ "train_acc": 0.48792,
+ "test_loss": 6.261311422729492,
+ "test_acc": 0.1064,
+ "lyapunov": null,
+ "grad_norm": 1.3031797280361905,
+ "grad_max_sv": 1.1937354177236557,
+ "grad_min_sv": 5.396164546311866e-08,
+ "grad_condition": 22285756.773222417,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 66.53405451774597
+ },
+ {
+ "epoch": 92,
+ "train_loss": 1.4257716689300537,
+ "train_acc": 0.48484,
+ "test_loss": 5.9496440505981445,
+ "test_acc": 0.1083,
+ "lyapunov": null,
+ "grad_norm": 1.2963951565864091,
+ "grad_max_sv": 1.1119507551193237,
+ "grad_min_sv": 5.530857025703995e-08,
+ "grad_condition": 20517700.461063318,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 66.55413794517517
+ },
+ {
+ "epoch": 93,
+ "train_loss": 1.4217627249526978,
+ "train_acc": 0.48994,
+ "test_loss": 5.984926200866699,
+ "test_acc": 0.1075,
+ "lyapunov": null,
+ "grad_norm": 1.264014206865248,
+ "grad_max_sv": 1.0518594324588775,
+ "grad_min_sv": 4.926823864437324e-08,
+ "grad_condition": 21435816.94874554,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 66.52945113182068
+ },
+ {
+ "epoch": 94,
+ "train_loss": 1.4220651029205322,
+ "train_acc": 0.48712,
+ "test_loss": 5.9274788650512695,
+ "test_acc": 0.107,
+ "lyapunov": null,
+ "grad_norm": 1.2852744864782746,
+ "grad_max_sv": 1.194958347082138,
+ "grad_min_sv": 5.49836086882749e-08,
+ "grad_condition": 21876849.948771022,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 66.53060245513916
+ },
+ {
+ "epoch": 95,
+ "train_loss": 1.4127644922637939,
+ "train_acc": 0.4891,
+ "test_loss": 6.033211676025391,
+ "test_acc": 0.1068,
+ "lyapunov": null,
+ "grad_norm": 1.2852733904252112,
+ "grad_max_sv": 1.1103495568037034,
+ "grad_min_sv": 5.0794950290367066e-08,
+ "grad_condition": 21903481.59645809,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 66.54151201248169
+ },
+ {
+ "epoch": 96,
+ "train_loss": 1.42291917427063,
+ "train_acc": 0.48754,
+ "test_loss": 5.946468173217774,
+ "test_acc": 0.1078,
+ "lyapunov": null,
+ "grad_norm": 1.296502082808029,
+ "grad_max_sv": 1.1921778261661529,
+ "grad_min_sv": 5.59618015927299e-08,
+ "grad_condition": 21704630.944007598,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 66.53685402870178
+ },
+ {
+ "epoch": 97,
+ "train_loss": 1.4221784051132202,
+ "train_acc": 0.48922,
+ "test_loss": 5.77611974029541,
+ "test_acc": 0.1107,
+ "lyapunov": null,
+ "grad_norm": 1.283101201721102,
+ "grad_max_sv": 1.1582708179950714,
+ "grad_min_sv": 5.3498822172315384e-08,
+ "grad_condition": 21893400.606446274,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 66.51551508903503
+ },
+ {
+ "epoch": 98,
+ "train_loss": 1.4199727509307862,
+ "train_acc": 0.48888,
+ "test_loss": 5.947603340148926,
+ "test_acc": 0.1072,
+ "lyapunov": null,
+ "grad_norm": 1.2852084329880165,
+ "grad_max_sv": 1.12471182346344,
+ "grad_min_sv": 5.5720254987789984e-08,
+ "grad_condition": 20744598.237500653,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 66.54128313064575
+ },
+ {
+ "epoch": 99,
+ "train_loss": 1.4189085994720458,
+ "train_acc": 0.49036,
+ "test_loss": 6.019410075378418,
+ "test_acc": 0.1088,
+ "lyapunov": null,
+ "grad_norm": 1.2671570273045278,
+ "grad_max_sv": 1.044458197057247,
+ "grad_min_sv": 5.2453829901821794e-08,
+ "grad_condition": 20122144.845569003,
+ "lr": 2.467198171342e-07,
+ "time_sec": 66.5876886844635
+ },
+ {
+ "epoch": 100,
+ "train_loss": 1.4237549599456787,
+ "train_acc": 0.48696,
+ "test_loss": 6.123869666290283,
+ "test_acc": 0.1056,
+ "lyapunov": null,
+ "grad_norm": 1.2842958901976373,
+ "grad_max_sv": 1.0893320694565773,
+ "grad_min_sv": 5.240736280498481e-08,
+ "grad_condition": 20983923.24178537,
+ "lr": 0.0,
+ "time_sec": 66.52526140213013
+ }
+ ]
+ },
+ "lyapunov": {
+ "4": [
+ {
+ "epoch": 1,
+ "train_loss": 5.9559499659729,
+ "train_acc": 0.1816,
+ "test_loss": 2.127836145401001,
+ "test_acc": 0.2458,
+ "lyapunov": 3.1805403927707916,
+ "grad_norm": 7.669457973262479,
+ "grad_max_sv": 5.918661725521088,
+ "grad_min_sv": 2.931642846704108e-07,
+ "grad_condition": 20422744.62807854,
+ "lr": 0.0009997532801828658,
+ "time_sec": 38.74378061294556
+ },
+ {
+ "epoch": 2,
+ "train_loss": 4.402947195281983,
+ "train_acc": 0.19622,
+ "test_loss": 2.0710217851638792,
+ "test_acc": 0.2599,
+ "lyapunov": 2.5604425824206807,
+ "grad_norm": 5.322089969338386,
+ "grad_max_sv": 4.252373713254928,
+ "grad_min_sv": 1.9552239614029076e-07,
+ "grad_condition": 22174922.12126705,
+ "lr": 0.0009990133642141358,
+ "time_sec": 38.64048624038696
+ },
+ {
+ "epoch": 3,
+ "train_loss": 4.045168105316162,
+ "train_acc": 0.22284,
+ "test_loss": 2.047537351036072,
+ "test_acc": 0.275,
+ "lyapunov": 2.4094676093372236,
+ "grad_norm": 3.329135536451279,
+ "grad_max_sv": 2.700692330300808,
+ "grad_min_sv": 1.3114565362570828e-07,
+ "grad_condition": 21120674.055912692,
+ "lr": 0.00099778098230154,
+ "time_sec": 38.632225036621094
+ },
+ {
+ "epoch": 4,
+ "train_loss": 3.8760036846923827,
+ "train_acc": 0.23552,
+ "test_loss": 2.0494147090911867,
+ "test_acc": 0.2624,
+ "lyapunov": 2.323524356803016,
+ "grad_norm": 1.6169046791962502,
+ "grad_max_sv": 1.2880224913358689,
+ "grad_min_sv": 5.374016822656813e-08,
+ "grad_condition": 24107383.024291664,
+ "lr": 0.000996057350657239,
+ "time_sec": 38.643821477890015
+ },
+ {
+ "epoch": 5,
+ "train_loss": 3.7066750312805175,
+ "train_acc": 0.23364,
+ "test_loss": 2.073809361457825,
+ "test_acc": 0.2559,
+ "lyapunov": 2.2068090539454195,
+ "grad_norm": 0.6888041501699484,
+ "grad_max_sv": 0.4505885936319828,
+ "grad_min_sv": 2.5095627176341396e-08,
+ "grad_condition": 18224356.70160868,
+ "lr": 0.0009938441702975688,
+ "time_sec": 38.63996958732605
+ },
+ {
+ "epoch": 6,
+ "train_loss": 3.5870462338256837,
+ "train_acc": 0.22278,
+ "test_loss": 2.0948594261169435,
+ "test_acc": 0.2419,
+ "lyapunov": 2.1068829035819947,
+ "grad_norm": 0.4525297557038159,
+ "grad_max_sv": 0.2912705983966589,
+ "grad_min_sv": 1.4355599531334918e-08,
+ "grad_condition": 20443883.38963156,
+ "lr": 0.0009911436253643444,
+ "time_sec": 38.64875626564026
+ },
+ {
+ "epoch": 7,
+ "train_loss": 3.516497625274658,
+ "train_acc": 0.20518,
+ "test_loss": 2.122341016769409,
+ "test_acc": 0.2149,
+ "lyapunov": 2.031583094535886,
+ "grad_norm": 0.4192338818357315,
+ "grad_max_sv": 0.2666142761707306,
+ "grad_min_sv": 1.244383397436266e-08,
+ "grad_condition": 21524577.239365414,
+ "lr": 0.0009879583809693736,
+ "time_sec": 38.65327429771423
+ },
+ {
+ "epoch": 8,
+ "train_loss": 3.500787953567505,
+ "train_acc": 0.15934,
+ "test_loss": 2.30495919342041,
+ "test_acc": 0.1,
+ "lyapunov": 1.9705595735393826,
+ "grad_norm": 0.364806685633591,
+ "grad_max_sv": 0.19433156847953797,
+ "grad_min_sv": 7.78323775238877e-09,
+ "grad_condition": 1400511997.1550007,
+ "lr": 0.0009842915805643154,
+ "time_sec": 38.633607625961304
+ },
+ {
+ "epoch": 9,
+ "train_loss": 3.5612770445251463,
+ "train_acc": 0.0995,
+ "test_loss": 2.309052435684204,
+ "test_acc": 0.1,
+ "lyapunov": 1.9462372851188836,
+ "grad_norm": 0.1961322565486487,
+ "grad_max_sv": 0.08832639907486736,
+ "grad_min_sv": 7.733921171735724e-10,
+ "grad_condition": 10141008570.944132,
+ "lr": 0.0009801468428384714,
+ "time_sec": 38.646180152893066
+ },
+ {
+ "epoch": 10,
+ "train_loss": 3.538458889770508,
+ "train_acc": 0.09824,
+ "test_loss": 2.3040579429626464,
+ "test_acc": 0.1,
+ "lyapunov": 1.9283022353106447,
+ "grad_norm": 0.21318046705690488,
+ "grad_max_sv": 0.0782687779981643,
+ "grad_min_sv": 8.435315090236436e-10,
+ "grad_condition": 12098584585.465805,
+ "lr": 0.0009755282581475767,
+ "time_sec": 38.63904404640198
+ },
+ {
+ "epoch": 11,
+ "train_loss": 3.529650466461182,
+ "train_acc": 0.10062,
+ "test_loss": 2.302797904205322,
+ "test_acc": 0.1,
+ "lyapunov": 1.9214661554302401,
+ "grad_norm": 0.14436104663435,
+ "grad_max_sv": 0.07406298876740039,
+ "grad_min_sv": 1.8938792208460978e-10,
+ "grad_condition": 16582547419.599035,
+ "lr": 0.0009704403844771127,
+ "time_sec": 38.65141201019287
+ },
+ {
+ "epoch": 12,
+ "train_loss": 3.527643050994873,
+ "train_acc": 0.09804,
+ "test_loss": 2.3026904548645017,
+ "test_acc": 0.1,
+ "lyapunov": 1.9200294935489859,
+ "grad_norm": 0.13153432020985192,
+ "grad_max_sv": 0.05873946417123079,
+ "grad_min_sv": 2.2213949011783955e-10,
+ "grad_condition": 29679782911.168915,
+ "lr": 0.0009648882429441257,
+ "time_sec": 38.637062311172485
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.525748397216797,
+ "train_acc": 0.09986,
+ "test_loss": 2.3026839447021485,
+ "test_acc": 0.1,
+ "lyapunov": 1.9183377143367173,
+ "grad_norm": 0.1253530383790545,
+ "grad_max_sv": 0.054947068355977534,
+ "grad_min_sv": 2.484597018350735e-10,
+ "grad_condition": 32728296691.529114,
+ "lr": 0.0009588773128419905,
+ "time_sec": 38.639862060546875
+ },
+ {
+ "epoch": 14,
+ "train_loss": 3.5267535670471193,
+ "train_acc": 0.09928,
+ "test_loss": 2.303218070602417,
+ "test_acc": 0.1,
+ "lyapunov": 1.9196420743337372,
+ "grad_norm": 0.1092532269273596,
+ "grad_max_sv": 0.04395028324797749,
+ "grad_min_sv": 9.613613581557888e-11,
+ "grad_condition": 21168413985.92494,
+ "lr": 0.0009524135262330098,
+ "time_sec": 38.639400243759155
+ },
+ {
+ "epoch": 15,
+ "train_loss": 3.5285498448181154,
+ "train_acc": 0.0982,
+ "test_loss": 2.3035209484100343,
+ "test_acc": 0.1,
+ "lyapunov": 1.920996154055876,
+ "grad_norm": 0.10604045531455125,
+ "grad_max_sv": 0.030423881998285652,
+ "grad_min_sv": 8.947113291620313e-11,
+ "grad_condition": 14692894250.958597,
+ "lr": 0.0009455032620941839,
+ "time_sec": 38.645652770996094
+ },
+ {
+ "epoch": 16,
+ "train_loss": 3.5281584407806394,
+ "train_acc": 0.09964,
+ "test_loss": 2.3028687210083008,
+ "test_acc": 0.1,
+ "lyapunov": 1.9207957717768676,
+ "grad_norm": 0.09543807455983376,
+ "grad_max_sv": 0.006560872681438923,
+ "grad_min_sv": 4.056405124991419e-12,
+ "grad_condition": 3706750979.9989243,
+ "lr": 0.0009381533400219318,
+ "time_sec": 38.63558006286621
+ },
+ {
+ "epoch": 17,
+ "train_loss": 3.5265050379943848,
+ "train_acc": 0.09798,
+ "test_loss": 2.302896424102783,
+ "test_acc": 0.1,
+ "lyapunov": 1.9195188765635576,
+ "grad_norm": 0.09404328433417611,
+ "grad_max_sv": 0.005626836745068431,
+ "grad_min_sv": 8.896868440940896e-13,
+ "grad_condition": 3600570896.7918577,
+ "lr": 0.0009303710135019719,
+ "time_sec": 38.63581418991089
+ },
+ {
+ "epoch": 18,
+ "train_loss": 3.5274914381408693,
+ "train_acc": 0.09708,
+ "test_loss": 2.3026503776550293,
+ "test_acc": 0.1,
+ "lyapunov": 1.9202668194270804,
+ "grad_norm": 0.09620880376142034,
+ "grad_max_sv": 0.003721812926232815,
+ "grad_min_sv": 3.080583531323011e-13,
+ "grad_condition": 2605476049.955305,
+ "lr": 0.0009221639627510076,
+ "time_sec": 38.637654304504395
+ },
+ {
+ "epoch": 19,
+ "train_loss": 3.5240187657165527,
+ "train_acc": 0.09788,
+ "test_loss": 2.3026472286224364,
+ "test_acc": 0.1,
+ "lyapunov": 1.917564369833378,
+ "grad_norm": 0.08696272623748423,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000913540287137281,
+ "time_sec": 38.64585041999817
+ },
+ {
+ "epoch": 20,
+ "train_loss": 3.526093559265137,
+ "train_acc": 0.09698,
+ "test_loss": 2.302675205993652,
+ "test_acc": 0.1,
+ "lyapunov": 1.9192343212454521,
+ "grad_norm": 0.08759130668154863,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009045084971874739,
+ "time_sec": 38.63778305053711
+ },
+ {
+ "epoch": 21,
+ "train_loss": 3.5268382842254637,
+ "train_acc": 0.0963,
+ "test_loss": 2.302619518661499,
+ "test_acc": 0.1,
+ "lyapunov": 1.9198827185594212,
+ "grad_norm": 0.09131899089817433,
+ "grad_max_sv": 0.0007137967739254236,
+ "grad_min_sv": 1.2143662959650498e-34,
+ "grad_condition": 713796773.9254236,
+ "lr": 0.0008950775061878452,
+ "time_sec": 38.63694953918457
+ },
+ {
+ "epoch": 22,
+ "train_loss": 3.5266487127685546,
+ "train_acc": 0.09736,
+ "test_loss": 2.302595558166504,
+ "test_acc": 0.1,
+ "lyapunov": 1.919754564914557,
+ "grad_norm": 0.08451797479839518,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008852566213878947,
+ "time_sec": 38.62629771232605
+ },
+ {
+ "epoch": 23,
+ "train_loss": 3.526773832244873,
+ "train_acc": 0.09764,
+ "test_loss": 2.3026504470825193,
+ "test_acc": 0.1,
+ "lyapunov": 1.919811970132696,
+ "grad_norm": 0.0880141883169143,
+ "grad_max_sv": 0.003215626534074545,
+ "grad_min_sv": 6.757893669575438e-13,
+ "grad_condition": 421691349.6171393,
+ "lr": 0.0008750555348152298,
+ "time_sec": 38.627503395080566
+ },
+ {
+ "epoch": 24,
+ "train_loss": 3.5253559977722166,
+ "train_acc": 0.09686,
+ "test_loss": 2.302592763519287,
+ "test_acc": 0.1,
+ "lyapunov": 1.9186803285423142,
+ "grad_norm": 0.08625519727104183,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008644843137107057,
+ "time_sec": 38.62110924720764
+ },
+ {
+ "epoch": 25,
+ "train_loss": 3.5271505029296875,
+ "train_acc": 0.09882,
+ "test_loss": 2.3026457008361816,
+ "test_acc": 0.1,
+ "lyapunov": 1.9201455759575299,
+ "grad_norm": 0.08664315655618471,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008535533905932737,
+ "time_sec": 38.663304567337036
+ },
+ {
+ "epoch": 26,
+ "train_loss": 3.52567841835022,
+ "train_acc": 0.09848,
+ "test_loss": 2.302622730255127,
+ "test_acc": 0.1,
+ "lyapunov": 1.918919243775975,
+ "grad_norm": 0.08931714213407926,
+ "grad_max_sv": 0.0026560820173472167,
+ "grad_min_sv": 7.80326428931121e-27,
+ "grad_condition": 2656082017.346831,
+ "lr": 0.0008422735529643444,
+ "time_sec": 38.642497539520264
+ },
+ {
+ "epoch": 27,
+ "train_loss": 3.5247526208496094,
+ "train_acc": 0.09662,
+ "test_loss": 2.3026296226501466,
+ "test_acc": 0.1,
+ "lyapunov": 1.9182322189935943,
+ "grad_norm": 0.08339910325165188,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008306559326618259,
+ "time_sec": 38.63079476356506
+ },
+ {
+ "epoch": 28,
+ "train_loss": 3.5269400009155274,
+ "train_acc": 0.09728,
+ "test_loss": 2.3025920150756836,
+ "test_acc": 0.1,
+ "lyapunov": 1.9199587207316133,
+ "grad_norm": 0.08394537087665149,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008187119948743449,
+ "time_sec": 38.61244583129883
+ },
+ {
+ "epoch": 29,
+ "train_loss": 3.5242063328552247,
+ "train_acc": 0.09546,
+ "test_loss": 2.3025877166748048,
+ "test_acc": 0.1,
+ "lyapunov": 1.9176992738948149,
+ "grad_norm": 0.08393484553605075,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008064535268264883,
+ "time_sec": 38.62086057662964
+ },
+ {
+ "epoch": 30,
+ "train_loss": 3.524652021865845,
+ "train_acc": 0.09846,
+ "test_loss": 2.3025890396118163,
+ "test_acc": 0.1,
+ "lyapunov": 1.9180299269268886,
+ "grad_norm": 0.08604739858068552,
+ "grad_max_sv": 0.0037235306110233067,
+ "grad_min_sv": 2.2816656604449788e-14,
+ "grad_condition": 2522915018.0120707,
+ "lr": 0.0007938926261462367,
+ "time_sec": 38.63639521598816
+ },
+ {
+ "epoch": 31,
+ "train_loss": 3.5269307495117186,
+ "train_acc": 0.09852,
+ "test_loss": 2.302594734954834,
+ "test_acc": 0.1,
+ "lyapunov": 1.9199556487295635,
+ "grad_norm": 0.08308332919661195,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007810416889260654,
+ "time_sec": 38.632620334625244
+ },
+ {
+ "epoch": 32,
+ "train_loss": 3.526603982696533,
+ "train_acc": 0.0987,
+ "test_loss": 2.3026425048828125,
+ "test_acc": 0.1,
+ "lyapunov": 1.9197655053394835,
+ "grad_norm": 0.08373608851321027,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007679133974894983,
+ "time_sec": 38.6338005065918
+ },
+ {
+ "epoch": 33,
+ "train_loss": 3.5402134245300294,
+ "train_acc": 0.09648,
+ "test_loss": 2.3025889293670656,
+ "test_acc": 0.1,
+ "lyapunov": 1.926927990010937,
+ "grad_norm": 0.09981834537565924,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007545207078751857,
+ "time_sec": 38.6455602645874
+ },
+ {
+ "epoch": 34,
+ "train_loss": 3.5265413635253906,
+ "train_acc": 0.09788,
+ "test_loss": 2.302589825439453,
+ "test_acc": 0.1,
+ "lyapunov": 1.9196307095115448,
+ "grad_norm": 0.08459800727870437,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007408768370508577,
+ "time_sec": 38.652732133865356
+ },
+ {
+ "epoch": 35,
+ "train_loss": 3.526457656402588,
+ "train_acc": 0.09848,
+ "test_loss": 2.3025897277832033,
+ "test_acc": 0.1,
+ "lyapunov": 1.91963635930015,
+ "grad_norm": 0.08392830107993868,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007269952498697734,
+ "time_sec": 38.618977308273315
+ },
+ {
+ "epoch": 36,
+ "train_loss": 3.5264506495666503,
+ "train_acc": 0.09836,
+ "test_loss": 2.302591544342041,
+ "test_acc": 0.1,
+ "lyapunov": 1.919547389840226,
+ "grad_norm": 0.0844841992615646,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007128896457825364,
+ "time_sec": 38.635788917541504
+ },
+ {
+ "epoch": 37,
+ "train_loss": 3.525513755493164,
+ "train_acc": 0.09824,
+ "test_loss": 2.302587795257568,
+ "test_acc": 0.1,
+ "lyapunov": 1.9188998626626057,
+ "grad_norm": 0.08511865281250128,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006985739453173903,
+ "time_sec": 38.63599181175232
+ },
+ {
+ "epoch": 38,
+ "train_loss": 3.5258794207763673,
+ "train_acc": 0.09634,
+ "test_loss": 2.302587114715576,
+ "test_acc": 0.1,
+ "lyapunov": 1.9190363072983139,
+ "grad_norm": 0.08976844520779069,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006840622763423391,
+ "time_sec": 38.631999015808105
+ },
+ {
+ "epoch": 39,
+ "train_loss": 3.526812607116699,
+ "train_acc": 0.09782,
+ "test_loss": 2.3025868911743164,
+ "test_acc": 0.1,
+ "lyapunov": 1.9198928242144377,
+ "grad_norm": 0.08338895706252505,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006693689601226458,
+ "time_sec": 38.62815856933594
+ },
+ {
+ "epoch": 40,
+ "train_loss": 3.5299447924041747,
+ "train_acc": 0.09834,
+ "test_loss": 2.302587143325806,
+ "test_acc": 0.1,
+ "lyapunov": 1.9223552085554507,
+ "grad_norm": 0.09522270183573409,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006545084971874737,
+ "time_sec": 38.62764048576355
+ },
+ {
+ "epoch": 41,
+ "train_loss": 3.529573831253052,
+ "train_acc": 0.0978,
+ "test_loss": 2.3025870990753172,
+ "test_acc": 0.1,
+ "lyapunov": 1.922197810829143,
+ "grad_norm": 0.08338290015497958,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006394955530196147,
+ "time_sec": 38.63026428222656
+ },
+ {
+ "epoch": 42,
+ "train_loss": 3.5254642880249025,
+ "train_acc": 0.09878,
+ "test_loss": 2.302588144683838,
+ "test_acc": 0.1,
+ "lyapunov": 1.9188408784549256,
+ "grad_norm": 0.08333708848875665,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006243449435824273,
+ "time_sec": 38.63510298728943
+ },
+ {
+ "epoch": 43,
+ "train_loss": 3.527522850036621,
+ "train_acc": 0.09724,
+ "test_loss": 2.302586852264404,
+ "test_acc": 0.1,
+ "lyapunov": 1.920439124717127,
+ "grad_norm": 0.08392990999765709,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006090716206982714,
+ "time_sec": 38.61439347267151
+ },
+ {
+ "epoch": 44,
+ "train_loss": 3.5268155879211425,
+ "train_acc": 0.09854,
+ "test_loss": 2.302588026046753,
+ "test_acc": 0.1,
+ "lyapunov": 1.919859874583876,
+ "grad_norm": 0.08808142140863674,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005936906572928625,
+ "time_sec": 38.63164472579956
+ },
+ {
+ "epoch": 45,
+ "train_loss": 3.528644903793335,
+ "train_acc": 0.09726,
+ "test_loss": 2.302586632156372,
+ "test_acc": 0.1,
+ "lyapunov": 1.9213885017063306,
+ "grad_norm": 0.08163685266757659,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005782172325201156,
+ "time_sec": 38.63089060783386
+ },
+ {
+ "epoch": 46,
+ "train_loss": 3.5269173733520507,
+ "train_acc": 0.09548,
+ "test_loss": 2.302586455535889,
+ "test_acc": 0.1,
+ "lyapunov": 1.9199798500446408,
+ "grad_norm": 0.08000528496736534,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005626666167821523,
+ "time_sec": 38.636719703674316
+ },
+ {
+ "epoch": 47,
+ "train_loss": 3.525616721343994,
+ "train_acc": 0.0969,
+ "test_loss": 2.3025855419158936,
+ "test_acc": 0.1,
+ "lyapunov": 1.918914921753242,
+ "grad_norm": 0.0847797082901155,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005470541566592572,
+ "time_sec": 38.63527321815491
+ },
+ {
+ "epoch": 48,
+ "train_loss": 3.527122305908203,
+ "train_acc": 0.09908,
+ "test_loss": 2.302587979507446,
+ "test_acc": 0.1,
+ "lyapunov": 1.9201535523090216,
+ "grad_norm": 0.08334551671941194,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005313952597646569,
+ "time_sec": 38.6254460811615
+ },
+ {
+ "epoch": 49,
+ "train_loss": 3.529289007568359,
+ "train_acc": 0.09836,
+ "test_loss": 2.3025873039245606,
+ "test_acc": 0.1,
+ "lyapunov": 1.9219778029205243,
+ "grad_norm": 0.08239563380139257,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005157053795390643,
+ "time_sec": 38.63705110549927
+ },
+ {
+ "epoch": 50,
+ "train_loss": 3.5303411560821534,
+ "train_acc": 0.0977,
+ "test_loss": 2.3025870582580565,
+ "test_acc": 0.1,
+ "lyapunov": 1.9227478766380368,
+ "grad_norm": 0.08162963599167514,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005000000000000002,
+ "time_sec": 38.626914262771606
+ },
+ {
+ "epoch": 51,
+ "train_loss": 3.5286489057922363,
+ "train_acc": 0.09604,
+ "test_loss": 2.302586822128296,
+ "test_acc": 0.1,
+ "lyapunov": 1.9214349052180415,
+ "grad_norm": 0.08139452605749796,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00048429462046093607,
+ "time_sec": 38.64423418045044
+ },
+ {
+ "epoch": 52,
+ "train_loss": 3.525787140045166,
+ "train_acc": 0.09778,
+ "test_loss": 2.3025859855651856,
+ "test_acc": 0.1,
+ "lyapunov": 1.9190660763884444,
+ "grad_norm": 0.08146521230474718,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004686047402353435,
+ "time_sec": 38.6294162273407
+ },
+ {
+ "epoch": 53,
+ "train_loss": 3.5288507063293455,
+ "train_acc": 0.09546,
+ "test_loss": 2.3025855419158936,
+ "test_acc": 0.1,
+ "lyapunov": 1.9215699824530754,
+ "grad_norm": 0.08218605919682316,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000452945843340743,
+ "time_sec": 38.62653970718384
+ },
+ {
+ "epoch": 54,
+ "train_loss": 3.5271841695404054,
+ "train_acc": 0.09872,
+ "test_loss": 2.3025858070373535,
+ "test_acc": 0.1,
+ "lyapunov": 1.9201822860161666,
+ "grad_norm": 0.08216715344839949,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00043733338321784806,
+ "time_sec": 38.638410806655884
+ },
+ {
+ "epoch": 55,
+ "train_loss": 3.526853522644043,
+ "train_acc": 0.09744,
+ "test_loss": 2.3025860900878907,
+ "test_acc": 0.1,
+ "lyapunov": 1.919959136897036,
+ "grad_norm": 0.0817176354250303,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004217827674798847,
+ "time_sec": 38.630091190338135
+ },
+ {
+ "epoch": 56,
+ "train_loss": 3.5288575717926025,
+ "train_acc": 0.09954,
+ "test_loss": 2.302586184310913,
+ "test_acc": 0.1,
+ "lyapunov": 1.921623296444983,
+ "grad_norm": 0.08257148205256129,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00040630934270713783,
+ "time_sec": 38.64346218109131
+ },
+ {
+ "epoch": 57,
+ "train_loss": 3.5272767601776125,
+ "train_acc": 0.09642,
+ "test_loss": 2.302586555480957,
+ "test_acc": 0.1,
+ "lyapunov": 1.9202661358791848,
+ "grad_norm": 0.08293348649238423,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000390928379301729,
+ "time_sec": 38.64233660697937
+ },
+ {
+ "epoch": 58,
+ "train_loss": 3.526464948577881,
+ "train_acc": 0.09672,
+ "test_loss": 2.3025856628417967,
+ "test_acc": 0.1,
+ "lyapunov": 1.9196561523105786,
+ "grad_norm": 0.08164186959675705,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003756550564175727,
+ "time_sec": 38.63249588012695
+ },
+ {
+ "epoch": 59,
+ "train_loss": 3.5295531370544433,
+ "train_acc": 0.09774,
+ "test_loss": 2.302585400390625,
+ "test_acc": 0.1,
+ "lyapunov": 1.9221740268990206,
+ "grad_norm": 0.08246273738852085,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036050444698038553,
+ "time_sec": 38.646018266677856
+ },
+ {
+ "epoch": 60,
+ "train_loss": 3.5271629650115965,
+ "train_acc": 0.0971,
+ "test_loss": 2.3025858444213867,
+ "test_acc": 0.1,
+ "lyapunov": 1.9201987954356787,
+ "grad_norm": 0.08208001883222767,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00034549150281252655,
+ "time_sec": 38.6309814453125
+ },
+ {
+ "epoch": 61,
+ "train_loss": 3.5265548262023927,
+ "train_acc": 0.0977,
+ "test_loss": 2.302585780715942,
+ "test_acc": 0.1,
+ "lyapunov": 1.9197500297785415,
+ "grad_norm": 0.08189736323511718,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003306310398773544,
+ "time_sec": 38.638221740722656
+ },
+ {
+ "epoch": 62,
+ "train_loss": 3.52600441986084,
+ "train_acc": 0.09678,
+ "test_loss": 2.302585761642456,
+ "test_acc": 0.1,
+ "lyapunov": 1.9192463177854142,
+ "grad_norm": 0.08137598978711448,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00031593772365766127,
+ "time_sec": 38.63043713569641
+ },
+ {
+ "epoch": 63,
+ "train_loss": 3.5271013943481444,
+ "train_acc": 0.09814,
+ "test_loss": 2.302585670852661,
+ "test_acc": 0.1,
+ "lyapunov": 1.920157666096602,
+ "grad_norm": 0.0823619758981674,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003014260546826097,
+ "time_sec": 38.63147497177124
+ },
+ {
+ "epoch": 64,
+ "train_loss": 3.526780191192627,
+ "train_acc": 0.09852,
+ "test_loss": 2.302585818862915,
+ "test_acc": 0.1,
+ "lyapunov": 1.919904801546765,
+ "grad_norm": 0.08022492391600272,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002871103542174637,
+ "time_sec": 38.62516927719116
+ },
+ {
+ "epoch": 65,
+ "train_loss": 3.5343781797790528,
+ "train_acc": 0.09912,
+ "test_loss": 2.3025853904724123,
+ "test_acc": 0.1,
+ "lyapunov": 1.9257748550771143,
+ "grad_norm": 0.10073329729823817,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002730047501302267,
+ "time_sec": 38.634148836135864
+ },
+ {
+ "epoch": 66,
+ "train_loss": 3.5349793888092043,
+ "train_acc": 0.09842,
+ "test_loss": 2.3025853446960447,
+ "test_acc": 0.1,
+ "lyapunov": 1.9264679845336758,
+ "grad_norm": 0.11920770311136344,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00025912316294914234,
+ "time_sec": 38.61845135688782
+ },
+ {
+ "epoch": 67,
+ "train_loss": 3.526273007965088,
+ "train_acc": 0.09544,
+ "test_loss": 2.3025852378845215,
+ "test_acc": 0.1,
+ "lyapunov": 1.9194827823687697,
+ "grad_norm": 0.08304121043671493,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002454792921248144,
+ "time_sec": 38.626497983932495
+ },
+ {
+ "epoch": 68,
+ "train_loss": 3.5271414315795897,
+ "train_acc": 0.0966,
+ "test_loss": 2.3025850952148437,
+ "test_acc": 0.1,
+ "lyapunov": 1.9202514917344389,
+ "grad_norm": 0.08574615477087318,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00023208660251050164,
+ "time_sec": 38.627126693725586
+ },
+ {
+ "epoch": 69,
+ "train_loss": 3.529951874008179,
+ "train_acc": 0.0986,
+ "test_loss": 2.30258518447876,
+ "test_acc": 0.1,
+ "lyapunov": 1.9225430412365652,
+ "grad_norm": 0.08082947961897828,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00021895831107393473,
+ "time_sec": 38.630186319351196
+ },
+ {
+ "epoch": 70,
+ "train_loss": 3.526535584869385,
+ "train_acc": 0.09668,
+ "test_loss": 2.3025852592468263,
+ "test_acc": 0.1,
+ "lyapunov": 1.919725867183617,
+ "grad_norm": 0.08274796493939703,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376356,
+ "time_sec": 38.6431679725647
+ },
+ {
+ "epoch": 71,
+ "train_loss": 3.5277945655822753,
+ "train_acc": 0.09836,
+ "test_loss": 2.3025853775024414,
+ "test_acc": 0.1,
+ "lyapunov": 1.920768865843868,
+ "grad_norm": 0.08235441909099428,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019354647317351177,
+ "time_sec": 38.63748812675476
+ },
+ {
+ "epoch": 72,
+ "train_loss": 3.5274662791442872,
+ "train_acc": 0.0948,
+ "test_loss": 2.3025851234436034,
+ "test_acc": 0.1,
+ "lyapunov": 1.9204377185963,
+ "grad_norm": 0.08364637794680509,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001812880051256552,
+ "time_sec": 38.6381402015686
+ },
+ {
+ "epoch": 73,
+ "train_loss": 3.526118115386963,
+ "train_acc": 0.09886,
+ "test_loss": 2.302585259628296,
+ "test_acc": 0.1,
+ "lyapunov": 1.9193554836160995,
+ "grad_norm": 0.0826562338509352,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016934406733817422,
+ "time_sec": 38.65567326545715
+ },
+ {
+ "epoch": 74,
+ "train_loss": 3.527300643615723,
+ "train_acc": 0.09764,
+ "test_loss": 2.302585151672363,
+ "test_acc": 0.1,
+ "lyapunov": 1.9203089323190168,
+ "grad_norm": 0.08128595818241462,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001577264470356557,
+ "time_sec": 38.65558409690857
+ },
+ {
+ "epoch": 75,
+ "train_loss": 3.52685251663208,
+ "train_acc": 0.09664,
+ "test_loss": 2.3025852661132813,
+ "test_acc": 0.1,
+ "lyapunov": 1.9200191327068201,
+ "grad_norm": 0.08404244166329763,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014644660940672634,
+ "time_sec": 38.63766312599182
+ },
+ {
+ "epoch": 76,
+ "train_loss": 3.5262623787689207,
+ "train_acc": 0.09722,
+ "test_loss": 2.3025850158691408,
+ "test_acc": 0.1,
+ "lyapunov": 1.919482776271108,
+ "grad_norm": 0.08232879952859255,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001355156862892944,
+ "time_sec": 38.633180379867554
+ },
+ {
+ "epoch": 77,
+ "train_loss": 3.528319863128662,
+ "train_acc": 0.09596,
+ "test_loss": 2.3025850936889647,
+ "test_acc": 0.1,
+ "lyapunov": 1.9211895322555776,
+ "grad_norm": 0.08358594679641423,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012494446518477025,
+ "time_sec": 38.6444034576416
+ },
+ {
+ "epoch": 78,
+ "train_loss": 3.526455977935791,
+ "train_acc": 0.09646,
+ "test_loss": 2.3025851753234865,
+ "test_acc": 0.1,
+ "lyapunov": 1.919646045740913,
+ "grad_norm": 0.0800944099425941,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210548,
+ "time_sec": 38.63438820838928
+ },
+ {
+ "epoch": 79,
+ "train_loss": 3.528594108276367,
+ "train_acc": 0.09844,
+ "test_loss": 2.302585315704346,
+ "test_acc": 0.1,
+ "lyapunov": 1.9213674385529345,
+ "grad_norm": 0.0823521435571041,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010492249381215483,
+ "time_sec": 38.63344979286194
+ },
+ {
+ "epoch": 80,
+ "train_loss": 3.5273741276550292,
+ "train_acc": 0.09784,
+ "test_loss": 2.3025850051879884,
+ "test_acc": 0.1,
+ "lyapunov": 1.9203915013681592,
+ "grad_norm": 0.0830759912493753,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 38.62626814842224
+ },
+ {
+ "epoch": 81,
+ "train_loss": 3.5291355400848388,
+ "train_acc": 0.09736,
+ "test_loss": 2.3025851634979246,
+ "test_acc": 0.1,
+ "lyapunov": 1.921823484818344,
+ "grad_norm": 0.08275874029214267,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 38.62844204902649
+ },
+ {
+ "epoch": 82,
+ "train_loss": 3.525912507019043,
+ "train_acc": 0.09748,
+ "test_loss": 2.3025852321624756,
+ "test_acc": 0.1,
+ "lyapunov": 1.91920463874212,
+ "grad_norm": 0.08153852660653182,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 38.653265714645386
+ },
+ {
+ "epoch": 83,
+ "train_loss": 3.5292207734680177,
+ "train_acc": 0.0958,
+ "test_loss": 2.3025851135253905,
+ "test_acc": 0.1,
+ "lyapunov": 1.9219502158786939,
+ "grad_norm": 0.08350888633092267,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 38.634111642837524
+ },
+ {
+ "epoch": 84,
+ "train_loss": 3.5284012381744385,
+ "train_acc": 0.09624,
+ "test_loss": 2.30258512878418,
+ "test_acc": 0.1,
+ "lyapunov": 1.9212511674217556,
+ "grad_norm": 0.08116909186786311,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 38.64353036880493
+ },
+ {
+ "epoch": 85,
+ "train_loss": 3.5251765769195558,
+ "train_acc": 0.09792,
+ "test_loss": 2.30258514251709,
+ "test_acc": 0.1,
+ "lyapunov": 1.918617296401802,
+ "grad_norm": 0.07954191314548852,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 38.62560677528381
+ },
+ {
+ "epoch": 86,
+ "train_loss": 3.5287663554382322,
+ "train_acc": 0.09838,
+ "test_loss": 2.302585173034668,
+ "test_acc": 0.1,
+ "lyapunov": 1.9215295982482794,
+ "grad_norm": 0.08355699198177892,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 38.65434241294861
+ },
+ {
+ "epoch": 87,
+ "train_loss": 3.5260034490966796,
+ "train_acc": 0.09604,
+ "test_loss": 2.3025851554870607,
+ "test_acc": 0.1,
+ "lyapunov": 1.9192945807791122,
+ "grad_norm": 0.08149215014053633,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 38.63465094566345
+ },
+ {
+ "epoch": 88,
+ "train_loss": 3.5243265664672854,
+ "train_acc": 0.09828,
+ "test_loss": 2.302585033416748,
+ "test_acc": 0.1,
+ "lyapunov": 1.9179029281791824,
+ "grad_norm": 0.08154521467921626,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 38.6289963722229
+ },
+ {
+ "epoch": 89,
+ "train_loss": 3.5287904942321777,
+ "train_acc": 0.09666,
+ "test_loss": 2.302585191345215,
+ "test_acc": 0.1,
+ "lyapunov": 1.9215726117648737,
+ "grad_norm": 0.084132595254172,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 38.642388105392456
+ },
+ {
+ "epoch": 90,
+ "train_loss": 3.526969603881836,
+ "train_acc": 0.09754,
+ "test_loss": 2.302585014343262,
+ "test_acc": 0.1,
+ "lyapunov": 1.920039845549542,
+ "grad_norm": 0.0821271686806539,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 38.63814377784729
+ },
+ {
+ "epoch": 91,
+ "train_loss": 3.527617153930664,
+ "train_acc": 0.09638,
+ "test_loss": 2.302585041809082,
+ "test_acc": 0.1,
+ "lyapunov": 1.9205815706716474,
+ "grad_norm": 0.08312510555513332,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 38.61940360069275
+ },
+ {
+ "epoch": 92,
+ "train_loss": 3.5268433947753905,
+ "train_acc": 0.09684,
+ "test_loss": 2.3025852138519287,
+ "test_acc": 0.1,
+ "lyapunov": 1.9199492108181615,
+ "grad_norm": 0.0823876986166593,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 38.627458810806274
+ },
+ {
+ "epoch": 93,
+ "train_loss": 3.53038783744812,
+ "train_acc": 0.0982,
+ "test_loss": 2.3025850196838378,
+ "test_acc": 0.1,
+ "lyapunov": 1.9228984605320885,
+ "grad_norm": 0.08263085862758328,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 38.63483691215515
+ },
+ {
+ "epoch": 94,
+ "train_loss": 3.5289703980255127,
+ "train_acc": 0.09816,
+ "test_loss": 2.3025850566864015,
+ "test_acc": 0.1,
+ "lyapunov": 1.9216854218631754,
+ "grad_norm": 0.08327210271669083,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 38.63469362258911
+ },
+ {
+ "epoch": 95,
+ "train_loss": 3.5277647956848144,
+ "train_acc": 0.0995,
+ "test_loss": 2.3025852081298828,
+ "test_acc": 0.1,
+ "lyapunov": 1.9207559202028357,
+ "grad_norm": 0.08352486265414892,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 38.64616012573242
+ },
+ {
+ "epoch": 96,
+ "train_loss": 3.526619141845703,
+ "train_acc": 0.09938,
+ "test_loss": 2.3025851345062254,
+ "test_acc": 0.1,
+ "lyapunov": 1.9198539360709812,
+ "grad_norm": 0.08098182122024891,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 38.62220072746277
+ },
+ {
+ "epoch": 97,
+ "train_loss": 3.5280892516326903,
+ "train_acc": 0.1,
+ "test_loss": 2.3025852352142335,
+ "test_acc": 0.1,
+ "lyapunov": 1.921060741100165,
+ "grad_norm": 0.08211810367594433,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 38.645119190216064
+ },
+ {
+ "epoch": 98,
+ "train_loss": 3.5287079336547853,
+ "train_acc": 0.1,
+ "test_loss": 2.3025850273132322,
+ "test_acc": 0.1,
+ "lyapunov": 1.9215380800959398,
+ "grad_norm": 0.08325515946558669,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 38.63027763366699
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.5253015606689453,
+ "train_acc": 0.1,
+ "test_loss": 2.30258511428833,
+ "test_acc": 0.1,
+ "lyapunov": 1.9187132022569857,
+ "grad_norm": 0.08193671483030009,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.467198171342e-07,
+ "time_sec": 38.63921046257019
+ },
+ {
+ "epoch": 100,
+ "train_loss": 3.5272140621948243,
+ "train_acc": 0.1,
+ "test_loss": 2.302585135269165,
+ "test_acc": 0.1,
+ "lyapunov": 1.9202767503840843,
+ "grad_norm": 0.08222655054617872,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 38.6323139667511
+ }
+ ],
+ "8": [
+ {
+ "epoch": 1,
+ "train_loss": 8.479881681365967,
+ "train_acc": 0.15672,
+ "test_loss": 2.162619204711914,
+ "test_acc": 0.2125,
+ "lyapunov": 4.108346384199684,
+ "grad_norm": 7.697098833505723,
+ "grad_max_sv": 6.178906440734863,
+ "grad_min_sv": 2.761631513692464e-07,
+ "grad_condition": 23140136.221944965,
+ "lr": 0.0009997532801828658,
+ "time_sec": 81.47396469116211
+ },
+ {
+ "epoch": 2,
+ "train_loss": 5.665244631958008,
+ "train_acc": 0.18,
+ "test_loss": 2.1842808677673338,
+ "test_acc": 0.1923,
+ "lyapunov": 3.230283256686862,
+ "grad_norm": 5.392009012742897,
+ "grad_max_sv": 4.110089653730393,
+ "grad_min_sv": 1.9321651976156317e-07,
+ "grad_condition": 21420475.323837068,
+ "lr": 0.0009990133642141358,
+ "time_sec": 81.45991396903992
+ },
+ {
+ "epoch": 3,
+ "train_loss": 5.333162035522461,
+ "train_acc": 0.1952,
+ "test_loss": 2.225303956604004,
+ "test_acc": 0.167,
+ "lyapunov": 3.1082111679379594,
+ "grad_norm": 3.851771920219555,
+ "grad_max_sv": 3.176962560415268,
+ "grad_min_sv": 1.3438213457561688e-07,
+ "grad_condition": 23879291.498504233,
+ "lr": 0.00099778098230154,
+ "time_sec": 81.46788787841797
+ },
+ {
+ "epoch": 4,
+ "train_loss": 5.171234805908203,
+ "train_acc": 0.20002,
+ "test_loss": 2.235258939361572,
+ "test_acc": 0.159,
+ "lyapunov": 3.0473744570446746,
+ "grad_norm": 2.481126294013876,
+ "grad_max_sv": 2.0792742133140565,
+ "grad_min_sv": 8.9392968050106e-08,
+ "grad_condition": 24637829.84704242,
+ "lr": 0.000996057350657239,
+ "time_sec": 81.47967004776001
+ },
+ {
+ "epoch": 5,
+ "train_loss": 5.166805406799316,
+ "train_acc": 0.19452,
+ "test_loss": 2.237046794128418,
+ "test_acc": 0.1327,
+ "lyapunov": 3.0511742223559133,
+ "grad_norm": 1.3615579983642885,
+ "grad_max_sv": 1.0548206314444541,
+ "grad_min_sv": 4.5490313116403056e-08,
+ "grad_condition": 23987300.59429905,
+ "lr": 0.0009938441702975688,
+ "time_sec": 81.459157705307
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.8697237976074215,
+ "train_acc": 0.1737,
+ "test_loss": 2.2830872146606445,
+ "test_acc": 0.1253,
+ "lyapunov": 2.8754516471072535,
+ "grad_norm": 0.6903867745940513,
+ "grad_max_sv": 0.41943032629787924,
+ "grad_min_sv": 1.919375629544362e-08,
+ "grad_condition": 22192013.87340497,
+ "lr": 0.0009911436253643444,
+ "time_sec": 81.48192954063416
+ },
+ {
+ "epoch": 7,
+ "train_loss": 4.493588522949219,
+ "train_acc": 0.15938,
+ "test_loss": 2.3302653469085692,
+ "test_acc": 0.1,
+ "lyapunov": 2.653091859939458,
+ "grad_norm": 0.7557218960403191,
+ "grad_max_sv": 0.26077940948307515,
+ "grad_min_sv": 1.0986899512399616e-08,
+ "grad_condition": 25117189.859535195,
+ "lr": 0.0009879583809693736,
+ "time_sec": 81.4841628074646
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.350341845397949,
+ "train_acc": 0.15252,
+ "test_loss": 2.3086660652160647,
+ "test_acc": 0.1,
+ "lyapunov": 2.5555299291830234,
+ "grad_norm": 0.6250628446482196,
+ "grad_max_sv": 0.20942260958254338,
+ "grad_min_sv": 7.251302003297155e-09,
+ "grad_condition": 30522570.970140863,
+ "lr": 0.0009842915805643154,
+ "time_sec": 81.46237683296204
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.145118522186279,
+ "train_acc": 0.13274,
+ "test_loss": 2.315164138031006,
+ "test_acc": 0.1,
+ "lyapunov": 2.40533269762688,
+ "grad_norm": 0.6205908073118289,
+ "grad_max_sv": 0.14447018823120744,
+ "grad_min_sv": 4.4057232563565755e-09,
+ "grad_condition": 34238562.93985257,
+ "lr": 0.0009801468428384714,
+ "time_sec": 81.4730293750763
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.078840268859863,
+ "train_acc": 0.1284,
+ "test_loss": 2.3138900623321534,
+ "test_acc": 0.1,
+ "lyapunov": 2.363016066343888,
+ "grad_norm": 0.7930843872612708,
+ "grad_max_sv": 0.10398251404985785,
+ "grad_min_sv": 3.7019540950061767e-09,
+ "grad_condition": 60913515.913623154,
+ "lr": 0.0009755282581475767,
+ "time_sec": 81.45200657844543
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.092224692230225,
+ "train_acc": 0.1466,
+ "test_loss": 2.312975662994385,
+ "test_acc": 0.1,
+ "lyapunov": 2.3754844513085795,
+ "grad_norm": 1.1984655112922225,
+ "grad_max_sv": 0.17450910471379757,
+ "grad_min_sv": 5.5799074860640734e-09,
+ "grad_condition": 13168082812.37189,
+ "lr": 0.0009704403844771127,
+ "time_sec": 81.45421433448792
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.142614550323486,
+ "train_acc": 0.10048,
+ "test_loss": 2.3073625778198243,
+ "test_acc": 0.1,
+ "lyapunov": 2.36521298623146,
+ "grad_norm": 0.8201455961321854,
+ "grad_max_sv": 0.06452706009149552,
+ "grad_min_sv": 1.4042129118228878e-12,
+ "grad_condition": 50885083514.90724,
+ "lr": 0.0009648882429441257,
+ "time_sec": 81.46072387695312
+ },
+ {
+ "epoch": 13,
+ "train_loss": 3.979385091934204,
+ "train_acc": 0.10066,
+ "test_loss": 2.3081630187988282,
+ "test_acc": 0.1,
+ "lyapunov": 2.26381984696059,
+ "grad_norm": 0.16210184952823345,
+ "grad_max_sv": 0.04905642978847027,
+ "grad_min_sv": 2.7241308859756593e-12,
+ "grad_condition": 39268609789.13625,
+ "lr": 0.0009588773128419905,
+ "time_sec": 81.4600670337677
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.013840252990723,
+ "train_acc": 0.09774,
+ "test_loss": 2.3071225547790526,
+ "test_acc": 0.1,
+ "lyapunov": 2.2779995590219717,
+ "grad_norm": 0.2350799590612887,
+ "grad_max_sv": 0.03584399004466832,
+ "grad_min_sv": 2.4371194341884142e-11,
+ "grad_condition": 24256890299.017464,
+ "lr": 0.0009524135262330098,
+ "time_sec": 81.45963406562805
+ },
+ {
+ "epoch": 15,
+ "train_loss": 3.9913157040405274,
+ "train_acc": 0.09784,
+ "test_loss": 2.319146055984497,
+ "test_acc": 0.1,
+ "lyapunov": 2.268958825894329,
+ "grad_norm": 0.15763925383129676,
+ "grad_max_sv": 0.009183965646661818,
+ "grad_min_sv": 1.97946225383161e-12,
+ "grad_condition": 8163098832.376617,
+ "lr": 0.0009455032620941839,
+ "time_sec": 81.44594478607178
+ },
+ {
+ "epoch": 16,
+ "train_loss": 3.9718331854248046,
+ "train_acc": 0.0996,
+ "test_loss": 2.3092525833129884,
+ "test_acc": 0.1,
+ "lyapunov": 2.2586230457286396,
+ "grad_norm": 0.11766352456542575,
+ "grad_max_sv": 0.006989215174689889,
+ "grad_min_sv": 2.4024430389645366e-14,
+ "grad_condition": 6504081924.260536,
+ "lr": 0.0009381533400219318,
+ "time_sec": 81.44390797615051
+ },
+ {
+ "epoch": 17,
+ "train_loss": 3.9787883277130125,
+ "train_acc": 0.09702,
+ "test_loss": 2.3043574817657473,
+ "test_acc": 0.1,
+ "lyapunov": 2.2631307922665727,
+ "grad_norm": 0.1527010207412437,
+ "grad_max_sv": 0.009803948854096235,
+ "grad_min_sv": 1.4435005241224427e-33,
+ "grad_condition": 9803948854.096233,
+ "lr": 0.0009303710135019719,
+ "time_sec": 81.43403100967407
+ },
+ {
+ "epoch": 18,
+ "train_loss": 3.9913615090942383,
+ "train_acc": 0.09744,
+ "test_loss": 2.3033508323669434,
+ "test_acc": 0.1,
+ "lyapunov": 2.269262256524752,
+ "grad_norm": 0.11184179273021279,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009221639627510076,
+ "time_sec": 81.42399740219116
+ },
+ {
+ "epoch": 19,
+ "train_loss": 3.9763801429748535,
+ "train_acc": 0.0977,
+ "test_loss": 2.3026752422332764,
+ "test_acc": 0.1,
+ "lyapunov": 2.2619051079615913,
+ "grad_norm": 0.11713248666386221,
+ "grad_max_sv": 0.000484072370454669,
+ "grad_min_sv": 0.0,
+ "grad_condition": 484072370.454669,
+ "lr": 0.000913540287137281,
+ "time_sec": 81.4525249004364
+ },
+ {
+ "epoch": 20,
+ "train_loss": 3.976750040283203,
+ "train_acc": 0.09734,
+ "test_loss": 2.302591667175293,
+ "test_acc": 0.1,
+ "lyapunov": 2.262148560770332,
+ "grad_norm": 0.11345857984491753,
+ "grad_max_sv": 0.004815328773111105,
+ "grad_min_sv": 7.298523316195025e-36,
+ "grad_condition": 4815328773.111105,
+ "lr": 0.0009045084971874739,
+ "time_sec": 81.51628756523132
+ },
+ {
+ "epoch": 21,
+ "train_loss": 3.980269993438721,
+ "train_acc": 0.09802,
+ "test_loss": 2.302587752532959,
+ "test_acc": 0.1,
+ "lyapunov": 2.264334798164075,
+ "grad_norm": 0.13684662833237576,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008950775061878452,
+ "time_sec": 81.45560097694397
+ },
+ {
+ "epoch": 22,
+ "train_loss": 3.9804648877716065,
+ "train_acc": 0.0979,
+ "test_loss": 2.302587752532959,
+ "test_acc": 0.1,
+ "lyapunov": 2.2635294013011182,
+ "grad_norm": 0.13344079799844585,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008852566213878947,
+ "time_sec": 81.44366526603699
+ },
+ {
+ "epoch": 23,
+ "train_loss": 3.9813251597595216,
+ "train_acc": 0.09872,
+ "test_loss": 2.302596923828125,
+ "test_acc": 0.1,
+ "lyapunov": 2.264318755825462,
+ "grad_norm": 0.11240815342914404,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008750555348152298,
+ "time_sec": 81.4700722694397
+ },
+ {
+ "epoch": 24,
+ "train_loss": 3.9829969465637207,
+ "train_acc": 0.09762,
+ "test_loss": 2.302590003967285,
+ "test_acc": 0.1,
+ "lyapunov": 2.2655306484388267,
+ "grad_norm": 0.13657445352154945,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008644843137107057,
+ "time_sec": 81.44092345237732
+ },
+ {
+ "epoch": 25,
+ "train_loss": 3.9867445934295653,
+ "train_acc": 0.09768,
+ "test_loss": 2.3025884731292723,
+ "test_acc": 0.1,
+ "lyapunov": 2.2683042187215117,
+ "grad_norm": 0.13504220620651136,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008535533905932737,
+ "time_sec": 81.44885325431824
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.011947896575927,
+ "train_acc": 0.09772,
+ "test_loss": 2.302588147735596,
+ "test_acc": 0.1,
+ "lyapunov": 2.2796514083052535,
+ "grad_norm": 0.16320303411181733,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008422735529643444,
+ "time_sec": 81.45354628562927
+ },
+ {
+ "epoch": 27,
+ "train_loss": 3.9786824931335447,
+ "train_acc": 0.09896,
+ "test_loss": 2.302594832611084,
+ "test_acc": 0.1,
+ "lyapunov": 2.26323458300832,
+ "grad_norm": 0.10988564477689002,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008306559326618259,
+ "time_sec": 81.44628882408142
+ },
+ {
+ "epoch": 28,
+ "train_loss": 3.977536257247925,
+ "train_acc": 0.098,
+ "test_loss": 2.302598391723633,
+ "test_acc": 0.1,
+ "lyapunov": 2.262441022926584,
+ "grad_norm": 0.12595116922261335,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008187119948743449,
+ "time_sec": 81.4543764591217
+ },
+ {
+ "epoch": 29,
+ "train_loss": 3.976567816162109,
+ "train_acc": 0.09876,
+ "test_loss": 2.302590633010864,
+ "test_acc": 0.1,
+ "lyapunov": 2.2617232262935785,
+ "grad_norm": 0.11663224483129596,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008064535268264883,
+ "time_sec": 81.45405316352844
+ },
+ {
+ "epoch": 30,
+ "train_loss": 3.98611599609375,
+ "train_acc": 0.09902,
+ "test_loss": 2.302588882827759,
+ "test_acc": 0.1,
+ "lyapunov": 2.268034580723404,
+ "grad_norm": 0.12156603788402341,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007938926261462367,
+ "time_sec": 81.43305087089539
+ },
+ {
+ "epoch": 31,
+ "train_loss": 3.973400810546875,
+ "train_acc": 0.09778,
+ "test_loss": 2.3025912315368653,
+ "test_acc": 0.1,
+ "lyapunov": 2.259550383633665,
+ "grad_norm": 0.11416147448139306,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007810416889260654,
+ "time_sec": 81.45837593078613
+ },
+ {
+ "epoch": 32,
+ "train_loss": 3.988133301086426,
+ "train_acc": 0.0974,
+ "test_loss": 2.3025894966125486,
+ "test_acc": 0.1,
+ "lyapunov": 2.2669999562870817,
+ "grad_norm": 0.11056723038790034,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007679133974894983,
+ "time_sec": 81.44456076622009
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.005648225860596,
+ "train_acc": 0.09582,
+ "test_loss": 2.302590217590332,
+ "test_acc": 0.1,
+ "lyapunov": 2.2759649180390342,
+ "grad_norm": 0.15627582965327647,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007545207078751857,
+ "time_sec": 81.45507860183716
+ },
+ {
+ "epoch": 34,
+ "train_loss": 3.979487621154785,
+ "train_acc": 0.09842,
+ "test_loss": 2.3025886589050293,
+ "test_acc": 0.1,
+ "lyapunov": 2.2636950528225324,
+ "grad_norm": 0.11766964677730013,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007408768370508577,
+ "time_sec": 81.40873432159424
+ },
+ {
+ "epoch": 35,
+ "train_loss": 3.9761420146942137,
+ "train_acc": 0.09734,
+ "test_loss": 2.3025886192321776,
+ "test_acc": 0.1,
+ "lyapunov": 2.2615554509565348,
+ "grad_norm": 0.13516175590778773,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007269952498697734,
+ "time_sec": 81.41994976997375
+ },
+ {
+ "epoch": 36,
+ "train_loss": 3.982365760269165,
+ "train_acc": 0.09772,
+ "test_loss": 2.302588511276245,
+ "test_acc": 0.1,
+ "lyapunov": 2.2654811189607584,
+ "grad_norm": 0.11681074828605718,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007128896457825364,
+ "time_sec": 81.44073605537415
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.0145159342956545,
+ "train_acc": 0.09844,
+ "test_loss": 2.3025877605438234,
+ "test_acc": 0.1,
+ "lyapunov": 2.279959214617834,
+ "grad_norm": 0.16927419652036743,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006985739453173903,
+ "time_sec": 81.44942951202393
+ },
+ {
+ "epoch": 38,
+ "train_loss": 3.9834751657104492,
+ "train_acc": 0.0988,
+ "test_loss": 2.3025879089355468,
+ "test_acc": 0.1,
+ "lyapunov": 2.26584634939423,
+ "grad_norm": 0.14984272020285577,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006840622763423391,
+ "time_sec": 81.45499515533447
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.02413849609375,
+ "train_acc": 0.09734,
+ "test_loss": 2.30258787689209,
+ "test_acc": 0.1,
+ "lyapunov": 2.286009701316619,
+ "grad_norm": 0.22145868959770007,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006693689601226458,
+ "time_sec": 81.45317363739014
+ },
+ {
+ "epoch": 40,
+ "train_loss": 3.9736411520385744,
+ "train_acc": 0.09894,
+ "test_loss": 2.3025887702941894,
+ "test_acc": 0.1,
+ "lyapunov": 2.259992800710146,
+ "grad_norm": 0.08893647577966153,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006545084971874737,
+ "time_sec": 81.45592546463013
+ },
+ {
+ "epoch": 41,
+ "train_loss": 3.976674521484375,
+ "train_acc": 0.09844,
+ "test_loss": 2.302586205673218,
+ "test_acc": 0.1,
+ "lyapunov": 2.262093958647355,
+ "grad_norm": 0.09526075366227103,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006394955530196147,
+ "time_sec": 81.4629635810852
+ },
+ {
+ "epoch": 42,
+ "train_loss": 3.9767224240112307,
+ "train_acc": 0.09934,
+ "test_loss": 2.3025863662719726,
+ "test_acc": 0.1,
+ "lyapunov": 2.2621575853098994,
+ "grad_norm": 0.0889728077319319,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006243449435824273,
+ "time_sec": 81.4452486038208
+ },
+ {
+ "epoch": 43,
+ "train_loss": 3.9843084770202637,
+ "train_acc": 0.0983,
+ "test_loss": 2.302587857055664,
+ "test_acc": 0.1,
+ "lyapunov": 2.266823678980093,
+ "grad_norm": 0.14286833201945623,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006090716206982714,
+ "time_sec": 81.46053290367126
+ },
+ {
+ "epoch": 44,
+ "train_loss": 3.978666923828125,
+ "train_acc": 0.09862,
+ "test_loss": 2.302588472366333,
+ "test_acc": 0.1,
+ "lyapunov": 2.262758489764865,
+ "grad_norm": 0.10285858309556797,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005936906572928625,
+ "time_sec": 81.4441590309143
+ },
+ {
+ "epoch": 45,
+ "train_loss": 3.984368924102783,
+ "train_acc": 0.09714,
+ "test_loss": 2.3025872661590574,
+ "test_acc": 0.1,
+ "lyapunov": 2.2663481009890662,
+ "grad_norm": 0.11152947980914625,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005782172325201156,
+ "time_sec": 81.43797850608826
+ },
+ {
+ "epoch": 46,
+ "train_loss": 3.9835290453338623,
+ "train_acc": 0.09794,
+ "test_loss": 2.302588889694214,
+ "test_acc": 0.1,
+ "lyapunov": 2.2661942069792684,
+ "grad_norm": 0.12155880302110986,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005626666167821523,
+ "time_sec": 81.4439845085144
+ },
+ {
+ "epoch": 47,
+ "train_loss": 3.976571675872803,
+ "train_acc": 0.09746,
+ "test_loss": 2.302587047958374,
+ "test_acc": 0.1,
+ "lyapunov": 2.262034943646482,
+ "grad_norm": 0.09434388559512244,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005470541566592572,
+ "time_sec": 81.44648504257202
+ },
+ {
+ "epoch": 48,
+ "train_loss": 3.978961787414551,
+ "train_acc": 0.09674,
+ "test_loss": 2.302586452484131,
+ "test_acc": 0.1,
+ "lyapunov": 2.2636160929794507,
+ "grad_norm": 0.09388300184277713,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005313952597646569,
+ "time_sec": 81.50625872612
+ },
+ {
+ "epoch": 49,
+ "train_loss": 3.9766515798950195,
+ "train_acc": 0.09856,
+ "test_loss": 2.302586361694336,
+ "test_acc": 0.1,
+ "lyapunov": 2.2621047679725512,
+ "grad_norm": 0.08611192583269686,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005157053795390643,
+ "time_sec": 81.42919588088989
+ },
+ {
+ "epoch": 50,
+ "train_loss": 3.9754750718688965,
+ "train_acc": 0.09614,
+ "test_loss": 2.302587022018433,
+ "test_acc": 0.1,
+ "lyapunov": 2.261166003049182,
+ "grad_norm": 0.09585057441328976,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005000000000000002,
+ "time_sec": 81.43738746643066
+ },
+ {
+ "epoch": 51,
+ "train_loss": 3.9752406224823,
+ "train_acc": 0.09726,
+ "test_loss": 2.302586801147461,
+ "test_acc": 0.1,
+ "lyapunov": 2.2611102423704494,
+ "grad_norm": 0.09095072097377155,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00048429462046093607,
+ "time_sec": 81.45784163475037
+ },
+ {
+ "epoch": 52,
+ "train_loss": 3.98188600982666,
+ "train_acc": 0.0951,
+ "test_loss": 2.302586806488037,
+ "test_acc": 0.1,
+ "lyapunov": 2.265076126893768,
+ "grad_norm": 0.1123738428492386,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004686047402353435,
+ "time_sec": 81.47153091430664
+ },
+ {
+ "epoch": 53,
+ "train_loss": 3.980596968536377,
+ "train_acc": 0.0976,
+ "test_loss": 2.3025859146118166,
+ "test_acc": 0.1,
+ "lyapunov": 2.2645553932775315,
+ "grad_norm": 0.1076773200596488,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000452945843340743,
+ "time_sec": 81.44375872612
+ },
+ {
+ "epoch": 54,
+ "train_loss": 3.9776349996948244,
+ "train_acc": 0.09706,
+ "test_loss": 2.3025868438720702,
+ "test_acc": 0.1,
+ "lyapunov": 2.2628720568878875,
+ "grad_norm": 0.08828239082049001,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00043733338321784806,
+ "time_sec": 81.42411518096924
+ },
+ {
+ "epoch": 55,
+ "train_loss": 3.9808822979736327,
+ "train_acc": 0.09588,
+ "test_loss": 2.302585488128662,
+ "test_acc": 0.1,
+ "lyapunov": 2.2643827629821076,
+ "grad_norm": 0.11262628002715089,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004217827674798847,
+ "time_sec": 81.4528546333313
+ },
+ {
+ "epoch": 56,
+ "train_loss": 3.974801806488037,
+ "train_acc": 0.09592,
+ "test_loss": 2.3025861625671387,
+ "test_acc": 0.1,
+ "lyapunov": 2.2608287944208327,
+ "grad_norm": 0.09195483599034024,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00040630934270713783,
+ "time_sec": 81.44676446914673
+ },
+ {
+ "epoch": 57,
+ "train_loss": 3.976495365371704,
+ "train_acc": 0.09736,
+ "test_loss": 2.3025858879089354,
+ "test_acc": 0.1,
+ "lyapunov": 2.262001718096721,
+ "grad_norm": 0.08361845913085657,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000390928379301729,
+ "time_sec": 81.45348882675171
+ },
+ {
+ "epoch": 58,
+ "train_loss": 3.980894155731201,
+ "train_acc": 0.09842,
+ "test_loss": 2.3025855281829832,
+ "test_acc": 0.1,
+ "lyapunov": 2.2647068646862683,
+ "grad_norm": 0.11991605921354555,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003756550564175727,
+ "time_sec": 81.47408199310303
+ },
+ {
+ "epoch": 59,
+ "train_loss": 3.994586195449829,
+ "train_acc": 0.0973,
+ "test_loss": 2.3025854663848877,
+ "test_acc": 0.1,
+ "lyapunov": 2.27294464672313,
+ "grad_norm": 0.18222829815312913,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036050444698038553,
+ "time_sec": 81.44711089134216
+ },
+ {
+ "epoch": 60,
+ "train_loss": 3.9781198291015625,
+ "train_acc": 0.09658,
+ "test_loss": 2.3025856033325196,
+ "test_acc": 0.1,
+ "lyapunov": 2.263154449365328,
+ "grad_norm": 0.08448254246697348,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00034549150281252655,
+ "time_sec": 81.44161295890808
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.02450031616211,
+ "train_acc": 0.0976,
+ "test_loss": 2.302585502624512,
+ "test_acc": 0.1,
+ "lyapunov": 2.286170544831649,
+ "grad_norm": 0.23432897685131301,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003306310398773544,
+ "time_sec": 81.45745611190796
+ },
+ {
+ "epoch": 62,
+ "train_loss": 3.988269701385498,
+ "train_acc": 0.09688,
+ "test_loss": 2.3025854175567626,
+ "test_acc": 0.1,
+ "lyapunov": 2.267505117084669,
+ "grad_norm": 0.10764931064603923,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00031593772365766127,
+ "time_sec": 81.45787954330444
+ },
+ {
+ "epoch": 63,
+ "train_loss": 3.9736854934692385,
+ "train_acc": 0.09646,
+ "test_loss": 2.3025857013702393,
+ "test_acc": 0.1,
+ "lyapunov": 2.2600014398774833,
+ "grad_norm": 0.08382317206831051,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003014260546826097,
+ "time_sec": 81.44196057319641
+ },
+ {
+ "epoch": 64,
+ "train_loss": 3.9797292990875244,
+ "train_acc": 0.0969,
+ "test_loss": 2.3025853332519532,
+ "test_acc": 0.1,
+ "lyapunov": 2.264177340680681,
+ "grad_norm": 0.11933485737211565,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002871103542174637,
+ "time_sec": 81.45828652381897
+ },
+ {
+ "epoch": 65,
+ "train_loss": 3.9763733405303956,
+ "train_acc": 0.097,
+ "test_loss": 2.3025854026794432,
+ "test_acc": 0.1,
+ "lyapunov": 2.2618614468733065,
+ "grad_norm": 0.08601466707594763,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002730047501302267,
+ "time_sec": 81.44515085220337
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.001672252197266,
+ "train_acc": 0.09836,
+ "test_loss": 2.302585359954834,
+ "test_acc": 0.1,
+ "lyapunov": 2.276178054492492,
+ "grad_norm": 0.19097066416551475,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00025912316294914234,
+ "time_sec": 81.44997453689575
+ },
+ {
+ "epoch": 67,
+ "train_loss": 3.983064818649292,
+ "train_acc": 0.09848,
+ "test_loss": 2.302585221862793,
+ "test_acc": 0.1,
+ "lyapunov": 2.2660030678410052,
+ "grad_norm": 0.11726894505680324,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002454792921248144,
+ "time_sec": 81.45755219459534
+ },
+ {
+ "epoch": 68,
+ "train_loss": 3.9874353774261473,
+ "train_acc": 0.09726,
+ "test_loss": 2.302585542297363,
+ "test_acc": 0.1,
+ "lyapunov": 2.26753244497587,
+ "grad_norm": 0.1096052061821724,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00023208660251050164,
+ "time_sec": 81.45092463493347
+ },
+ {
+ "epoch": 69,
+ "train_loss": 3.984990802612305,
+ "train_acc": 0.09842,
+ "test_loss": 2.3025853466033936,
+ "test_acc": 0.1,
+ "lyapunov": 2.2674437922894803,
+ "grad_norm": 0.08538883278176537,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00021895831107393473,
+ "time_sec": 81.44036960601807
+ },
+ {
+ "epoch": 70,
+ "train_loss": 3.9768560768127443,
+ "train_acc": 0.09864,
+ "test_loss": 2.3025853176116944,
+ "test_acc": 0.1,
+ "lyapunov": 2.262266612113894,
+ "grad_norm": 0.0826759570118499,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376356,
+ "time_sec": 81.44237995147705
+ },
+ {
+ "epoch": 71,
+ "train_loss": 3.97729412109375,
+ "train_acc": 0.09838,
+ "test_loss": 2.3025852783203127,
+ "test_acc": 0.1,
+ "lyapunov": 2.262566337195199,
+ "grad_norm": 0.08149339121565821,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019354647317351177,
+ "time_sec": 81.46553111076355
+ },
+ {
+ "epoch": 72,
+ "train_loss": 3.999013508300781,
+ "train_acc": 0.09792,
+ "test_loss": 2.3025853332519532,
+ "test_acc": 0.1,
+ "lyapunov": 2.2738718602358534,
+ "grad_norm": 0.15690481475260892,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001812880051256552,
+ "time_sec": 81.440505027771
+ },
+ {
+ "epoch": 73,
+ "train_loss": 3.9769914697265625,
+ "train_acc": 0.09758,
+ "test_loss": 2.302585132598877,
+ "test_acc": 0.1,
+ "lyapunov": 2.262345004264656,
+ "grad_norm": 0.08468511131490652,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016934406733817422,
+ "time_sec": 81.45508050918579
+ },
+ {
+ "epoch": 74,
+ "train_loss": 3.9735559133148195,
+ "train_acc": 0.09684,
+ "test_loss": 2.302585078430176,
+ "test_acc": 0.1,
+ "lyapunov": 2.2599204360981426,
+ "grad_norm": 0.08407853053475459,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001577264470356557,
+ "time_sec": 81.43686723709106
+ },
+ {
+ "epoch": 75,
+ "train_loss": 3.975616183166504,
+ "train_acc": 0.09758,
+ "test_loss": 2.302585101699829,
+ "test_acc": 0.1,
+ "lyapunov": 2.2613788644980897,
+ "grad_norm": 0.08410718060667108,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014644660940672634,
+ "time_sec": 81.46202492713928
+ },
+ {
+ "epoch": 76,
+ "train_loss": 3.9777969396972654,
+ "train_acc": 0.09642,
+ "test_loss": 2.302585230255127,
+ "test_acc": 0.1,
+ "lyapunov": 2.262849387000589,
+ "grad_norm": 0.08412741392957411,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001355156862892944,
+ "time_sec": 81.69426202774048
+ },
+ {
+ "epoch": 77,
+ "train_loss": 3.997583436126709,
+ "train_acc": 0.09804,
+ "test_loss": 2.3025851612091066,
+ "test_acc": 0.1,
+ "lyapunov": 2.272977476534636,
+ "grad_norm": 0.19693507091470583,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012494446518477025,
+ "time_sec": 81.47962164878845
+ },
+ {
+ "epoch": 78,
+ "train_loss": 3.981567749633789,
+ "train_acc": 0.0972,
+ "test_loss": 2.302585176086426,
+ "test_acc": 0.1,
+ "lyapunov": 2.2653762513719253,
+ "grad_norm": 0.08819478927352292,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210548,
+ "time_sec": 81.44144415855408
+ },
+ {
+ "epoch": 79,
+ "train_loss": 3.979712967529297,
+ "train_acc": 0.09928,
+ "test_loss": 2.3025852310180666,
+ "test_acc": 0.1,
+ "lyapunov": 2.2640710157506607,
+ "grad_norm": 0.10900387268878003,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010492249381215483,
+ "time_sec": 81.44691228866577
+ },
+ {
+ "epoch": 80,
+ "train_loss": 3.9752784634399414,
+ "train_acc": 0.09612,
+ "test_loss": 2.3025851806640625,
+ "test_acc": 0.1,
+ "lyapunov": 2.2611999310495907,
+ "grad_norm": 0.08485114515050625,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 81.44573497772217
+ },
+ {
+ "epoch": 81,
+ "train_loss": 3.973998136444092,
+ "train_acc": 0.09674,
+ "test_loss": 2.302585205078125,
+ "test_acc": 0.1,
+ "lyapunov": 2.2602438634009006,
+ "grad_norm": 0.08193297107495977,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 81.44051194190979
+ },
+ {
+ "epoch": 82,
+ "train_loss": 3.9795581608581543,
+ "train_acc": 0.0974,
+ "test_loss": 2.3025851707458496,
+ "test_acc": 0.1,
+ "lyapunov": 2.2642151602088947,
+ "grad_norm": 0.08382214616673372,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 81.44579362869263
+ },
+ {
+ "epoch": 83,
+ "train_loss": 3.97544639793396,
+ "train_acc": 0.0975,
+ "test_loss": 2.3025851676940916,
+ "test_acc": 0.1,
+ "lyapunov": 2.261258240550985,
+ "grad_norm": 0.0830598190151241,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 81.46574568748474
+ },
+ {
+ "epoch": 84,
+ "train_loss": 3.9764262825775147,
+ "train_acc": 0.09818,
+ "test_loss": 2.302585060119629,
+ "test_acc": 0.1,
+ "lyapunov": 2.2619712322264376,
+ "grad_norm": 0.08369246247456191,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 81.45664143562317
+ },
+ {
+ "epoch": 85,
+ "train_loss": 3.9776910205078124,
+ "train_acc": 0.0955,
+ "test_loss": 2.3025851593017577,
+ "test_acc": 0.1,
+ "lyapunov": 2.2629058550080985,
+ "grad_norm": 0.08247891269837844,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 81.461270570755
+ },
+ {
+ "epoch": 86,
+ "train_loss": 3.9771215029907228,
+ "train_acc": 0.09536,
+ "test_loss": 2.3025850746154783,
+ "test_acc": 0.1,
+ "lyapunov": 2.2625219870711226,
+ "grad_norm": 0.08304329059000737,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 81.45261931419373
+ },
+ {
+ "epoch": 87,
+ "train_loss": 3.9780111279296877,
+ "train_acc": 0.09718,
+ "test_loss": 2.3025850124359133,
+ "test_acc": 0.1,
+ "lyapunov": 2.263096221572603,
+ "grad_norm": 0.08168556680409891,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 81.47083902359009
+ },
+ {
+ "epoch": 88,
+ "train_loss": 3.975586996154785,
+ "train_acc": 0.09506,
+ "test_loss": 2.3025851093292236,
+ "test_acc": 0.1,
+ "lyapunov": 2.261420638360026,
+ "grad_norm": 0.08585199329222436,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 81.46594524383545
+ },
+ {
+ "epoch": 89,
+ "train_loss": 3.9770257449340822,
+ "train_acc": 0.0982,
+ "test_loss": 2.3025851146698,
+ "test_acc": 0.1,
+ "lyapunov": 2.262422331153889,
+ "grad_norm": 0.08469063518506169,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 81.46577405929565
+ },
+ {
+ "epoch": 90,
+ "train_loss": 3.973931856689453,
+ "train_acc": 0.09746,
+ "test_loss": 2.3025850677490234,
+ "test_acc": 0.1,
+ "lyapunov": 2.2602365346210997,
+ "grad_norm": 0.08267580569635262,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 81.45771622657776
+ },
+ {
+ "epoch": 91,
+ "train_loss": 3.9777387670898436,
+ "train_acc": 0.09732,
+ "test_loss": 2.3025851654052736,
+ "test_acc": 0.1,
+ "lyapunov": 2.262757078765908,
+ "grad_norm": 0.10473963211370652,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 81.46830105781555
+ },
+ {
+ "epoch": 92,
+ "train_loss": 3.973895709075928,
+ "train_acc": 0.09754,
+ "test_loss": 2.302585176086426,
+ "test_acc": 0.1,
+ "lyapunov": 2.2601819568887698,
+ "grad_norm": 0.08524438116449506,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 81.45872473716736
+ },
+ {
+ "epoch": 93,
+ "train_loss": 3.975780742340088,
+ "train_acc": 0.09832,
+ "test_loss": 2.302585258483887,
+ "test_acc": 0.1,
+ "lyapunov": 2.261494060916364,
+ "grad_norm": 0.08296746372602809,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 81.44344329833984
+ },
+ {
+ "epoch": 94,
+ "train_loss": 3.9749393853759765,
+ "train_acc": 0.099,
+ "test_loss": 2.3025851181030275,
+ "test_acc": 0.1,
+ "lyapunov": 2.2609141049787516,
+ "grad_norm": 0.081703214219651,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 81.47197723388672
+ },
+ {
+ "epoch": 95,
+ "train_loss": 3.977360173110962,
+ "train_acc": 0.09844,
+ "test_loss": 2.3025852035522463,
+ "test_acc": 0.1,
+ "lyapunov": 2.2626446403200973,
+ "grad_norm": 0.08370580659845218,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 81.4649875164032
+ },
+ {
+ "epoch": 96,
+ "train_loss": 3.9748195641326904,
+ "train_acc": 0.09918,
+ "test_loss": 2.3025851348876953,
+ "test_acc": 0.1,
+ "lyapunov": 2.2608655974688125,
+ "grad_norm": 0.08506351899121649,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 81.45548796653748
+ },
+ {
+ "epoch": 97,
+ "train_loss": 3.977184408874512,
+ "train_acc": 0.09888,
+ "test_loss": 2.3025851238250734,
+ "test_acc": 0.1,
+ "lyapunov": 2.262512852163876,
+ "grad_norm": 0.08383579924614167,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 81.4503653049469
+ },
+ {
+ "epoch": 98,
+ "train_loss": 3.979651080627441,
+ "train_acc": 0.1,
+ "test_loss": 2.3025852249145506,
+ "test_acc": 0.1,
+ "lyapunov": 2.264271725778994,
+ "grad_norm": 0.08181479722385572,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 81.46501636505127
+ },
+ {
+ "epoch": 99,
+ "train_loss": 3.9744724880981446,
+ "train_acc": 0.1,
+ "test_loss": 2.302585131072998,
+ "test_acc": 0.1,
+ "lyapunov": 2.260578519547992,
+ "grad_norm": 0.08286890329554125,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.467198171342e-07,
+ "time_sec": 81.44538688659668
+ },
+ {
+ "epoch": 100,
+ "train_loss": 3.9755064764404295,
+ "train_acc": 0.1,
+ "test_loss": 2.302585161590576,
+ "test_acc": 0.1,
+ "lyapunov": 2.2613274374276475,
+ "grad_norm": 0.08253103448725845,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 81.44115138053894
+ }
+ ],
+ "12": [
+ {
+ "epoch": 1,
+ "train_loss": 11.514268187866211,
+ "train_acc": 0.12322,
+ "test_loss": 2.335220721435547,
+ "test_acc": 0.1082,
+ "lyapunov": 5.094494405609872,
+ "grad_norm": 6.68472372840091,
+ "grad_max_sv": 5.768041110038757,
+ "grad_min_sv": 2.425695402763495e-07,
+ "grad_condition": 23767971.115653183,
+ "lr": 0.0009997532801828658,
+ "time_sec": 124.28109288215637
+ },
+ {
+ "epoch": 2,
+ "train_loss": 6.767582432556153,
+ "train_acc": 0.13338,
+ "test_loss": 2.3135711360931395,
+ "test_acc": 0.1058,
+ "lyapunov": 3.703414491375389,
+ "grad_norm": 4.437490608687784,
+ "grad_max_sv": 3.688317948579788,
+ "grad_min_sv": 1.6068337682639822e-07,
+ "grad_condition": 23679624.47851156,
+ "lr": 0.0009990133642141358,
+ "time_sec": 124.28083038330078
+ },
+ {
+ "epoch": 3,
+ "train_loss": 6.359151521911621,
+ "train_acc": 0.1371,
+ "test_loss": 2.3046204761505127,
+ "test_acc": 0.1017,
+ "lyapunov": 3.53740519087028,
+ "grad_norm": 3.3992685611612004,
+ "grad_max_sv": 3.1906665176153184,
+ "grad_min_sv": 1.0806052515022202e-07,
+ "grad_condition": 30020073.39935509,
+ "lr": 0.00099778098230154,
+ "time_sec": 124.26130867004395
+ },
+ {
+ "epoch": 4,
+ "train_loss": 5.680015151367187,
+ "train_acc": 0.12346,
+ "test_loss": 2.4307143615722655,
+ "test_acc": 0.0946,
+ "lyapunov": 3.2194143725783015,
+ "grad_norm": 3.6284679983008856,
+ "grad_max_sv": 2.3083297662011844,
+ "grad_min_sv": 7.267783242878633e-08,
+ "grad_condition": 28802302.157710887,
+ "lr": 0.000996057350657239,
+ "time_sec": 124.2893226146698
+ },
+ {
+ "epoch": 5,
+ "train_loss": 5.515282614440918,
+ "train_acc": 0.11878,
+ "test_loss": 2.3333636627197265,
+ "test_acc": 0.0806,
+ "lyapunov": 3.1298821100493526,
+ "grad_norm": 2.1440857096164527,
+ "grad_max_sv": 1.8293321043252946,
+ "grad_min_sv": 6.11613814704981e-08,
+ "grad_condition": 30298382.919277746,
+ "lr": 0.0009938441702975688,
+ "time_sec": 124.24556708335876
+ },
+ {
+ "epoch": 6,
+ "train_loss": 4.830215334472657,
+ "train_acc": 0.10662,
+ "test_loss": 2.3030837219238283,
+ "test_acc": 0.1,
+ "lyapunov": 2.7727705700623106,
+ "grad_norm": 2.350059460657985,
+ "grad_max_sv": 1.5110829517245292,
+ "grad_min_sv": 2.7742502849842366e-08,
+ "grad_condition": 415971679.7996719,
+ "lr": 0.0009911436253643444,
+ "time_sec": 124.2670316696167
+ },
+ {
+ "epoch": 7,
+ "train_loss": 5.0002188845825195,
+ "train_acc": 0.1014,
+ "test_loss": 2.306517247772217,
+ "test_acc": 0.1,
+ "lyapunov": 2.8697540314910968,
+ "grad_norm": 4.791639177202153,
+ "grad_max_sv": 0.7900435705131315,
+ "grad_min_sv": 1.012708673176853e-08,
+ "grad_condition": 1185811132.9619708,
+ "lr": 0.0009879583809693736,
+ "time_sec": 124.2431480884552
+ },
+ {
+ "epoch": 8,
+ "train_loss": 5.872336234741211,
+ "train_acc": 0.10816,
+ "test_loss": 2.3033512046813964,
+ "test_acc": 0.1,
+ "lyapunov": 3.2996887185079666,
+ "grad_norm": 4.562165296743471,
+ "grad_max_sv": 0.4824362076822354,
+ "grad_min_sv": 1.352856967967285e-08,
+ "grad_condition": 33563973.110157445,
+ "lr": 0.0009842915805643154,
+ "time_sec": 124.24206638336182
+ },
+ {
+ "epoch": 9,
+ "train_loss": 5.207491922912598,
+ "train_acc": 0.1015,
+ "test_loss": 2.302657497024536,
+ "test_acc": 0.1,
+ "lyapunov": 2.982921624732444,
+ "grad_norm": 1.2857988530859297,
+ "grad_max_sv": 0.4782970450818539,
+ "grad_min_sv": 6.14909029240993e-09,
+ "grad_condition": 17001336844.82257,
+ "lr": 0.0009801468428384714,
+ "time_sec": 124.2599868774414
+ },
+ {
+ "epoch": 10,
+ "train_loss": 5.278977078552246,
+ "train_acc": 0.11042,
+ "test_loss": 2.303682248687744,
+ "test_acc": 0.1,
+ "lyapunov": 3.0210835842220374,
+ "grad_norm": 2.219210747930246,
+ "grad_max_sv": 0.26804067082703115,
+ "grad_min_sv": 5.793725242549423e-09,
+ "grad_condition": 7080161076.764597,
+ "lr": 0.0009755282581475767,
+ "time_sec": 124.2449324131012
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.803467753601074,
+ "train_acc": 0.1012,
+ "test_loss": 4.169252464294433,
+ "test_acc": 0.1,
+ "lyapunov": 2.77325821654571,
+ "grad_norm": 2.127622649938152,
+ "grad_max_sv": 0.1682983461767435,
+ "grad_min_sv": 5.603680153853458e-10,
+ "grad_condition": 68373983123.414894,
+ "lr": 0.0009704403844771127,
+ "time_sec": 124.30126142501831
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.544517149658203,
+ "train_acc": 0.09926,
+ "test_loss": 4.290980886840821,
+ "test_acc": 0.1,
+ "lyapunov": 2.62944141068422,
+ "grad_norm": 1.638854096476257,
+ "grad_max_sv": 0.07512564162607305,
+ "grad_min_sv": 2.6490731026315825e-12,
+ "grad_condition": 54196459261.33328,
+ "lr": 0.0009648882429441257,
+ "time_sec": 124.24927043914795
+ },
+ {
+ "epoch": 13,
+ "train_loss": 4.369602390441894,
+ "train_acc": 0.09752,
+ "test_loss": 4.109600519561767,
+ "test_acc": 0.1,
+ "lyapunov": 2.5177556279370243,
+ "grad_norm": 2.133122078616872,
+ "grad_max_sv": 0.09587469333782792,
+ "grad_min_sv": 2.093604774056981e-12,
+ "grad_condition": 86094204980.57991,
+ "lr": 0.0009588773128419905,
+ "time_sec": 124.26178216934204
+ },
+ {
+ "epoch": 14,
+ "train_loss": 4.34119681640625,
+ "train_acc": 0.09926,
+ "test_loss": 4.199708403778076,
+ "test_acc": 0.1,
+ "lyapunov": 2.495693293373908,
+ "grad_norm": 2.708849611541162,
+ "grad_max_sv": 0.09101940747350454,
+ "grad_min_sv": 8.368649587364072e-14,
+ "grad_condition": 87173383288.77208,
+ "lr": 0.0009524135262330098,
+ "time_sec": 124.24493861198425
+ },
+ {
+ "epoch": 15,
+ "train_loss": 5.13457500289917,
+ "train_acc": 0.10424,
+ "test_loss": 2.308458815765381,
+ "test_acc": 0.1,
+ "lyapunov": 2.9219820334783297,
+ "grad_norm": 3.354402938679459,
+ "grad_max_sv": 0.09543408825993538,
+ "grad_min_sv": 1.3719995468877692e-10,
+ "grad_condition": 59504120268.59434,
+ "lr": 0.0009455032620941839,
+ "time_sec": 124.29389190673828
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.3248897048950194,
+ "train_acc": 0.10296,
+ "test_loss": 2.302912854766846,
+ "test_acc": 0.1,
+ "lyapunov": 2.9764596306149613,
+ "grad_norm": 0.6322085012676749,
+ "grad_max_sv": 0.053145987424068154,
+ "grad_min_sv": 3.2089368939156336e-11,
+ "grad_condition": 21592510035.150898,
+ "lr": 0.0009381533400219318,
+ "time_sec": 124.22647547721863
+ },
+ {
+ "epoch": 17,
+ "train_loss": 4.330915478057861,
+ "train_acc": 0.09936,
+ "test_loss": 2.3026626167297364,
+ "test_acc": 0.1,
+ "lyapunov": 2.493599863613353,
+ "grad_norm": 0.20813626461361764,
+ "grad_max_sv": 0.0220638582482934,
+ "grad_min_sv": 5.079951297939575e-13,
+ "grad_condition": 7528215997.404785,
+ "lr": 0.0009303710135019719,
+ "time_sec": 124.25075626373291
+ },
+ {
+ "epoch": 18,
+ "train_loss": 4.329695655975342,
+ "train_acc": 0.09802,
+ "test_loss": 2.3026026527404784,
+ "test_acc": 0.1,
+ "lyapunov": 2.4943465003577034,
+ "grad_norm": 0.28764831256555634,
+ "grad_max_sv": 0.00430559329688549,
+ "grad_min_sv": 1.0630859058082507e-17,
+ "grad_condition": 4303763188.890272,
+ "lr": 0.0009221639627510076,
+ "time_sec": 124.26908159255981
+ },
+ {
+ "epoch": 19,
+ "train_loss": 4.449291636352539,
+ "train_acc": 0.09546,
+ "test_loss": 2.3025916465759275,
+ "test_acc": 0.1,
+ "lyapunov": 2.5493475122524956,
+ "grad_norm": 0.286977076303005,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000913540287137281,
+ "time_sec": 124.22392654418945
+ },
+ {
+ "epoch": 20,
+ "train_loss": 4.275282980957031,
+ "train_acc": 0.09758,
+ "test_loss": 2.3025943778991698,
+ "test_acc": 0.1,
+ "lyapunov": 2.4641005602639043,
+ "grad_norm": 0.11226214403634883,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0009045084971874739,
+ "time_sec": 124.30651044845581
+ },
+ {
+ "epoch": 21,
+ "train_loss": 4.299091949005127,
+ "train_acc": 0.09792,
+ "test_loss": 2.30259245262146,
+ "test_acc": 0.1,
+ "lyapunov": 2.477661563917194,
+ "grad_norm": 0.12888554972749486,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008950775061878452,
+ "time_sec": 124.23446798324585
+ },
+ {
+ "epoch": 22,
+ "train_loss": 4.315002240905762,
+ "train_acc": 0.0975,
+ "test_loss": 2.3025940551757813,
+ "test_acc": 0.1,
+ "lyapunov": 2.4848342008907776,
+ "grad_norm": 0.13926908971905202,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008852566213878947,
+ "time_sec": 124.30266809463501
+ },
+ {
+ "epoch": 23,
+ "train_loss": 4.362473590087891,
+ "train_acc": 0.09968,
+ "test_loss": 2.3025879684448243,
+ "test_acc": 0.1,
+ "lyapunov": 2.508172784619929,
+ "grad_norm": 0.25147158848993745,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008750555348152298,
+ "time_sec": 124.24051856994629
+ },
+ {
+ "epoch": 24,
+ "train_loss": 4.361022654266358,
+ "train_acc": 0.09674,
+ "test_loss": 2.3025897010803225,
+ "test_acc": 0.1,
+ "lyapunov": 2.5060998808087596,
+ "grad_norm": 0.25289701667178555,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008644843137107057,
+ "time_sec": 124.22614932060242
+ },
+ {
+ "epoch": 25,
+ "train_loss": 4.292231715545654,
+ "train_acc": 0.098,
+ "test_loss": 2.3025892387390137,
+ "test_acc": 0.1,
+ "lyapunov": 2.4726591543163483,
+ "grad_norm": 0.15846202884892668,
+ "grad_max_sv": 0.007139207795262337,
+ "grad_min_sv": 1.1884213096035809e-14,
+ "grad_condition": 5768863374.104107,
+ "lr": 0.0008535533905932737,
+ "time_sec": 124.29175138473511
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.278334856414795,
+ "train_acc": 0.09952,
+ "test_loss": 2.302597050857544,
+ "test_acc": 0.1,
+ "lyapunov": 2.46608062229498,
+ "grad_norm": 0.09871518957397614,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008422735529643444,
+ "time_sec": 124.22811436653137
+ },
+ {
+ "epoch": 27,
+ "train_loss": 4.279530144348144,
+ "train_acc": 0.09882,
+ "test_loss": 2.3025887565612795,
+ "test_acc": 0.1,
+ "lyapunov": 2.466456468757766,
+ "grad_norm": 0.09728576577451334,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008306559326618259,
+ "time_sec": 124.25813937187195
+ },
+ {
+ "epoch": 28,
+ "train_loss": 4.276873157348633,
+ "train_acc": 0.0965,
+ "test_loss": 2.302586852264404,
+ "test_acc": 0.1,
+ "lyapunov": 2.4651820092554897,
+ "grad_norm": 0.09336828927700111,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008187119948743449,
+ "time_sec": 124.22499465942383
+ },
+ {
+ "epoch": 29,
+ "train_loss": 4.274294167022705,
+ "train_acc": 0.09674,
+ "test_loss": 2.302587184906006,
+ "test_acc": 0.1,
+ "lyapunov": 2.4635079608244053,
+ "grad_norm": 0.08132883703681491,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008064535268264883,
+ "time_sec": 124.26223015785217
+ },
+ {
+ "epoch": 30,
+ "train_loss": 4.3161706869506835,
+ "train_acc": 0.09742,
+ "test_loss": 2.302589612197876,
+ "test_acc": 0.1,
+ "lyapunov": 2.4838878163291365,
+ "grad_norm": 0.1244076499240839,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007938926261462367,
+ "time_sec": 124.22068643569946
+ },
+ {
+ "epoch": 31,
+ "train_loss": 4.2865172996520995,
+ "train_acc": 0.09864,
+ "test_loss": 2.3025933723449707,
+ "test_acc": 0.1,
+ "lyapunov": 2.4704265179841416,
+ "grad_norm": 0.11325710428703713,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007810416889260654,
+ "time_sec": 124.27307343482971
+ },
+ {
+ "epoch": 32,
+ "train_loss": 4.276113499755859,
+ "train_acc": 0.09876,
+ "test_loss": 2.302595587158203,
+ "test_acc": 0.1,
+ "lyapunov": 2.464605447276474,
+ "grad_norm": 0.11188150655123451,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007679133974894983,
+ "time_sec": 124.21617436408997
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.390245020904541,
+ "train_acc": 0.09734,
+ "test_loss": 2.302589817047119,
+ "test_acc": 0.1,
+ "lyapunov": 2.5185477038478608,
+ "grad_norm": 0.2703519117597579,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007545207078751857,
+ "time_sec": 124.22293186187744
+ },
+ {
+ "epoch": 34,
+ "train_loss": 4.350401836242676,
+ "train_acc": 0.09758,
+ "test_loss": 2.302588123321533,
+ "test_acc": 0.1,
+ "lyapunov": 2.4999206596628176,
+ "grad_norm": 0.21853702579717843,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007408768370508577,
+ "time_sec": 124.26609373092651
+ },
+ {
+ "epoch": 35,
+ "train_loss": 4.305715147399902,
+ "train_acc": 0.09856,
+ "test_loss": 2.302589534378052,
+ "test_acc": 0.1,
+ "lyapunov": 2.4810556158080432,
+ "grad_norm": 0.17605927419881373,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007269952498697734,
+ "time_sec": 124.22794723510742
+ },
+ {
+ "epoch": 36,
+ "train_loss": 4.305906265258789,
+ "train_acc": 0.09718,
+ "test_loss": 2.302591007232666,
+ "test_acc": 0.1,
+ "lyapunov": 2.477643119709571,
+ "grad_norm": 0.1236420897514881,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007128896457825364,
+ "time_sec": 124.26314496994019
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.27584158996582,
+ "train_acc": 0.0968,
+ "test_loss": 2.302587622451782,
+ "test_acc": 0.1,
+ "lyapunov": 2.464479011038075,
+ "grad_norm": 0.09532844351778941,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006985739453173903,
+ "time_sec": 124.25255799293518
+ },
+ {
+ "epoch": 38,
+ "train_loss": 4.283268468475342,
+ "train_acc": 0.097,
+ "test_loss": 2.302587129211426,
+ "test_acc": 0.1,
+ "lyapunov": 2.4685643030249556,
+ "grad_norm": 0.12053745808537034,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006840622763423391,
+ "time_sec": 124.26603984832764
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.340071802978516,
+ "train_acc": 0.09756,
+ "test_loss": 2.302587187576294,
+ "test_acc": 0.1,
+ "lyapunov": 2.496372491807279,
+ "grad_norm": 0.2265015040889252,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006693689601226458,
+ "time_sec": 124.26093554496765
+ },
+ {
+ "epoch": 40,
+ "train_loss": 4.285524172973632,
+ "train_acc": 0.0976,
+ "test_loss": 2.302589253234863,
+ "test_acc": 0.1,
+ "lyapunov": 2.4703913722806576,
+ "grad_norm": 0.12837922155849044,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006545084971874737,
+ "time_sec": 124.23279547691345
+ },
+ {
+ "epoch": 41,
+ "train_loss": 4.353975823822021,
+ "train_acc": 0.0984,
+ "test_loss": 2.3025891468048094,
+ "test_acc": 0.1,
+ "lyapunov": 2.502122705854723,
+ "grad_norm": 0.31834434179235455,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006394955530196147,
+ "time_sec": 124.27406620979309
+ },
+ {
+ "epoch": 42,
+ "train_loss": 4.285235863494873,
+ "train_acc": 0.0975,
+ "test_loss": 2.3025873653411866,
+ "test_acc": 0.1,
+ "lyapunov": 2.4699011251444705,
+ "grad_norm": 0.16460675806479913,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006243449435824273,
+ "time_sec": 124.23745155334473
+ },
+ {
+ "epoch": 43,
+ "train_loss": 4.273813045043945,
+ "train_acc": 0.09694,
+ "test_loss": 2.3025889190673827,
+ "test_acc": 0.1,
+ "lyapunov": 2.463189967148139,
+ "grad_norm": 0.09609475828794435,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006090716206982714,
+ "time_sec": 124.27437806129456
+ },
+ {
+ "epoch": 44,
+ "train_loss": 4.297922962646484,
+ "train_acc": 0.09686,
+ "test_loss": 2.3025868633270266,
+ "test_acc": 0.1,
+ "lyapunov": 2.474009756541923,
+ "grad_norm": 0.14502465560049782,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005936906572928625,
+ "time_sec": 124.22268414497375
+ },
+ {
+ "epoch": 45,
+ "train_loss": 4.279574555053711,
+ "train_acc": 0.09652,
+ "test_loss": 2.3025878047943116,
+ "test_acc": 0.1,
+ "lyapunov": 2.4667322599064665,
+ "grad_norm": 0.12003136414158579,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005782172325201156,
+ "time_sec": 124.28323554992676
+ },
+ {
+ "epoch": 46,
+ "train_loss": 4.273971158905029,
+ "train_acc": 0.0966,
+ "test_loss": 2.302587424468994,
+ "test_acc": 0.1,
+ "lyapunov": 2.463305209908644,
+ "grad_norm": 0.09172584937965118,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005626666167821523,
+ "time_sec": 124.20362710952759
+ },
+ {
+ "epoch": 47,
+ "train_loss": 4.313593041381836,
+ "train_acc": 0.09574,
+ "test_loss": 2.302586856460571,
+ "test_acc": 0.1,
+ "lyapunov": 2.4801262095761114,
+ "grad_norm": 0.15167690922053198,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005470541566592572,
+ "time_sec": 124.29144883155823
+ },
+ {
+ "epoch": 48,
+ "train_loss": 4.295382699737549,
+ "train_acc": 0.09748,
+ "test_loss": 2.302586772155762,
+ "test_acc": 0.1,
+ "lyapunov": 2.4740971671345897,
+ "grad_norm": 0.10879569327624422,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005313952597646569,
+ "time_sec": 124.23017454147339
+ },
+ {
+ "epoch": 49,
+ "train_loss": 4.2751529647827144,
+ "train_acc": 0.09936,
+ "test_loss": 2.3025859580993653,
+ "test_acc": 0.1,
+ "lyapunov": 2.4640432062661253,
+ "grad_norm": 0.10568439425734225,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005157053795390643,
+ "time_sec": 124.25622701644897
+ },
+ {
+ "epoch": 50,
+ "train_loss": 4.273743729553223,
+ "train_acc": 0.0957,
+ "test_loss": 2.3025863090515135,
+ "test_acc": 0.1,
+ "lyapunov": 2.4630955387564266,
+ "grad_norm": 0.11615112587060138,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005000000000000002,
+ "time_sec": 124.27268052101135
+ },
+ {
+ "epoch": 51,
+ "train_loss": 4.280425806427002,
+ "train_acc": 0.09628,
+ "test_loss": 2.302586248397827,
+ "test_acc": 0.1,
+ "lyapunov": 2.466461474938161,
+ "grad_norm": 0.10654878565362114,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00048429462046093607,
+ "time_sec": 124.24109268188477
+ },
+ {
+ "epoch": 52,
+ "train_loss": 4.279801727294922,
+ "train_acc": 0.09702,
+ "test_loss": 2.3025866828918455,
+ "test_acc": 0.1,
+ "lyapunov": 2.4669952484043054,
+ "grad_norm": 0.130514829251149,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004686047402353435,
+ "time_sec": 124.26980781555176
+ },
+ {
+ "epoch": 53,
+ "train_loss": 4.315970222320557,
+ "train_acc": 0.09704,
+ "test_loss": 2.3025870681762695,
+ "test_acc": 0.1,
+ "lyapunov": 2.484521316445392,
+ "grad_norm": 0.1939414239261272,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000452945843340743,
+ "time_sec": 124.22718167304993
+ },
+ {
+ "epoch": 54,
+ "train_loss": 4.311761430969239,
+ "train_acc": 0.09862,
+ "test_loss": 2.3025857872009277,
+ "test_acc": 0.1,
+ "lyapunov": 2.482763496506245,
+ "grad_norm": 0.18263667447361673,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00043733338321784806,
+ "time_sec": 124.2686333656311
+ },
+ {
+ "epoch": 55,
+ "train_loss": 4.277025068054199,
+ "train_acc": 0.09778,
+ "test_loss": 2.3025857639312743,
+ "test_acc": 0.1,
+ "lyapunov": 2.465040735576464,
+ "grad_norm": 0.09424723224869033,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004217827674798847,
+ "time_sec": 124.23272252082825
+ },
+ {
+ "epoch": 56,
+ "train_loss": 4.308205063934326,
+ "train_acc": 0.0989,
+ "test_loss": 2.3025861671447756,
+ "test_acc": 0.1,
+ "lyapunov": 2.4804823679082535,
+ "grad_norm": 0.20788469844558666,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00040630934270713783,
+ "time_sec": 124.45265817642212
+ },
+ {
+ "epoch": 57,
+ "train_loss": 4.282971714477539,
+ "train_acc": 0.09876,
+ "test_loss": 2.3025856742858886,
+ "test_acc": 0.1,
+ "lyapunov": 2.4687917086169544,
+ "grad_norm": 0.1374470775631024,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000390928379301729,
+ "time_sec": 124.2466242313385
+ },
+ {
+ "epoch": 58,
+ "train_loss": 4.311033409729004,
+ "train_acc": 0.09662,
+ "test_loss": 2.302585438156128,
+ "test_acc": 0.1,
+ "lyapunov": 2.4805221582007837,
+ "grad_norm": 0.15017627742331574,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003756550564175727,
+ "time_sec": 124.22827982902527
+ },
+ {
+ "epoch": 59,
+ "train_loss": 4.29637522354126,
+ "train_acc": 0.09756,
+ "test_loss": 2.302585637664795,
+ "test_acc": 0.1,
+ "lyapunov": 2.4749210880845403,
+ "grad_norm": 0.1570135955415664,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036050444698038553,
+ "time_sec": 124.30038142204285
+ },
+ {
+ "epoch": 60,
+ "train_loss": 4.307900915527344,
+ "train_acc": 0.09804,
+ "test_loss": 2.302586008834839,
+ "test_acc": 0.1,
+ "lyapunov": 2.4804043434465024,
+ "grad_norm": 0.21537262268091628,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00034549150281252655,
+ "time_sec": 124.21648406982422
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.294828899230957,
+ "train_acc": 0.09696,
+ "test_loss": 2.302585659408569,
+ "test_acc": 0.1,
+ "lyapunov": 2.474180576441538,
+ "grad_norm": 0.15175328138376964,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003306310398773544,
+ "time_sec": 124.26800394058228
+ },
+ {
+ "epoch": 62,
+ "train_loss": 4.27745719039917,
+ "train_acc": 0.09794,
+ "test_loss": 2.302585639190674,
+ "test_acc": 0.1,
+ "lyapunov": 2.465500669406198,
+ "grad_norm": 0.10570315629890674,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00031593772365766127,
+ "time_sec": 124.23925018310547
+ },
+ {
+ "epoch": 63,
+ "train_loss": 4.2727640603637695,
+ "train_acc": 0.09586,
+ "test_loss": 2.3025855934143067,
+ "test_acc": 0.1,
+ "lyapunov": 2.4626387360760624,
+ "grad_norm": 0.0890330369346984,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003014260546826097,
+ "time_sec": 124.27016854286194
+ },
+ {
+ "epoch": 64,
+ "train_loss": 4.272457419738769,
+ "train_acc": 0.09604,
+ "test_loss": 2.3025855697631834,
+ "test_acc": 0.1,
+ "lyapunov": 2.4623735072972526,
+ "grad_norm": 0.0847950891199477,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002871103542174637,
+ "time_sec": 124.20920252799988
+ },
+ {
+ "epoch": 65,
+ "train_loss": 4.273480668334961,
+ "train_acc": 0.09808,
+ "test_loss": 2.302585276031494,
+ "test_acc": 0.1,
+ "lyapunov": 2.4630366255865073,
+ "grad_norm": 0.08372012214032937,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002730047501302267,
+ "time_sec": 124.22656655311584
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.307428127746582,
+ "train_acc": 0.09712,
+ "test_loss": 2.302585486602783,
+ "test_acc": 0.1,
+ "lyapunov": 2.4764473944368874,
+ "grad_norm": 0.12238051774317063,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00025912316294914234,
+ "time_sec": 124.28961944580078
+ },
+ {
+ "epoch": 67,
+ "train_loss": 4.310281341094971,
+ "train_acc": 0.09792,
+ "test_loss": 2.3025853305816653,
+ "test_acc": 0.1,
+ "lyapunov": 2.480989251295319,
+ "grad_norm": 0.27019424894200594,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002454792921248144,
+ "time_sec": 124.25288558006287
+ },
+ {
+ "epoch": 68,
+ "train_loss": 4.282535659484863,
+ "train_acc": 0.09756,
+ "test_loss": 2.3025853900909423,
+ "test_acc": 0.1,
+ "lyapunov": 2.4676397261412246,
+ "grad_norm": 0.1281762106524609,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00023208660251050164,
+ "time_sec": 124.26717019081116
+ },
+ {
+ "epoch": 69,
+ "train_loss": 4.276787458190918,
+ "train_acc": 0.09688,
+ "test_loss": 2.3025852905273436,
+ "test_acc": 0.1,
+ "lyapunov": 2.4651669858361753,
+ "grad_norm": 0.08124252440804115,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00021895831107393473,
+ "time_sec": 124.23096060752869
+ },
+ {
+ "epoch": 70,
+ "train_loss": 4.28195741897583,
+ "train_acc": 0.09668,
+ "test_loss": 2.302585355377197,
+ "test_acc": 0.1,
+ "lyapunov": 2.468135183729479,
+ "grad_norm": 0.11112746909721634,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376356,
+ "time_sec": 124.27119207382202
+ },
+ {
+ "epoch": 71,
+ "train_loss": 4.284729679412842,
+ "train_acc": 0.09706,
+ "test_loss": 2.302585294342041,
+ "test_acc": 0.1,
+ "lyapunov": 2.469655635716665,
+ "grad_norm": 0.12307199730963861,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019354647317351177,
+ "time_sec": 124.23093914985657
+ },
+ {
+ "epoch": 72,
+ "train_loss": 4.276600415039063,
+ "train_acc": 0.09806,
+ "test_loss": 2.3025852252960206,
+ "test_acc": 0.1,
+ "lyapunov": 2.464849721440269,
+ "grad_norm": 0.12908363321506647,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001812880051256552,
+ "time_sec": 124.25842094421387
+ },
+ {
+ "epoch": 73,
+ "train_loss": 4.3069706353759765,
+ "train_acc": 0.09654,
+ "test_loss": 2.3025852447509765,
+ "test_acc": 0.1,
+ "lyapunov": 2.479751230810609,
+ "grad_norm": 0.183601868909449,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016934406733817422,
+ "time_sec": 124.21842932701111
+ },
+ {
+ "epoch": 74,
+ "train_loss": 4.287112475280762,
+ "train_acc": 0.09722,
+ "test_loss": 2.302585179901123,
+ "test_acc": 0.1,
+ "lyapunov": 2.4702408582048343,
+ "grad_norm": 0.1331148526919891,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001577264470356557,
+ "time_sec": 124.22039604187012
+ },
+ {
+ "epoch": 75,
+ "train_loss": 4.271034491882324,
+ "train_acc": 0.09664,
+ "test_loss": 2.3025851165771485,
+ "test_acc": 0.1,
+ "lyapunov": 2.461448823704439,
+ "grad_norm": 0.08255701875769623,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014644660940672634,
+ "time_sec": 124.30420184135437
+ },
+ {
+ "epoch": 76,
+ "train_loss": 4.272865072021484,
+ "train_acc": 0.09542,
+ "test_loss": 2.302585235977173,
+ "test_acc": 0.1,
+ "lyapunov": 2.462638800101512,
+ "grad_norm": 0.08790859271963604,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001355156862892944,
+ "time_sec": 124.23553800582886
+ },
+ {
+ "epoch": 77,
+ "train_loss": 4.271533363189698,
+ "train_acc": 0.09712,
+ "test_loss": 2.3025852149963377,
+ "test_acc": 0.1,
+ "lyapunov": 2.4617462914313197,
+ "grad_norm": 0.08471091537010327,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012494446518477025,
+ "time_sec": 124.25954508781433
+ },
+ {
+ "epoch": 78,
+ "train_loss": 4.290692696685791,
+ "train_acc": 0.09754,
+ "test_loss": 2.302585163116455,
+ "test_acc": 0.1,
+ "lyapunov": 2.470475591357102,
+ "grad_norm": 0.10652401748252295,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210548,
+ "time_sec": 124.22494149208069
+ },
+ {
+ "epoch": 79,
+ "train_loss": 4.274790961608887,
+ "train_acc": 0.09758,
+ "test_loss": 2.302585228347778,
+ "test_acc": 0.1,
+ "lyapunov": 2.4638520756645885,
+ "grad_norm": 0.08078835262733591,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010492249381215483,
+ "time_sec": 124.29019331932068
+ },
+ {
+ "epoch": 80,
+ "train_loss": 4.272836723175049,
+ "train_acc": 0.09616,
+ "test_loss": 2.3025851444244383,
+ "test_acc": 0.1,
+ "lyapunov": 2.462624883407827,
+ "grad_norm": 0.08161990901444113,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 124.22851657867432
+ },
+ {
+ "epoch": 81,
+ "train_loss": 4.39987655090332,
+ "train_acc": 0.0985,
+ "test_loss": 2.302585282897949,
+ "test_acc": 0.1,
+ "lyapunov": 2.5367127757548067,
+ "grad_norm": 0.6635822194594717,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 124.23617506027222
+ },
+ {
+ "epoch": 82,
+ "train_loss": 4.297471022949218,
+ "train_acc": 0.0953,
+ "test_loss": 2.3025852149963377,
+ "test_acc": 0.1,
+ "lyapunov": 2.475090144540343,
+ "grad_norm": 0.729945935366233,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 124.25805640220642
+ },
+ {
+ "epoch": 83,
+ "train_loss": 4.269278663024902,
+ "train_acc": 0.09916,
+ "test_loss": 2.3025850776672363,
+ "test_acc": 0.1,
+ "lyapunov": 2.4603407303695484,
+ "grad_norm": 0.09631779246548546,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 124.23541116714478
+ },
+ {
+ "epoch": 84,
+ "train_loss": 4.2767918655395505,
+ "train_acc": 0.09902,
+ "test_loss": 2.3025851837158204,
+ "test_acc": 0.1,
+ "lyapunov": 2.464642455815659,
+ "grad_norm": 0.15914456443799777,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 124.2600998878479
+ },
+ {
+ "epoch": 85,
+ "train_loss": 4.275007407989502,
+ "train_acc": 0.09774,
+ "test_loss": 2.302585231781006,
+ "test_acc": 0.1,
+ "lyapunov": 2.4639958829221213,
+ "grad_norm": 0.08948000358835351,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 124.19096970558167
+ },
+ {
+ "epoch": 86,
+ "train_loss": 4.282883452606201,
+ "train_acc": 0.0984,
+ "test_loss": 2.3025849563598633,
+ "test_acc": 0.1,
+ "lyapunov": 2.46685717294893,
+ "grad_norm": 0.20955582940776452,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 124.28308463096619
+ },
+ {
+ "epoch": 87,
+ "train_loss": 4.273255398712158,
+ "train_acc": 0.09732,
+ "test_loss": 2.3025850818634033,
+ "test_acc": 0.1,
+ "lyapunov": 2.4628877334887416,
+ "grad_norm": 0.08251896757547691,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 124.24707794189453
+ },
+ {
+ "epoch": 88,
+ "train_loss": 4.27318275390625,
+ "train_acc": 0.09818,
+ "test_loss": 2.3025852210998536,
+ "test_acc": 0.1,
+ "lyapunov": 2.462852593273153,
+ "grad_norm": 0.08488796189115587,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 124.27159857749939
+ },
+ {
+ "epoch": 89,
+ "train_loss": 4.274446720886231,
+ "train_acc": 0.0964,
+ "test_loss": 2.3025852279663086,
+ "test_acc": 0.1,
+ "lyapunov": 2.463662301792818,
+ "grad_norm": 0.08254333748035417,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 124.20991706848145
+ },
+ {
+ "epoch": 90,
+ "train_loss": 4.282081894989013,
+ "train_acc": 0.09898,
+ "test_loss": 2.302585124206543,
+ "test_acc": 0.1,
+ "lyapunov": 2.4669584868204257,
+ "grad_norm": 0.11057422059552115,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 124.23175573348999
+ },
+ {
+ "epoch": 91,
+ "train_loss": 4.270762037200928,
+ "train_acc": 0.09742,
+ "test_loss": 2.302585070037842,
+ "test_acc": 0.1,
+ "lyapunov": 2.4613021468872303,
+ "grad_norm": 0.08094752788352252,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 124.28751397132874
+ },
+ {
+ "epoch": 92,
+ "train_loss": 4.2731778295898435,
+ "train_acc": 0.0967,
+ "test_loss": 2.3025849838256836,
+ "test_acc": 0.1,
+ "lyapunov": 2.4628693057448054,
+ "grad_norm": 0.08218150011851272,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 124.20022916793823
+ },
+ {
+ "epoch": 93,
+ "train_loss": 4.271317660827637,
+ "train_acc": 0.09598,
+ "test_loss": 2.302585059738159,
+ "test_acc": 0.1,
+ "lyapunov": 2.461685863602192,
+ "grad_norm": 0.09351987385512874,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 124.32517552375793
+ },
+ {
+ "epoch": 94,
+ "train_loss": 4.271005298614502,
+ "train_acc": 0.09678,
+ "test_loss": 2.3025850238800047,
+ "test_acc": 0.1,
+ "lyapunov": 2.461446201100069,
+ "grad_norm": 0.08051510852574385,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 124.25493431091309
+ },
+ {
+ "epoch": 95,
+ "train_loss": 4.272550579528809,
+ "train_acc": 0.0975,
+ "test_loss": 2.302585118865967,
+ "test_acc": 0.1,
+ "lyapunov": 2.462437502258574,
+ "grad_norm": 0.08133134154526532,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 124.2907202243805
+ },
+ {
+ "epoch": 96,
+ "train_loss": 4.27599407836914,
+ "train_acc": 0.09808,
+ "test_loss": 2.302585164642334,
+ "test_acc": 0.1,
+ "lyapunov": 2.464714573472357,
+ "grad_norm": 0.08129994421530186,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 124.2441520690918
+ },
+ {
+ "epoch": 97,
+ "train_loss": 4.27250137512207,
+ "train_acc": 0.1,
+ "test_loss": 2.3025850723266603,
+ "test_acc": 0.1,
+ "lyapunov": 2.462406137105449,
+ "grad_norm": 0.08085760651650271,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 124.25383496284485
+ },
+ {
+ "epoch": 98,
+ "train_loss": 4.272909243469238,
+ "train_acc": 0.1,
+ "test_loss": 2.30258510017395,
+ "test_acc": 0.1,
+ "lyapunov": 2.462700468195064,
+ "grad_norm": 0.08430371763203995,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 124.2897834777832
+ },
+ {
+ "epoch": 99,
+ "train_loss": 4.27265819152832,
+ "train_acc": 0.1,
+ "test_loss": 2.302585132598877,
+ "test_acc": 0.1,
+ "lyapunov": 2.462563226290066,
+ "grad_norm": 0.08009730488173318,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.467198171342e-07,
+ "time_sec": 124.25932240486145
+ },
+ {
+ "epoch": 100,
+ "train_loss": 4.272679078521729,
+ "train_acc": 0.1,
+ "test_loss": 2.302585071182251,
+ "test_acc": 0.1,
+ "lyapunov": 2.462542835708774,
+ "grad_norm": 0.08019670403901732,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 124.30135154724121
+ }
+ ],
+ "16": [
+ {
+ "epoch": 1,
+ "train_loss": 11.842812671203614,
+ "train_acc": 0.14506,
+ "test_loss": 2.34111376953125,
+ "test_acc": 0.1088,
+ "lyapunov": 5.111980842507404,
+ "grad_norm": 6.803328171635302,
+ "grad_max_sv": 5.664273583889008,
+ "grad_min_sv": 2.45656453401466e-07,
+ "grad_condition": 23556170.622745253,
+ "lr": 0.0009997532801828658,
+ "time_sec": 167.03577542304993
+ },
+ {
+ "epoch": 2,
+ "train_loss": 6.864391835327148,
+ "train_acc": 0.1532,
+ "test_loss": 2.3584522315979,
+ "test_acc": 0.1126,
+ "lyapunov": 3.7626322760911246,
+ "grad_norm": 5.449127371208671,
+ "grad_max_sv": 4.509619396924973,
+ "grad_min_sv": 1.816841066926145e-07,
+ "grad_condition": 25473679.781934455,
+ "lr": 0.0009990133642141358,
+ "time_sec": 167.0620617866516
+ },
+ {
+ "epoch": 3,
+ "train_loss": 6.632632642822266,
+ "train_acc": 0.16122,
+ "test_loss": 2.358525146102905,
+ "test_acc": 0.1,
+ "lyapunov": 3.702555048496217,
+ "grad_norm": 3.996691628576675,
+ "grad_max_sv": 3.4047091096639632,
+ "grad_min_sv": 1.1248512699069124e-07,
+ "grad_condition": 30963953.097301744,
+ "lr": 0.00099778098230154,
+ "time_sec": 167.01362991333008
+ },
+ {
+ "epoch": 4,
+ "train_loss": 6.508619455108643,
+ "train_acc": 0.15906,
+ "test_loss": 2.3301877449035646,
+ "test_acc": 0.1,
+ "lyapunov": 3.647035371312095,
+ "grad_norm": 3.2655343849407332,
+ "grad_max_sv": 3.0296140223741532,
+ "grad_min_sv": 9.594998209294659e-08,
+ "grad_condition": 32002571.000903092,
+ "lr": 0.000996057350657239,
+ "time_sec": 166.97752714157104
+ },
+ {
+ "epoch": 5,
+ "train_loss": 5.912459800109863,
+ "train_acc": 0.13794,
+ "test_loss": 2.3143163734436034,
+ "test_acc": 0.1,
+ "lyapunov": 3.364570482917454,
+ "grad_norm": 2.882730301769821,
+ "grad_max_sv": 2.836460363864899,
+ "grad_min_sv": 8.620691849259288e-08,
+ "grad_condition": 34084982.42197102,
+ "lr": 0.0009938441702975688,
+ "time_sec": 167.01780152320862
+ },
+ {
+ "epoch": 6,
+ "train_loss": 5.365990347290039,
+ "train_acc": 0.12352,
+ "test_loss": 2.307030549240112,
+ "test_acc": 0.1,
+ "lyapunov": 3.0800778951181473,
+ "grad_norm": 2.6661229845796357,
+ "grad_max_sv": 1.9664998756031884,
+ "grad_min_sv": 4.7012965353151585e-08,
+ "grad_condition": 714227055.0495954,
+ "lr": 0.0009911436253643444,
+ "time_sec": 166.95626974105835
+ },
+ {
+ "epoch": 7,
+ "train_loss": 5.098499784545899,
+ "train_acc": 0.11974,
+ "test_loss": 2.306401748275757,
+ "test_acc": 0.1,
+ "lyapunov": 2.9394846096672973,
+ "grad_norm": 2.0425554711132987,
+ "grad_max_sv": 1.3562358289975485,
+ "grad_min_sv": 3.416944161021407e-08,
+ "grad_condition": 430074872.43269414,
+ "lr": 0.0009879583809693736,
+ "time_sec": 167.02987694740295
+ },
+ {
+ "epoch": 8,
+ "train_loss": 4.836283032226563,
+ "train_acc": 0.1193,
+ "test_loss": 2.3056865058898928,
+ "test_acc": 0.1,
+ "lyapunov": 2.8134650903589584,
+ "grad_norm": 1.9015682902174655,
+ "grad_max_sv": 1.3965314358472825,
+ "grad_min_sv": 2.998794566512128e-08,
+ "grad_condition": 984527791.9432541,
+ "lr": 0.0009842915805643154,
+ "time_sec": 166.99379587173462
+ },
+ {
+ "epoch": 9,
+ "train_loss": 4.799866871795654,
+ "train_acc": 0.11898,
+ "test_loss": 2.3078849700927733,
+ "test_acc": 0.1,
+ "lyapunov": 2.7906805755537185,
+ "grad_norm": 1.830247256824178,
+ "grad_max_sv": 1.0446476072072983,
+ "grad_min_sv": 2.2101311034875437e-08,
+ "grad_condition": 6442199712.909399,
+ "lr": 0.0009801468428384714,
+ "time_sec": 167.04091095924377
+ },
+ {
+ "epoch": 10,
+ "train_loss": 4.8418486264038085,
+ "train_acc": 0.1198,
+ "test_loss": 2.306636996841431,
+ "test_acc": 0.1,
+ "lyapunov": 2.8099952402627073,
+ "grad_norm": 2.137959073318514,
+ "grad_max_sv": 0.7742668629978022,
+ "grad_min_sv": 1.0732185378244782e-08,
+ "grad_condition": 12825727231.027037,
+ "lr": 0.0009755282581475767,
+ "time_sec": 167.01724100112915
+ },
+ {
+ "epoch": 11,
+ "train_loss": 4.899544752502441,
+ "train_acc": 0.11034,
+ "test_loss": 2.303115463256836,
+ "test_acc": 0.1,
+ "lyapunov": 2.8371418083415314,
+ "grad_norm": 1.6003418244695304,
+ "grad_max_sv": 0.6158522295280715,
+ "grad_min_sv": 3.796369944507449e-09,
+ "grad_condition": 6480545635.210354,
+ "lr": 0.0009704403844771127,
+ "time_sec": 167.04382944107056
+ },
+ {
+ "epoch": 12,
+ "train_loss": 4.951635014648438,
+ "train_acc": 0.10792,
+ "test_loss": 2.3031677284240724,
+ "test_acc": 0.1,
+ "lyapunov": 2.866735147393268,
+ "grad_norm": 2.666838044816494,
+ "grad_max_sv": 0.5319730836898089,
+ "grad_min_sv": 3.372458990007535e-10,
+ "grad_condition": 39511669967.92405,
+ "lr": 0.0009648882429441257,
+ "time_sec": 166.9957308769226
+ },
+ {
+ "epoch": 13,
+ "train_loss": 6.152256243286133,
+ "train_acc": 0.10692,
+ "test_loss": 2.303246379852295,
+ "test_acc": 0.1,
+ "lyapunov": 3.4366153896312275,
+ "grad_norm": 6.342546880123247,
+ "grad_max_sv": 0.2403870326364995,
+ "grad_min_sv": 2.6050612198124816e-10,
+ "grad_condition": 34925794452.094666,
+ "lr": 0.0009588773128419905,
+ "time_sec": 167.01189947128296
+ },
+ {
+ "epoch": 14,
+ "train_loss": 6.052201841888428,
+ "train_acc": 0.10886,
+ "test_loss": 2.3029991958618163,
+ "test_acc": 0.1,
+ "lyapunov": 3.407372230154169,
+ "grad_norm": 3.751884478526656,
+ "grad_max_sv": 0.3085380573000293,
+ "grad_min_sv": 1.7481779514657177e-10,
+ "grad_condition": 69456467004.02864,
+ "lr": 0.0009524135262330098,
+ "time_sec": 166.99195837974548
+ },
+ {
+ "epoch": 15,
+ "train_loss": 6.174399379577637,
+ "train_acc": 0.10784,
+ "test_loss": 2.3030965816497804,
+ "test_acc": 0.1,
+ "lyapunov": 3.468341021891445,
+ "grad_norm": 2.2149403643105514,
+ "grad_max_sv": 0.2665206765946223,
+ "grad_min_sv": 7.174466620587407e-11,
+ "grad_condition": 25279718153.525455,
+ "lr": 0.0009455032620941839,
+ "time_sec": 167.02302026748657
+ },
+ {
+ "epoch": 16,
+ "train_loss": 5.8687522245788575,
+ "train_acc": 0.10852,
+ "test_loss": 2.302928673553467,
+ "test_acc": 0.1,
+ "lyapunov": 3.3205134075925784,
+ "grad_norm": 2.1727798236859517,
+ "grad_max_sv": 0.1694878804436172,
+ "grad_min_sv": 5.284483110394732e-11,
+ "grad_condition": 29825093550.928566,
+ "lr": 0.0009381533400219318,
+ "time_sec": 166.98851919174194
+ },
+ {
+ "epoch": 17,
+ "train_loss": 5.00506268585205,
+ "train_acc": 0.10292,
+ "test_loss": 2.3029050621032714,
+ "test_acc": 0.1,
+ "lyapunov": 2.8923883834458373,
+ "grad_norm": 1.1450970364565718,
+ "grad_max_sv": 0.12666865187754867,
+ "grad_min_sv": 2.4102328364569327e-11,
+ "grad_condition": 25147403549.501667,
+ "lr": 0.0009303710135019719,
+ "time_sec": 167.02036666870117
+ },
+ {
+ "epoch": 18,
+ "train_loss": 4.855449399719238,
+ "train_acc": 0.104,
+ "test_loss": 2.3028139762878417,
+ "test_acc": 0.1,
+ "lyapunov": 2.8120573298705507,
+ "grad_norm": 0.7305556308720836,
+ "grad_max_sv": 0.09714378891512751,
+ "grad_min_sv": 8.150729035001414e-12,
+ "grad_condition": 58264297783.12268,
+ "lr": 0.0009221639627510076,
+ "time_sec": 167.08689284324646
+ },
+ {
+ "epoch": 19,
+ "train_loss": 4.96336449584961,
+ "train_acc": 0.1041,
+ "test_loss": 2.3027950325012205,
+ "test_acc": 0.1,
+ "lyapunov": 2.8725837020922804,
+ "grad_norm": 1.182474133176391,
+ "grad_max_sv": 0.07083241189830006,
+ "grad_min_sv": 7.22405413796021e-12,
+ "grad_condition": 38280733847.458176,
+ "lr": 0.000913540287137281,
+ "time_sec": 167.00970244407654
+ },
+ {
+ "epoch": 20,
+ "train_loss": 4.743826732025147,
+ "train_acc": 0.10382,
+ "test_loss": 2.3027557773590086,
+ "test_acc": 0.1,
+ "lyapunov": 2.7483980515423942,
+ "grad_norm": 0.6554501104680703,
+ "grad_max_sv": 0.05732933725230396,
+ "grad_min_sv": 5.653544739145854e-12,
+ "grad_condition": 35503198727.48572,
+ "lr": 0.0009045084971874739,
+ "time_sec": 167.09380722045898
+ },
+ {
+ "epoch": 21,
+ "train_loss": 4.678205784606933,
+ "train_acc": 0.10294,
+ "test_loss": 3.7050921539306643,
+ "test_acc": 0.1,
+ "lyapunov": 2.712228787219738,
+ "grad_norm": 0.9024618566776086,
+ "grad_max_sv": 0.03976228955434635,
+ "grad_min_sv": 5.291108131013551e-11,
+ "grad_condition": 16349739158.901342,
+ "lr": 0.0008950775061878452,
+ "time_sec": 167.0224826335907
+ },
+ {
+ "epoch": 22,
+ "train_loss": 4.63441824432373,
+ "train_acc": 0.09868,
+ "test_loss": 2.678515822601318,
+ "test_acc": 0.1,
+ "lyapunov": 2.6848394797586113,
+ "grad_norm": 0.9464113383195869,
+ "grad_max_sv": 0.03219134085811674,
+ "grad_min_sv": 3.575371656772674e-11,
+ "grad_condition": 22552839587.69338,
+ "lr": 0.0008852566213878947,
+ "time_sec": 167.0608777999878
+ },
+ {
+ "epoch": 23,
+ "train_loss": 4.728675323486328,
+ "train_acc": 0.09932,
+ "test_loss": 3.68248123626709,
+ "test_acc": 0.1,
+ "lyapunov": 2.732565569450788,
+ "grad_norm": 1.1845032429393016,
+ "grad_max_sv": 0.009998515527695418,
+ "grad_min_sv": 1.095997224005267e-20,
+ "grad_condition": 9998514820.705112,
+ "lr": 0.0008750555348152298,
+ "time_sec": 167.0682075023651
+ },
+ {
+ "epoch": 24,
+ "train_loss": 4.65850959197998,
+ "train_acc": 0.09912,
+ "test_loss": 3.6423350326538086,
+ "test_acc": 0.1,
+ "lyapunov": 2.6980338791752105,
+ "grad_norm": 1.5417542431510867,
+ "grad_max_sv": 0.008353105513378978,
+ "grad_min_sv": 1.9907194983962853e-18,
+ "grad_condition": 8352993676.098096,
+ "lr": 0.0008644843137107057,
+ "time_sec": 167.08017802238464
+ },
+ {
+ "epoch": 25,
+ "train_loss": 4.584089448547363,
+ "train_acc": 0.09784,
+ "test_loss": 2.3033696189880373,
+ "test_acc": 0.1,
+ "lyapunov": 2.653346909891309,
+ "grad_norm": 0.9625814425500707,
+ "grad_max_sv": 0.0027962074615061282,
+ "grad_min_sv": 1.8178542286825737e-15,
+ "grad_condition": 2726213455.6624613,
+ "lr": 0.0008535533905932737,
+ "time_sec": 167.05963444709778
+ },
+ {
+ "epoch": 26,
+ "train_loss": 4.562473741149902,
+ "train_acc": 0.0972,
+ "test_loss": 2.5531665412902833,
+ "test_acc": 0.1,
+ "lyapunov": 2.6440261763989774,
+ "grad_norm": 1.0966601277478685,
+ "grad_max_sv": 0.0009299686178565025,
+ "grad_min_sv": 7.864982908802376e-35,
+ "grad_condition": 929968617.8565025,
+ "lr": 0.0008422735529643444,
+ "time_sec": 167.0820574760437
+ },
+ {
+ "epoch": 27,
+ "train_loss": 4.557928927612305,
+ "train_acc": 0.10072,
+ "test_loss": 2.3032149608612063,
+ "test_acc": 0.1,
+ "lyapunov": 2.640467453490743,
+ "grad_norm": 1.5990578945087282,
+ "grad_max_sv": 0.001147926412522793,
+ "grad_min_sv": 2.0663573730241894e-15,
+ "grad_condition": 1060288974.8907245,
+ "lr": 0.0008306559326618259,
+ "time_sec": 167.0413818359375
+ },
+ {
+ "epoch": 28,
+ "train_loss": 4.533458753051757,
+ "train_acc": 0.09686,
+ "test_loss": 2.303218946838379,
+ "test_acc": 0.1,
+ "lyapunov": 2.6252909279845253,
+ "grad_norm": 0.6753306901464893,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0008187119948743449,
+ "time_sec": 167.0830535888672
+ },
+ {
+ "epoch": 29,
+ "train_loss": 4.496531313171387,
+ "train_acc": 0.09852,
+ "test_loss": 2.3032687267303467,
+ "test_acc": 0.1,
+ "lyapunov": 2.6040675938891633,
+ "grad_norm": 0.18386399798172356,
+ "grad_max_sv": 0.00110331317409873,
+ "grad_min_sv": 7.969612926285099e-35,
+ "grad_condition": 1103313174.09873,
+ "lr": 0.0008064535268264883,
+ "time_sec": 167.04623770713806
+ },
+ {
+ "epoch": 30,
+ "train_loss": 4.504303005065918,
+ "train_acc": 0.0976,
+ "test_loss": 2.303500841522217,
+ "test_acc": 0.1,
+ "lyapunov": 2.6081804003556974,
+ "grad_norm": 0.15236154258308318,
+ "grad_max_sv": 0.0028056097216904163,
+ "grad_min_sv": 0.0,
+ "grad_condition": 2805609721.6904163,
+ "lr": 0.0007938926261462367,
+ "time_sec": 167.02854776382446
+ },
+ {
+ "epoch": 31,
+ "train_loss": 4.50321345703125,
+ "train_acc": 0.09666,
+ "test_loss": 2.3035490158081053,
+ "test_acc": 0.1,
+ "lyapunov": 2.607592426602493,
+ "grad_norm": 0.10039091720588617,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007810416889260654,
+ "time_sec": 167.07999300956726
+ },
+ {
+ "epoch": 32,
+ "train_loss": 4.501663753662109,
+ "train_acc": 0.09806,
+ "test_loss": 2.3034838943481444,
+ "test_acc": 0.1,
+ "lyapunov": 2.607143198437703,
+ "grad_norm": 0.1048906506411198,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007679133974894983,
+ "time_sec": 167.00407528877258
+ },
+ {
+ "epoch": 33,
+ "train_loss": 4.5019655114746095,
+ "train_acc": 0.09498,
+ "test_loss": 2.30348473739624,
+ "test_acc": 0.1,
+ "lyapunov": 2.607365154549289,
+ "grad_norm": 0.09466991605122166,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007545207078751857,
+ "time_sec": 167.04430413246155
+ },
+ {
+ "epoch": 34,
+ "train_loss": 4.4972885162353515,
+ "train_acc": 0.09806,
+ "test_loss": 2.3035587966918945,
+ "test_acc": 0.1,
+ "lyapunov": 2.6045894854513887,
+ "grad_norm": 0.094802640603578,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007408768370508577,
+ "time_sec": 167.01064467430115
+ },
+ {
+ "epoch": 35,
+ "train_loss": 4.496900313110352,
+ "train_acc": 0.09916,
+ "test_loss": 2.3035878532409666,
+ "test_acc": 0.1,
+ "lyapunov": 2.6043496991667294,
+ "grad_norm": 0.08505627865784493,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007269952498697734,
+ "time_sec": 167.04931592941284
+ },
+ {
+ "epoch": 36,
+ "train_loss": 4.498045174407959,
+ "train_acc": 0.09896,
+ "test_loss": 2.303556993865967,
+ "test_acc": 0.1,
+ "lyapunov": 2.6051284626621722,
+ "grad_norm": 0.08865673943824036,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0007128896457825364,
+ "time_sec": 166.99707579612732
+ },
+ {
+ "epoch": 37,
+ "train_loss": 4.494941578521728,
+ "train_acc": 0.09764,
+ "test_loss": 2.3035079292297365,
+ "test_acc": 0.1,
+ "lyapunov": 2.6031092463247,
+ "grad_norm": 0.09732931123675816,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006985739453173903,
+ "time_sec": 167.02038192749023
+ },
+ {
+ "epoch": 38,
+ "train_loss": 4.496269936523437,
+ "train_acc": 0.09764,
+ "test_loss": 2.3035408573150633,
+ "test_acc": 0.1,
+ "lyapunov": 2.604000445217123,
+ "grad_norm": 0.08852073271727623,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006840622763423391,
+ "time_sec": 167.02108144760132
+ },
+ {
+ "epoch": 39,
+ "train_loss": 4.493522086791992,
+ "train_acc": 0.09734,
+ "test_loss": 2.303493659210205,
+ "test_acc": 0.1,
+ "lyapunov": 2.6023181265272446,
+ "grad_norm": 0.08748337786673831,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006693689601226458,
+ "time_sec": 167.05211973190308
+ },
+ {
+ "epoch": 40,
+ "train_loss": 4.498229814758301,
+ "train_acc": 0.09844,
+ "test_loss": 2.3034747520446777,
+ "test_acc": 0.1,
+ "lyapunov": 2.6050954608966017,
+ "grad_norm": 0.10483613599174303,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006545084971874737,
+ "time_sec": 167.01571893692017
+ },
+ {
+ "epoch": 41,
+ "train_loss": 4.498432325286865,
+ "train_acc": 0.09692,
+ "test_loss": 2.3034770004272462,
+ "test_acc": 0.1,
+ "lyapunov": 2.6052994520767876,
+ "grad_norm": 0.09650951998583779,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006394955530196147,
+ "time_sec": 167.06526255607605
+ },
+ {
+ "epoch": 42,
+ "train_loss": 4.496120017395019,
+ "train_acc": 0.09806,
+ "test_loss": 2.303461635971069,
+ "test_acc": 0.1,
+ "lyapunov": 2.6038818706941727,
+ "grad_norm": 0.08793824539769711,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006243449435824273,
+ "time_sec": 167.0240659713745
+ },
+ {
+ "epoch": 43,
+ "train_loss": 4.50342136932373,
+ "train_acc": 0.0968,
+ "test_loss": 3.123962462234497,
+ "test_acc": 0.1,
+ "lyapunov": 2.6082677432643178,
+ "grad_norm": 0.10763460634241757,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0006090716206982714,
+ "time_sec": 167.04283785820007
+ },
+ {
+ "epoch": 44,
+ "train_loss": 4.497545390930176,
+ "train_acc": 0.0993,
+ "test_loss": 2.30349365196228,
+ "test_acc": 0.1,
+ "lyapunov": 2.6048193215714086,
+ "grad_norm": 0.0914051250208073,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005936906572928625,
+ "time_sec": 167.00522899627686
+ },
+ {
+ "epoch": 45,
+ "train_loss": 4.497059263458252,
+ "train_acc": 0.0983,
+ "test_loss": 2.303560007476807,
+ "test_acc": 0.1,
+ "lyapunov": 2.604434971919145,
+ "grad_norm": 0.09665268401606698,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005782172325201156,
+ "time_sec": 166.98798084259033
+ },
+ {
+ "epoch": 46,
+ "train_loss": 4.496945586547851,
+ "train_acc": 0.09766,
+ "test_loss": 2.303540351486206,
+ "test_acc": 0.1,
+ "lyapunov": 2.6044252626121502,
+ "grad_norm": 0.08182959271154387,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005626666167821523,
+ "time_sec": 167.05580401420593
+ },
+ {
+ "epoch": 47,
+ "train_loss": 4.5494916119384765,
+ "train_acc": 0.0975,
+ "test_loss": 2.3035491088867186,
+ "test_acc": 0.1,
+ "lyapunov": 2.6250632187289655,
+ "grad_norm": 0.16118104591565238,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005470541566592572,
+ "time_sec": 167.02027297019958
+ },
+ {
+ "epoch": 48,
+ "train_loss": 4.527786728515625,
+ "train_acc": 0.09808,
+ "test_loss": 2.303548764038086,
+ "test_acc": 0.1,
+ "lyapunov": 2.6161820851933317,
+ "grad_norm": 0.1522047852768872,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005313952597646569,
+ "time_sec": 167.08899068832397
+ },
+ {
+ "epoch": 49,
+ "train_loss": 4.49808083328247,
+ "train_acc": 0.0977,
+ "test_loss": 2.3034967575073244,
+ "test_acc": 0.1,
+ "lyapunov": 2.6051423244769008,
+ "grad_norm": 0.09227111356756569,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005157053795390643,
+ "time_sec": 167.04247641563416
+ },
+ {
+ "epoch": 50,
+ "train_loss": 4.506656402282715,
+ "train_acc": 0.09788,
+ "test_loss": 2.3035506187438965,
+ "test_acc": 0.1,
+ "lyapunov": 2.6092079515042514,
+ "grad_norm": 0.0989012749171036,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0005000000000000002,
+ "time_sec": 167.06817507743835
+ },
+ {
+ "epoch": 51,
+ "train_loss": 4.518285944213867,
+ "train_acc": 0.09874,
+ "test_loss": 2.303562999343872,
+ "test_acc": 0.1,
+ "lyapunov": 2.6132117506793087,
+ "grad_norm": 0.14702247022618603,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00048429462046093607,
+ "time_sec": 167.00237131118774
+ },
+ {
+ "epoch": 52,
+ "train_loss": 4.510767389526367,
+ "train_acc": 0.0985,
+ "test_loss": 2.303548727416992,
+ "test_acc": 0.1,
+ "lyapunov": 2.611425805884554,
+ "grad_norm": 0.12770796891288963,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004686047402353435,
+ "time_sec": 167.03129529953003
+ },
+ {
+ "epoch": 53,
+ "train_loss": 4.524528532714844,
+ "train_acc": 0.09758,
+ "test_loss": 2.3034987804412843,
+ "test_acc": 0.1,
+ "lyapunov": 2.6168906950889648,
+ "grad_norm": 0.16221922023587404,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000452945843340743,
+ "time_sec": 167.0302333831787
+ },
+ {
+ "epoch": 54,
+ "train_loss": 4.514558558197021,
+ "train_acc": 0.09898,
+ "test_loss": 2.3035224128723146,
+ "test_acc": 0.1,
+ "lyapunov": 2.6116219816915214,
+ "grad_norm": 0.11874932612009399,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00043733338321784806,
+ "time_sec": 167.03262758255005
+ },
+ {
+ "epoch": 55,
+ "train_loss": 4.500117692108154,
+ "train_acc": 0.0969,
+ "test_loss": 2.303501333999634,
+ "test_acc": 0.1,
+ "lyapunov": 2.6062854854652033,
+ "grad_norm": 0.10674428233360923,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0004217827674798847,
+ "time_sec": 166.98121881484985
+ },
+ {
+ "epoch": 56,
+ "train_loss": 4.51960044921875,
+ "train_acc": 0.09628,
+ "test_loss": 2.30349303855896,
+ "test_acc": 0.1,
+ "lyapunov": 2.616247482616883,
+ "grad_norm": 0.14277503967283073,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00040630934270713783,
+ "time_sec": 167.03360319137573
+ },
+ {
+ "epoch": 57,
+ "train_loss": 4.538308909759522,
+ "train_acc": 0.0975,
+ "test_loss": 2.303505461502075,
+ "test_acc": 0.1,
+ "lyapunov": 2.624653117431094,
+ "grad_norm": 0.17354441507562746,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.000390928379301729,
+ "time_sec": 167.00332236289978
+ },
+ {
+ "epoch": 58,
+ "train_loss": 4.5402243867492675,
+ "train_acc": 0.09768,
+ "test_loss": 2.3034944499969483,
+ "test_acc": 0.1,
+ "lyapunov": 2.6235652969926213,
+ "grad_norm": 0.18590049129605235,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003756550564175727,
+ "time_sec": 166.94713830947876
+ },
+ {
+ "epoch": 59,
+ "train_loss": 4.497288510131836,
+ "train_acc": 0.09656,
+ "test_loss": 2.303503835296631,
+ "test_acc": 0.1,
+ "lyapunov": 2.60465430237753,
+ "grad_norm": 0.08925667815477244,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00036050444698038553,
+ "time_sec": 166.97111773490906
+ },
+ {
+ "epoch": 60,
+ "train_loss": 4.520837378082275,
+ "train_acc": 0.09746,
+ "test_loss": 2.3035025501251223,
+ "test_acc": 0.1,
+ "lyapunov": 2.6177086183787,
+ "grad_norm": 0.14390327015753798,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00034549150281252655,
+ "time_sec": 166.95851969718933
+ },
+ {
+ "epoch": 61,
+ "train_loss": 4.503204351348877,
+ "train_acc": 0.09616,
+ "test_loss": 2.3035063259124757,
+ "test_acc": 0.1,
+ "lyapunov": 2.6079881752238556,
+ "grad_norm": 0.11060100204296372,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003306310398773544,
+ "time_sec": 167.04684805870056
+ },
+ {
+ "epoch": 62,
+ "train_loss": 4.529549421844482,
+ "train_acc": 0.0966,
+ "test_loss": 2.303504373550415,
+ "test_acc": 0.1,
+ "lyapunov": 2.620155497889994,
+ "grad_norm": 0.25260476730678916,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00031593772365766127,
+ "time_sec": 166.9670557975769
+ },
+ {
+ "epoch": 63,
+ "train_loss": 4.504642747955322,
+ "train_acc": 0.09824,
+ "test_loss": 2.302585437011719,
+ "test_acc": 0.1,
+ "lyapunov": 2.6090027182303426,
+ "grad_norm": 0.14482467729355822,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0003014260546826097,
+ "time_sec": 167.07136464118958
+ },
+ {
+ "epoch": 64,
+ "train_loss": 4.5207818331909175,
+ "train_acc": 0.09658,
+ "test_loss": 2.302585619735718,
+ "test_acc": 0.1,
+ "lyapunov": 2.6153993130949758,
+ "grad_norm": 0.14340140289375716,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002871103542174637,
+ "time_sec": 167.0296709537506
+ },
+ {
+ "epoch": 65,
+ "train_loss": 4.514579942321777,
+ "train_acc": 0.09692,
+ "test_loss": 2.302585908126831,
+ "test_acc": 0.1,
+ "lyapunov": 2.612202508370285,
+ "grad_norm": 0.11615853114383813,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002730047501302267,
+ "time_sec": 167.06110525131226
+ },
+ {
+ "epoch": 66,
+ "train_loss": 4.539550397949219,
+ "train_acc": 0.09668,
+ "test_loss": 2.3025857189178467,
+ "test_acc": 0.1,
+ "lyapunov": 2.6239442215551194,
+ "grad_norm": 0.24377422344866448,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00025912316294914234,
+ "time_sec": 166.96833562850952
+ },
+ {
+ "epoch": 67,
+ "train_loss": 4.520765433959961,
+ "train_acc": 0.09678,
+ "test_loss": 2.3025856506347657,
+ "test_acc": 0.1,
+ "lyapunov": 2.6144380130426352,
+ "grad_norm": 0.17143215114502838,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0002454792921248144,
+ "time_sec": 167.06375288963318
+ },
+ {
+ "epoch": 68,
+ "train_loss": 4.501224665222168,
+ "train_acc": 0.09848,
+ "test_loss": 2.3025851860046385,
+ "test_acc": 0.1,
+ "lyapunov": 2.606965447935607,
+ "grad_norm": 0.22167025880962787,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00023208660251050164,
+ "time_sec": 166.97689723968506
+ },
+ {
+ "epoch": 69,
+ "train_loss": 4.516330520629883,
+ "train_acc": 0.09716,
+ "test_loss": 2.3025853271484373,
+ "test_acc": 0.1,
+ "lyapunov": 2.6127135893877815,
+ "grad_norm": 0.1178159153430125,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00021895831107393473,
+ "time_sec": 167.03971099853516
+ },
+ {
+ "epoch": 70,
+ "train_loss": 4.518335289764404,
+ "train_acc": 0.09628,
+ "test_loss": 2.3025851623535156,
+ "test_acc": 0.1,
+ "lyapunov": 2.614670734576252,
+ "grad_norm": 0.19910468609269888,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00020610737385376356,
+ "time_sec": 167.01087379455566
+ },
+ {
+ "epoch": 71,
+ "train_loss": 4.506198991699219,
+ "train_acc": 0.0961,
+ "test_loss": 2.3025853843688964,
+ "test_acc": 0.1,
+ "lyapunov": 2.6081283720557953,
+ "grad_norm": 0.09098734124729495,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00019354647317351177,
+ "time_sec": 167.0194799900055
+ },
+ {
+ "epoch": 72,
+ "train_loss": 4.49574895111084,
+ "train_acc": 0.09856,
+ "test_loss": 2.3025853591918946,
+ "test_acc": 0.1,
+ "lyapunov": 2.603733692632612,
+ "grad_norm": 0.08176729544229487,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001812880051256552,
+ "time_sec": 167.05306220054626
+ },
+ {
+ "epoch": 73,
+ "train_loss": 4.497463835449219,
+ "train_acc": 0.09886,
+ "test_loss": 2.3025851680755616,
+ "test_acc": 0.1,
+ "lyapunov": 2.604736436053615,
+ "grad_norm": 0.082986396115534,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00016934406733817422,
+ "time_sec": 166.98811650276184
+ },
+ {
+ "epoch": 74,
+ "train_loss": 4.4971358953857425,
+ "train_acc": 0.09738,
+ "test_loss": 2.302585493850708,
+ "test_acc": 0.1,
+ "lyapunov": 2.6045719363805278,
+ "grad_norm": 0.08151196821637299,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001577264470356557,
+ "time_sec": 167.01667833328247
+ },
+ {
+ "epoch": 75,
+ "train_loss": 4.50925322631836,
+ "train_acc": 0.0967,
+ "test_loss": 2.302585232925415,
+ "test_acc": 0.1,
+ "lyapunov": 2.6094926751178242,
+ "grad_norm": 0.21190207725464844,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00014644660940672634,
+ "time_sec": 166.97911548614502
+ },
+ {
+ "epoch": 76,
+ "train_loss": 4.496390933227539,
+ "train_acc": 0.0967,
+ "test_loss": 2.302585297393799,
+ "test_acc": 0.1,
+ "lyapunov": 2.6040706823549002,
+ "grad_norm": 0.08435313407684436,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0001355156862892944,
+ "time_sec": 167.0480306148529
+ },
+ {
+ "epoch": 77,
+ "train_loss": 4.496095029296875,
+ "train_acc": 0.0965,
+ "test_loss": 2.3025853218078614,
+ "test_acc": 0.1,
+ "lyapunov": 2.6039189987475306,
+ "grad_norm": 0.1373346720572696,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00012494446518477025,
+ "time_sec": 166.97820734977722
+ },
+ {
+ "epoch": 78,
+ "train_loss": 4.499068414611816,
+ "train_acc": 0.096,
+ "test_loss": 2.3025852237701416,
+ "test_acc": 0.1,
+ "lyapunov": 2.605743714305751,
+ "grad_norm": 0.10939849657650327,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00011474337861210548,
+ "time_sec": 166.98934531211853
+ },
+ {
+ "epoch": 79,
+ "train_loss": 4.4964453392028805,
+ "train_acc": 0.09828,
+ "test_loss": 2.302585151672363,
+ "test_acc": 0.1,
+ "lyapunov": 2.604178778655694,
+ "grad_norm": 0.08774538011729731,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.00010492249381215483,
+ "time_sec": 167.02672863006592
+ },
+ {
+ "epoch": 80,
+ "train_loss": 4.499743932647705,
+ "train_acc": 0.09862,
+ "test_loss": 2.302585228347778,
+ "test_acc": 0.1,
+ "lyapunov": 2.606093951808217,
+ "grad_norm": 0.2420142867175763,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.549150281252637e-05,
+ "time_sec": 167.10957646369934
+ },
+ {
+ "epoch": 81,
+ "train_loss": 4.502734872436523,
+ "train_acc": 0.09578,
+ "test_loss": 2.302585201263428,
+ "test_acc": 0.1,
+ "lyapunov": 2.6076697900776975,
+ "grad_norm": 0.13251791023485532,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.645971286271918e-05,
+ "time_sec": 166.9769287109375
+ },
+ {
+ "epoch": 82,
+ "train_loss": 4.494626608581543,
+ "train_acc": 0.09758,
+ "test_loss": 2.3025851295471194,
+ "test_acc": 0.1,
+ "lyapunov": 2.6029957383489974,
+ "grad_norm": 0.08170465976084904,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 7.78360372489926e-05,
+ "time_sec": 167.00449562072754
+ },
+ {
+ "epoch": 83,
+ "train_loss": 4.495700520019532,
+ "train_acc": 0.09822,
+ "test_loss": 2.3025853286743163,
+ "test_acc": 0.1,
+ "lyapunov": 2.6036597090913816,
+ "grad_norm": 0.1210411913955966,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.962898649802815e-05,
+ "time_sec": 166.96435856819153
+ },
+ {
+ "epoch": 84,
+ "train_loss": 4.49369448425293,
+ "train_acc": 0.09848,
+ "test_loss": 2.3025850296020507,
+ "test_acc": 0.1,
+ "lyapunov": 2.6024485061235745,
+ "grad_norm": 0.1169116031555102,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.184665997806824e-05,
+ "time_sec": 166.9589819908142
+ },
+ {
+ "epoch": 85,
+ "train_loss": 4.493269319915772,
+ "train_acc": 0.09772,
+ "test_loss": 2.3025851333618164,
+ "test_acc": 0.1,
+ "lyapunov": 2.60219204151417,
+ "grad_norm": 0.08026909865070977,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 5.449673790581613e-05,
+ "time_sec": 167.0204620361328
+ },
+ {
+ "epoch": 86,
+ "train_loss": 4.4974218487548825,
+ "train_acc": 0.09802,
+ "test_loss": 2.302585245895386,
+ "test_acc": 0.1,
+ "lyapunov": 2.604730949987231,
+ "grad_norm": 0.08689607041758553,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.758647376699034e-05,
+ "time_sec": 166.964524269104
+ },
+ {
+ "epoch": 87,
+ "train_loss": 4.495326493072509,
+ "train_acc": 0.0982,
+ "test_loss": 2.3025850296020507,
+ "test_acc": 0.1,
+ "lyapunov": 2.603457776481843,
+ "grad_norm": 0.09583928752803095,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 4.112268715800956e-05,
+ "time_sec": 167.03006196022034
+ },
+ {
+ "epoch": 88,
+ "train_loss": 4.494311538085937,
+ "train_acc": 0.09762,
+ "test_loss": 2.3025852684020998,
+ "test_acc": 0.1,
+ "lyapunov": 2.602831931980065,
+ "grad_norm": 0.08201988600112256,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.511175705587434e-05,
+ "time_sec": 166.98635745048523
+ },
+ {
+ "epoch": 89,
+ "train_loss": 4.497406745605469,
+ "train_acc": 0.09872,
+ "test_loss": 2.302585092926025,
+ "test_acc": 0.1,
+ "lyapunov": 2.6046652647540394,
+ "grad_norm": 0.11011286998675665,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.9559615522887284e-05,
+ "time_sec": 167.0066351890564
+ },
+ {
+ "epoch": 90,
+ "train_loss": 4.495393841552734,
+ "train_acc": 0.0955,
+ "test_loss": 2.3025851219177245,
+ "test_acc": 0.1,
+ "lyapunov": 2.603500037546963,
+ "grad_norm": 0.08854801622590937,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.447174185242324e-05,
+ "time_sec": 166.98117446899414
+ },
+ {
+ "epoch": 91,
+ "train_loss": 4.496799105529785,
+ "train_acc": 0.09778,
+ "test_loss": 2.3025851669311526,
+ "test_acc": 0.1,
+ "lyapunov": 2.6043886601772455,
+ "grad_norm": 0.08317548392372451,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.9853157161528526e-05,
+ "time_sec": 167.05606770515442
+ },
+ {
+ "epoch": 92,
+ "train_loss": 4.501456503753662,
+ "train_acc": 0.09732,
+ "test_loss": 2.302585040283203,
+ "test_acc": 0.1,
+ "lyapunov": 2.6069688260402826,
+ "grad_norm": 0.09601255447418665,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.570841943568452e-05,
+ "time_sec": 166.95690035820007
+ },
+ {
+ "epoch": 93,
+ "train_loss": 4.4988940646362305,
+ "train_acc": 0.09822,
+ "test_loss": 2.302585070037842,
+ "test_acc": 0.1,
+ "lyapunov": 2.6056473828337685,
+ "grad_norm": 0.11345521860163729,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 1.204161903062634e-05,
+ "time_sec": 167.01007437705994
+ },
+ {
+ "epoch": 94,
+ "train_loss": 4.500971371002198,
+ "train_acc": 0.09656,
+ "test_loss": 2.3025852294921876,
+ "test_acc": 0.1,
+ "lyapunov": 2.606662953296281,
+ "grad_norm": 0.10989679012817173,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 8.85637463565564e-06,
+ "time_sec": 166.93790555000305
+ },
+ {
+ "epoch": 95,
+ "train_loss": 4.496245345458984,
+ "train_acc": 0.09824,
+ "test_loss": 2.3025850425720216,
+ "test_acc": 0.1,
+ "lyapunov": 2.6040014677950185,
+ "grad_norm": 0.13386825999790872,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 6.155829702431171e-06,
+ "time_sec": 166.99875664710999
+ },
+ {
+ "epoch": 96,
+ "train_loss": 4.4964897052001955,
+ "train_acc": 0.09874,
+ "test_loss": 2.302585097122192,
+ "test_acc": 0.1,
+ "lyapunov": 2.6042159268313356,
+ "grad_norm": 0.09409731933962433,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 3.942649342761118e-06,
+ "time_sec": 166.96930813789368
+ },
+ {
+ "epoch": 97,
+ "train_loss": 4.499828433837891,
+ "train_acc": 0.1,
+ "test_loss": 2.3025849605560302,
+ "test_acc": 0.1,
+ "lyapunov": 2.6062122037648545,
+ "grad_norm": 0.16887612557601597,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.2190176984600023e-06,
+ "time_sec": 166.9714593887329
+ },
+ {
+ "epoch": 98,
+ "train_loss": 4.496156484069824,
+ "train_acc": 0.1,
+ "test_loss": 2.302585231781006,
+ "test_acc": 0.1,
+ "lyapunov": 2.603946977259253,
+ "grad_norm": 0.08139214809285189,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 9.866357858642206e-07,
+ "time_sec": 167.0184144973755
+ },
+ {
+ "epoch": 99,
+ "train_loss": 4.497607230377198,
+ "train_acc": 0.1,
+ "test_loss": 2.302585125350952,
+ "test_acc": 0.1,
+ "lyapunov": 2.6048427774473226,
+ "grad_norm": 0.08064979301518677,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 2.467198171342e-07,
+ "time_sec": 166.95221614837646
+ },
+ {
+ "epoch": 100,
+ "train_loss": 4.493742803955078,
+ "train_acc": 0.1,
+ "test_loss": 2.302585009765625,
+ "test_acc": 0.1,
+ "lyapunov": 2.602488872035385,
+ "grad_norm": 0.08215126330977654,
+ "grad_max_sv": 0.0,
+ "grad_min_sv": 0.0,
+ "grad_condition": 0.0,
+ "lr": 0.0,
+ "time_sec": 166.99254083633423
+ }
+ ]
+ }
+} \ No newline at end of file